# Test Recurrent Policy with Extreme Parameter Variation 

In [1]:
import numpy as np
import os,sys



sys.path.append('../../../RL_lib/Agents')
sys.path.append('../../../RL_lib/Policies/PPO')
sys.path.append('../../../RL_lib/Policies/Common')
sys.path.append('../../../RL_lib/Utils')
sys.path.append('../../../Env')
sys.path.append('../../../Imaging')


%load_ext autoreload
%load_ext autoreload
%autoreload 2
%matplotlib nbagg
import os
print(os.getcwd())

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
/Users/briangaudet/Study/Subjects/MachineLearning/Projects/Asteroid_CPO_seeker-master/Experiments/Extended/Optimize_HF


In [2]:
%%html
<style>
/* Let output areas size to their content, up to max-height. */
.output_wrapper, .output {
    height:auto !important;
    max-height:1000px;  /* your desired max-height here */
}
/* Remove the shadow from scrolling output areas. The vendor-prefixed
   property needs its leading dash ("-webkit-"); without it the declaration
   is an unknown property and is ignored. Prefixed form goes first so the
   standard property wins where both are supported. */
.output_scroll {
    -webkit-box-shadow:none !important;
    box-shadow:none !important;
}
</style>

# Optimize Policy

In [3]:
from env import Env
import env_utils as envu
from dynamics_model import Dynamics_model
from lander_model import Lander_model
from ic_gen import Landing_icgen
import rl_utils
import attitude_utils as attu
import optics_utils as optu
from arch_policy_vf import Arch

from policy_ppo import Policy
from softmax_pd import Softmax_pd as PD
from value_function import Value_function

import policy_nets as policy_nets
import valfunc_nets as valfunc_nets


from agent import Agent


import torch.nn as nn

from flat_constraint import Flat_constraint
from glideslope_constraint import Glideslope_constraint
from rh_constraint import RH_constraint
from no_attitude_constraint import Attitude_constraint
from w_constraint import W_constraint
from reward_attitude import Reward
from asteroid_hfr import Asteroid

from thruster_model_cubesat import Thruster_model

from sensor import Sensor
from seeker import Seeker

# --- Asteroid, seeker/sensor, dynamics, and lander model construction ---
# NOTE(review): the constructors below print status lines when called, so the
# statement order determines the order of the cell's output.

# Shared by the Sensor, Lander_model and Env constructors in this cell.
landing_site_range = 0.0
# None is passed as landing_site_override; the commented value is a fixed-site
# alternative left by the author.
landing_site = None #np.asarray([-250.,0.,0.])

# omega_range is presumably the (min, max) asteroid rotation rate sampled per
# episode -- TODO confirm against asteroid_hfr.Asteroid.
asteroid_model = Asteroid(landing_site_override=landing_site, omega_range=(1e-5,5e-4))

# Attitude parameterization object shared by the seeker, sensor, lander model,
# constraints and initial-condition generator.
ap = attu.Quaternion_attitude()

# Per the recorded output this evaluates to approximately diag(1, -1, -1).
C_cb = optu.rotate_optical_axis(0.0, 0.0, np.pi)
# Zero offset vector handed to the seeker as r_cb.
r_cb = np.asarray([0,0,0])
# 90 passed through envu.deg2rad (presumably a 90 degree field of view in
# radians -- verify in env_utils).
fov=envu.deg2rad(90)
# radome_slope_bounds / range_bias look like bounds for per-episode seeker
# error parameters -- TODO confirm in seeker.Seeker.
seeker = Seeker(attitude_parameterization=ap, C_cb=C_cb, r_cb=r_cb,
                radome_slope_bounds=(-0.05,0.05), range_bias=(-0.05,0.05),
                   fov=fov, debug=False)
# Sensor wraps the seeker; state_type selects the Sensor method used to build
# the observation, and pool_type='max' matches "using max  pooling" in the log.
sensor = Sensor(seeker, attitude_parameterization=ap,  use_range=True, apf_tau1=300, use_dp=False,
                      landing_site_range=landing_site_range,
                      pool_type='max', state_type=Sensor.optflow_state_range_dp1)
# Debug prints around the override below. In the recorded run both prints show
# Sensor.track_func1, i.e. the assignment did not change the bound method.
print(sensor.track_func)
sensor.track_func = sensor.track_func1
print(sensor.track_func)
logger = rl_utils.Logger()
# h is presumably the integration step size -- TODO confirm in dynamics_model.
dynamics_model = Dynamics_model(h=2)
thruster_model = Thruster_model(pulsed=True, scale=1.0, offset=0.4)
# com_range, attitude_bias and omega_bias appear to set the parameter
# variation applied to the lander -- verify in lander_model.Lander_model.
lander_model = Lander_model(asteroid_model, thruster_model, attitude_parameterization=ap, sensor=sensor, 
                             landing_site_range=landing_site_range, com_range=(-0.10,0.10),
                              attitude_bias=0.05, omega_bias=0.05)

# Select which of the lander model's observation builders feeds the agent by
# rebinding get_state_agent on this instance.
lander_model.get_state_agent = lander_model.get_state_agent_sensor_att_w2

# --- Problem dimensions, reward, constraints, initial conditions, and Env ---

# Observation size fed to the policy and value networks (matches the
# in_features=13 input layers in the recorded output).
obs_dim = 13
# Discrete action head: action_dim dimensions with actions_per_dim choices
# each, giving action_dim * actions_per_dim = 24 logits (matches the policy's
# out_features=24 layer in the recorded output).
action_dim = 12
actions_per_dim = 2
logit_dim = action_dim * actions_per_dim

# Passed as recurrent_steps to both GRU networks and to the Agent.
recurrent_steps = 60

# Reward shaping coefficients; the exact meaning of each term is defined in
# reward_attitude.Reward (not visible here).
reward_object = Reward(landing_rlimit=2, landing_vlimit=0.1, 
                       tracking_bias=0.01, fov_coeff=-50., 
                       att_coeff=-0.20,
                       tracking_coeff=-0.5, magv_coeff=-1.0,
                       fuel_coeff=-0.10,  landing_coeff=10.0)

glideslope_constraint = Glideslope_constraint(gs_limit=-1.0)
# NOTE(review): shape_constraint is constructed but not passed to Env below,
# and is not referenced again in the visible code -- confirm whether Env was
# meant to receive it.
shape_constraint = Flat_constraint()
attitude_constraint = Attitude_constraint(ap)
w_constraint = W_constraint(w_limit=(0.1,0.1,0.1), w_margin=(0.05,0.05,0.05))
rh_constraint = RH_constraint(rh_limit=150)

# Symmetric per-axis bound used for lander_wll / lander_wul below.
wi=0.05
# Initial-condition generator. The first positional argument and the
# *_error tuples are presumably (min, max) sampling ranges -- TODO confirm in
# ic_gen.Landing_icgen.
ic_gen = Landing_icgen((800,1000), 
                           p_engine_fail=0.5,
                           engine_fail_scale=(0.5,1.0),
                           lander_wll=(-wi,-wi,-wi),
                           lander_wul=(wi,wi,wi),
                           attitude_parameterization=ap,
                           position_error=(0,np.pi/4),
                           heading_error=(0,np.pi/8),
                           attitude_error=(0,np.pi/16),
                           min_mass=450, max_mass=500,
                           mag_v=(0.05,0.1),
                           debug=False,
                           inertia_uncertainty_diag=10.0,
                           inertia_uncertainty_offdiag=1.0)

# Environment tying together the IC generator, lander model, dynamics, logger,
# reward and constraints. The recorded output prints full statistics at
# "Update Cnt" 240 and 250, consistent with print_every=10.
env = Env(ic_gen, lander_model, dynamics_model, logger,
          landing_site_range=landing_site_range,
          debug_done=False,
          reward_object=reward_object,
          glideslope_constraint=glideslope_constraint,
          attitude_constraint=attitude_constraint,
          w_constraint=w_constraint,
          rh_constraint=rh_constraint,
          tf_limit=5000.0,print_every=10,nav_period=6)




# Display the initial-condition generator's settings before training starts.
env.ic_gen.show()

# --- Policy, value function, agent, and training run ---
# NOTE(review): no random seed is set anywhere in the visible cells, so the
# recorded training log is presumably not exactly reproducible.

arch = Arch()

# Recurrent (GRU) policy producing logit_dim logits, paired with a softmax
# probability distribution over action_dim x actions_per_dim discrete actions.
# The recorded output reports "recurrent steps > 1, disabling shuffle", so
# shuffle=False matches what the Policy enforces anyway.
policy = Policy(policy_nets.GRU1(obs_dim, logit_dim, recurrent_steps=recurrent_steps), 
                PD(action_dim, actions_per_dim),
                shuffle=False,
                kl_targ=0.001,epochs=20, beta=0.1, servo_kl=True, max_grad_norm=30, scale_vector_obs=True,
                init_func=rl_utils.xn_init)
# Recurrent value function over the same observations. batch_size=9999999 is
# presumably a "use the whole rollout as one batch" sentinel -- TODO confirm.
value_function = Value_function(valfunc_nets.GRU1(obs_dim, recurrent_steps=recurrent_steps), scale_obs=True,
                                shuffle=False, batch_size=9999999, max_grad_norm=30, 
                                verbose=False)

# policy_episodes / policy_steps look like per-update rollout sizes and
# gamma1 / gamma2 like two discount factors; their exact semantics live in
# agent.Agent (not visible here).
agent = Agent(arch, policy, value_function, None, env, logger,
              policy_episodes=30, policy_steps=3000, gamma1=0.95, gamma2=0.995, 
              recurrent_steps=recurrent_steps, monitor=env.rl_stats)
# Long-running: starts the training loop. The argument is presumably the
# episode budget -- verify against Agent.train.
agent.train(120000)

Quaternion_attitude
Euler321 Attitude
C_cb: 
[[ 1.0000000e+00  0.0000000e+00 -0.0000000e+00]
 [ 0.0000000e+00 -1.0000000e+00  1.2246468e-16]
 [ 0.0000000e+00 -1.2246468e-16 -1.0000000e+00]]
[ 0.0000000e+00 -1.2246468e-16 -1.0000000e+00]
using max  pooling
V4: Output State type:  <function Sensor.optflow_state_range_dp1 at 0x134adf378>
<bound method Sensor.track_func1 of <sensor.Sensor object at 0x124a81748>>
<bound method Sensor.track_func1 of <sensor.Sensor object at 0x124a81748>>
6dof dynamics model 
thruster model: 
Inertia Tensor:  [[333.33333333   0.           0.        ]
 [  0.         333.33333333   0.        ]
 [  0.           0.         333.33333333]]
Lander Model: 
Reward_terminal equator
queue fixed
Flat Constraint
Attitude Constraint
Rotational Velocity Constraint
Position Hysterises Constraint


<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

lander env RHL
Landing_icgen:
[[-1.]
 [ 1.]]
Policy with vectorized sample
	xn_init: layer  Linear(in_features=13, out_features=130, bias=True)
	xn_init: layer  GRUCell(130, 176)
	xn_init: layer  Linear(in_features=176, out_features=240, bias=True)
	xn_init: layer  Linear(in_features=240, out_features=24, bias=True)
Policy: recurrent steps > 1, disabling shuffle
	Test Mode:          False
	Clip Param:         0.1
	Shuffle :           False
	Shuffle by Chunks:  False
	Max Grad Norm:      30
	Recurrent Steps:    60
	Rollout Limit:      1
	Advantage Func:     <advantage_utils.Adv_default object at 0x134b83dd8>
	Advantage Norm:     <function Adv_normalizer.apply at 0x133e6e378>
	PD:                 <softmax_pd.Softmax_pd object at 0x134b75588>
	Loss Function:      <bound method Policy.calc_loss1 of <policy_ppo.Policy object at 0x134b83c18>>
Value Funtion
	xn_init: layer  Linear(in_features=13, out_features=130, bias=True)
	xn_init: layer  GRUCell(130, 25)
	xn_init: layer  Linear(in_feature

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0988   0.0293   0.1419   0.1549   0.1094   0.0369
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2234   0.0869   0.3310   6.4661   2.1407   2.4885
***** Episode 226, Mean R = -256.7  Std R = 137.1  Min R = -661.4
PolicyLoss: -0.0173
Policy_Beta: 0.0667
Policy_Entropy: 0.000337
Policy_KL: 0.00181
Policy_SD: 0.954
Policy_lr_mult: 1
Steps: 4.31e+03
TotalSteps: 2.31e+04
VF_0_ExplainedVarNew: -0.035
VF_0_ExplainedVarOld: -0.0672
VF_0_Loss : 0.716


ADV1:  -0.0651024621978907 0.8444949418624327 0.9246363343589954 -3.56367723418722
ADV2:  0.021405792508485018 0.8840502485318387 1.0768849442045172 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1029   0.0288   0.1454   0.1549   0.1094   0.0369
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1247   0.0443   0.1887   6.4661   2.1407   2.4885
***** Episode 257, Mean R = -236.5  Std R = 76.6  Min R = -468.2
PolicyLoss: -0.0161
Policy_Beta: 0.0444
Policy_Entropy: 0.000339
Pol

*** RH VIO  CNT:  100
ADV1:  0.021295362516059766 0.47980683236593324 0.630780997073928 -3.8342138063640423
ADV2:  0.03980830558660767 0.7196848433901515 1.2070115512963613 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0693   0.0135   0.0923   0.1891   0.1175   0.0433
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0740   0.0366   0.1484   6.4661   2.1407   2.4885
***** Episode 505, Mean R = -435.8  Std R = 199.4  Min R = -776.3
PolicyLoss: -0.0512
Policy_Beta: 0.0444
Policy_Entropy: 0.000355
Policy_KL: 0.00059
Policy_SD: 0.954
Policy_lr_mult: 1
Steps: 9.54e+03
TotalSteps: 8.56e+04
VF_0_ExplainedVarNew: 0.197
VF_0_ExplainedVarOld: 0.0901
VF_0_Loss : 0.219


ADV1:  0.04599266573281997 0.3919979259412024 0.6414798548375189 -4.053520970811192
ADV2:  0.03379843346604599 0.6805116116148054 1.435656688090787 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0865   0.0168   0.1074   0.1891   0.1175   0.0433
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0687   0

***** Episode 753, Mean R = -456.8  Std R = 173.9  Min R = -1138.2
PolicyLoss: -0.0317
Policy_Beta: 0.0667
Policy_Entropy: 0.000373
Policy_KL: 0.00087
Policy_SD: 0.955
Policy_lr_mult: 1
Steps: 1.09e+04
TotalSteps: 1.7e+05
VF_0_ExplainedVarNew: 0.555
VF_0_ExplainedVarOld: 0.528
VF_0_Loss : 0.0682


ADV1:  0.017930275427944047 0.23141447766397688 1.6146483313275264 -3.724148708022498
ADV2:  0.020337854307910904 0.7200900182233716 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0920   0.0261   0.1357   0.1891   0.1175   0.0433
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0276   0.0101   0.0536   6.4661   2.1407   2.4885
***** Episode 784, Mean R = -450.8  Std R = 166.5  Min R = -945.5
PolicyLoss: -0.0312
Policy_Beta: 0.0667
Policy_Entropy: 0.000371
Policy_KL: 0.00107
Policy_SD: 0.955
Policy_lr_mult: 1
Steps: 1.05e+04
TotalSteps: 1.81e+05
VF_0_ExplainedVarNew: 0.614
VF_0_ExplainedVarOld: 0.587
VF_0_Loss : 0.0617


ADV1:  0.008986241938503869 0.16333232063334704 1.6722

ADV1:  0.024613483554414485 0.18762134821623747 2.1631508445739747 -1.1937530418384972
ADV2:  -0.011236088934352444 0.8257841328879736 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0926   0.0226   0.1382   0.1891   0.1175   0.0433
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0409   0.0182   0.0942   6.4661   2.1407   2.4885
***** Episode 1032, Mean R = -434.3  Std R = 131.5  Min R = -706.4
PolicyLoss: -0.00193
Policy_Beta: 0.0667
Policy_Entropy: 0.000384
Policy_KL: 0.000936
Policy_SD: 0.955
Policy_lr_mult: 1
Steps: 1.07e+04
TotalSteps: 2.71e+05
VF_0_ExplainedVarNew: 0.706
VF_0_ExplainedVarOld: 0.656
VF_0_Loss : 0.0342


ADV1:  -0.001892114854385927 0.16733265837277259 1.0419596738309624 -1.3726505359013896
ADV2:  0.028262621345500522 0.8298675248026322 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0808   0.0110   0.1033   0.1891   0.1175   0.0433
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0192   0.0057   0.0268   6.4661   2.1407   2.488

*** RH VIO  CNT:  600
ADV1:  -0.0141770871402647 0.17936118921019653 1.7916882734544457 -1.3585442034403505
ADV2:  0.02119694196533315 0.7995262045768042 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1102   0.0263   0.1575   0.2055   0.1304   0.0433
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0337   0.0153   0.0668   6.4661   2.1407   2.4885
***** Episode 1311, Mean R = -472.8  Std R = 192.8  Min R = -1060.1
PolicyLoss: -0.0199
Policy_Beta: 0.0667
Policy_Entropy: 0.000406
Policy_KL: 0.00108
Policy_SD: 0.955
Policy_lr_mult: 1
Steps: 1.15e+04
TotalSteps: 3.77e+05
VF_0_ExplainedVarNew: 0.742
VF_0_ExplainedVarOld: 0.691
VF_0_Loss : 0.0399


ADV1:  0.012180657819092344 0.19726753456741142 2.0510713334572586 -1.3829529775156266
ADV2:  0.007084967991595376 0.8503020913102657 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1087   0.0292   0.1739   0.2055   0.1304   0.0433
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0385   0.0169   0.0789   6.4661

cs_angles | -0.0216  0.0215 |  0.3370  0.3293 | -0.9999 -0.9999 |  0.9999  1.0000
optical_flow | -0.0000  0.0001 |  0.0019  0.0019 | -0.0202 -0.0580 |  0.0131  0.0194
v_err    | -0.4690 |  0.1660 | -1.0799 |  0.5062
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  912.67 |  248.58 |   38.61 | 1303.68
tracking_rewards | -424.11 |  177.20 |-1023.58 |  -97.11
steps    |     388 |     157 |     126 |     834
***** Episode 1590, Mean R = -517.6  Std R = 194.7  Min R = -982.2
PolicyLoss: -0.0323
Policy_Beta: 0.0667
Policy_Entropy: 0.00042
Policy_KL: 0.00107
Policy_SD: 0.956
Policy_lr_mult: 1
Steps: 1.26e+04
TotalSteps: 4.86e+05
VF_0_ExplainedVarNew: 0.671
VF_0_ExplainedVarOld: 0.65
VF_0_Loss : 0.0586


*** RH VIO  CNT:  800
ADV1:  -0.003606256973056323 0.17640975716261587 1.2800624640782674 -2.918919506073002
ADV2:  0.02847253310829393 0.7673382120449785 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1456   0.0411   0.2208   0.2208   0.1456   0.0433
Va

w        |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.09   -0.08   -0.08 |    0.09    0.08    0.10
a_f      |   -0.09    0.14 |    0.69    1.85 |   -1.50   -3.09 |    1.50    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.09   -0.05   -0.07 |    0.06    0.07    0.07
w_rewards |   -1.42 |    1.31 |   -6.17 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -30.16 |   24.46 |  -50.00 |    0.00
theta_cv |    1.48 |    0.68 |    0.01 |    3.14
seeker_angles |    0.02    0.06 |    0.35    0.34 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0156  0.0607 |  0.3524  0.3363 | -0.9999 -0.9999 |  0.9999  0.9999
optical_flow |  0.0002  0.0003 |  0.0025  0.0024 | -0.0274 -0.0320 |  0.0553  0.0324
v_err    | -0.3925 |  0.1900 | -1.2515 |  0.8587
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  759.64 |  299.57 |   76.75 | 1298.88
tracking_rewards | -371.54 |  132.19 | -989.98 | -148.82
steps    |     373 |  

w        |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.09   -0.09   -0.08 |    0.09    0.09    0.08
a_f      |   -0.01   -0.09 |    0.69    1.80 |   -1.52   -3.14 |    1.52    3.09
w_f      |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.05   -0.06   -0.06 |    0.06    0.05    0.06
w_rewards |   -0.53 |    0.60 |   -3.65 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -42.10 |   18.24 |  -50.00 |    0.00
theta_cv |    1.26 |    0.64 |    0.00 |    3.13
seeker_angles |   -0.02    0.02 |    0.36    0.32 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0217  0.0186 |  0.3603  0.3244 | -1.0000 -0.9999 |  0.9999  0.9997
optical_flow | -0.0003  0.0000 |  0.0042  0.0034 | -0.0544 -0.0703 |  0.0540  0.0423
v_err    | -0.2262 |  0.2496 | -1.0946 |  1.0725
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  539.51 |  275.33 |   53.41 | 1219.01
tracking_rewards | -230.00 |   85.09 | -696.40 | -103.01
steps    |     292 |  

w        |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.07   -0.07   -0.07 |    0.08    0.07    0.08
a_f      |    0.02   -0.16 |    0.66    1.77 |   -1.50   -3.13 |    1.44    3.12
w_f      |    0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.05   -0.05   -0.05 |    0.05    0.04    0.04
w_rewards |   -0.14 |    0.20 |   -1.24 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -44.68 |   15.42 |  -50.00 |    0.00
theta_cv |    0.97 |    0.53 |    0.00 |    3.11
seeker_angles |    0.02   -0.03 |    0.36    0.32 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0161 -0.0259 |  0.3613  0.3211 | -0.9999 -1.0000 |  1.0000  0.9998
optical_flow |  0.0001 -0.0001 |  0.0049  0.0043 | -0.1681 -0.1347 |  0.1300  0.0770
v_err    | -0.1182 |  0.2496 | -1.4189 |  0.9786
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  463.55 |  224.05 |   18.93 | 1227.41
tracking_rewards | -158.05 |   49.73 | -486.51 |  -86.75
steps    |     246 |  

theta_cv |    0.76 |    0.41 |    0.00 |    2.97
seeker_angles |   -0.01    0.01 |    0.36    0.31 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0060  0.0083 |  0.3577  0.3063 | -0.9999 -0.9999 |  0.9999  1.0000
optical_flow | -0.0001  0.0006 |  0.0054  0.0046 | -0.0464 -0.0527 |  0.0641  0.0895
v_err    | -0.0470 |  0.2194 | -1.0668 |  1.0056
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  388.57 |  176.83 |   54.38 |  979.84
tracking_rewards | -123.66 |   27.93 | -296.83 |  -74.02
steps    |     233 |      36 |     163 |     387
***** Episode 2830, Mean R = -176.1  Std R = 23.6  Min R = -234.1
PolicyLoss: -0.0253
Policy_Beta: 0.0667
Policy_Entropy: 0.000872
Policy_KL: 0.00108
Policy_SD: 0.959
Policy_lr_mult: 1
Steps: 7.18e+03
TotalSteps: 8.4e+05
VF_0_ExplainedVarNew: 0.959
VF_0_ExplainedVarOld: 0.939
VF_0_Loss : 0.147


ADV1:  -0.005490388830508771 0.08766159585413255 0.37548159648094637 -0.5708124065399192
ADV2:  0.018697134895990345 0.8824285996411804

attitude |   -0.01    0.00    0.03 |    1.35    0.67    1.90 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.06   -0.06   -0.06 |    0.07    0.06    0.06
a_f      |    0.01    0.01 |    0.67    1.90 |   -1.47   -3.13 |    1.40    3.14
w_f      |    0.00   -0.00    0.00 |    0.02    0.02    0.02 |   -0.04   -0.04   -0.04 |    0.05    0.04    0.04
w_rewards |   -0.04 |    0.07 |   -0.33 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -47.58 |   10.73 |  -50.00 |    0.00
theta_cv |    0.66 |    0.36 |    0.00 |    2.78
seeker_angles |   -0.02   -0.02 |    0.36    0.31 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0167 -0.0168 |  0.3648  0.3106 | -0.9999 -1.0000 |  0.9999  0.9999
optical_flow | -0.0002  0.0003 |  0.0054  0.0047 | -0.0457 -0.1424 |  0.1187  0.0797
v_err    | -0.0423 |  0.1727 | -1.0388 |  0.6999
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  353

attitude |   -0.08   -0.02    0.07 |    1.18    0.66    1.82 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.06   -0.06 |    0.06    0.07    0.06
a_f      |   -0.01    0.08 |    0.67    1.79 |   -1.56   -3.14 |    1.49    3.07
w_f      |   -0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.04   -0.04 |    0.06    0.04    0.05
w_rewards |   -0.02 |    0.06 |   -0.57 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -47.58 |   10.73 |  -50.00 |    0.00
theta_cv |    0.62 |    0.33 |    0.00 |    2.40
seeker_angles |   -0.02    0.03 |    0.36    0.32 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0156  0.0315 |  0.3607  0.3194 | -0.9999 -0.9991 |  1.0000  0.9996
optical_flow | -0.0003  0.0011 |  0.0052  0.0050 | -0.1481 -0.1720 |  0.0557  0.0851
v_err    | -0.0558 |  0.1314 | -1.3068 |  0.6294
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  343

theta_cv |    0.56 |    0.29 |    0.00 |    2.09
seeker_angles |   -0.04   -0.00 |    0.36    0.33 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0351 -0.0015 |  0.3592  0.3268 | -0.9998 -1.0000 |  1.0000  0.9999
optical_flow | -0.0004  0.0007 |  0.0058  0.0051 | -0.1144 -0.1863 |  0.2111  0.0855
v_err    | -0.0473 |  0.1127 | -0.5740 |  0.6342
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  300.16 |  141.60 |    8.95 |  789.50
tracking_rewards |  -93.75 |   20.18 | -160.96 |  -55.47
steps    |     257 |      45 |     150 |     380
***** Episode 3760, Mean R = -154.9  Std R = 19.5  Min R = -190.6
PolicyLoss: 0.016
Policy_Beta: 0.0667
Policy_Entropy: 0.0015
Policy_KL: 0.00106
Policy_SD: 0.959
Policy_lr_mult: 1
Steps: 8.3e+03
TotalSteps: 1.07e+06
VF_0_ExplainedVarNew: 0.875
VF_0_ExplainedVarOld: 0.867
VF_0_Loss : 0.136


ADV1:  -0.009550781038545824 0.13920516833961055 1.740693179766337 -1.379275115331016
ADV2:  0.022612718027546674 0.7920987757517546 3.0 -3

a_f      |   -0.03   -0.08 |    0.64    1.78 |   -1.33   -3.14 |    1.42    3.10
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.04 |    0.03    0.04    0.04
w_rewards |   -0.00 |    0.02 |   -0.19 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -49.35 |    5.64 |  -50.00 |    0.00
theta_cv |    0.55 |    0.29 |    0.00 |    2.32
seeker_angles |    0.00    0.02 |    0.34    0.33 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0007  0.0198 |  0.3402  0.3343 | -0.9999 -0.9999 |  0.9999  0.9999
optical_flow | -0.0002  0.0007 |  0.0067  0.0064 | -0.1836 -0.1427 |  0.1258  0.2180
v_err    | -0.0392 |  0.1049 | -0.4669 |  0.5633
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  262.81 |  136.16 |   12.72 |  697.27
tracking_rewards |  -88.04 |   18.45 | -149.08 |  -54.76
steps    |     260 |      44 |     142 |     391
***** Episode 4070, Mean R = -147.7  Std R = 20.1  Min R = -196.3
PolicyLoss: -0.0113


attitude |    0.01   -0.02   -0.14 |    1.22    0.66    1.87 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.06   -0.06 |    0.06    0.06    0.06
a_f      |   -0.01    0.02 |    0.65    1.87 |   -1.41   -3.13 |    1.48    3.13
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.04   -0.03 |    0.04    0.03    0.03
w_rewards |   -0.00 |    0.02 |   -0.16 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -48.87 |    7.43 |  -50.00 |    0.00
theta_cv |    0.56 |    0.29 |    0.00 |    2.28
seeker_angles |    0.01   -0.00 |    0.33    0.33 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0107 -0.0023 |  0.3268  0.3319 | -0.9999 -0.9994 |  0.9998  1.0000
optical_flow |  0.0001  0.0003 |  0.0067  0.0070 | -0.1170 -0.1114 |  0.1123  0.1662
v_err    | -0.0313 |  0.0991 | -0.4712 |  0.5567
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  233

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.06    0.06
a_f      |   -0.02    0.10 |    0.66    1.95 |   -1.36   -3.13 |    1.47    3.13
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.04    0.03    0.04
w_rewards |   -0.00 |    0.02 |   -0.24 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -49.35 |    5.64 |  -50.00 |    0.00
theta_cv |    0.56 |    0.30 |    0.00 |    2.19
seeker_angles |    0.03    0.00 |    0.33    0.33 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0348  0.0021 |  0.3256  0.3290 | -0.9996 -0.9996 |  1.0000  1.0000
optical_flow |  0.0004  0.0004 |  0.0078  0.0080 | -0.1253 -0.1201 |  0.1343  0.1157
v_err    | -0.0286 |  0.0980 | -0.4786 |  0.5922
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  209.28 |  131.46 |   15.98 |  588.11
tracking_rewards |  -84.52 |   18.96 | -155.68 |  -49.77
steps    |     276 |  

w        |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.06 |    0.05    0.05    0.05
a_f      |    0.03    0.12 |    0.65    1.83 |   -1.32   -3.14 |    1.50    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.04   -0.04 |    0.03    0.04    0.03
w_rewards |   -0.00 |    0.01 |   -0.14 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -47.26 |   11.38 |  -50.00 |    0.00
theta_cv |    0.57 |    0.30 |    0.00 |    2.42
seeker_angles |    0.02    0.01 |    0.33    0.32 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0237  0.0071 |  0.3297  0.3236 | -0.9999 -0.9999 |  0.9999  0.9996
optical_flow |  0.0004 -0.0001 |  0.0091  0.0089 | -0.1477 -0.1582 |  0.2308  0.1977
v_err    | -0.0231 |  0.0967 | -0.5111 |  0.6321
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  193.30 |  122.53 |    2.25 |  561.59
tracking_rewards |  -83.31 |   17.88 | -138.83 |  -48.42
steps    |     280 |  

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.06   -0.05 |    0.05    0.05    0.06
a_f      |    0.02    0.10 |    0.69    1.76 |   -1.45   -3.14 |    1.48    3.13
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.04   -0.04 |    0.03    0.04    0.04
w_rewards |   -0.00 |    0.01 |   -0.21 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -46.77 |   12.28 |  -50.00 |    0.00
theta_cv |    0.57 |    0.32 |    0.00 |    2.35
seeker_angles |    0.03    0.02 |    0.31    0.33 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0294  0.0180 |  0.3104  0.3287 | -0.9998 -0.9999 |  0.9999  0.9996
optical_flow |  0.0000  0.0001 |  0.0093  0.0092 | -0.2381 -0.1772 |  0.1655  0.1101
v_err    | -0.0207 |  0.0934 | -0.4622 |  0.6265
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  183.74 |  128.67 |    7.13 |  547.35
tracking_rewards |  -82.52 |   18.19 | -154.44 |  -40.91
steps    |     287 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.06
a_f      |   -0.03   -0.03 |    0.71    1.85 |   -1.52   -3.13 |    1.47    3.14
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.04   -0.03 |    0.03    0.04    0.03
w_rewards |   -0.00 |    0.00 |   -0.05 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -46.13 |   13.36 |  -50.00 |    0.00
theta_cv |    0.59 |    0.32 |    0.00 |    3.00
seeker_angles |    0.06    0.01 |    0.32    0.33 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0563  0.0073 |  0.3203  0.3267 | -1.0000 -0.9999 |  1.0000  0.9998
optical_flow |  0.0002  0.0000 |  0.0099  0.0094 | -0.2764 -0.1924 |  0.2730  0.2874
v_err    | -0.0187 |  0.0920 | -0.4797 |  0.6745
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  164.92 |  116.23 |   10.72 |  561.81
tracking_rewards |  -83.84 |   19.00 | -135.24 |  -46.91
steps    |     292 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03    0.03 |    0.66    1.83 |   -1.52   -3.13 |    1.46    3.10
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.04   -0.04 |    0.04    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -45.00 |   15.00 |  -50.00 |    0.00
theta_cv |    0.60 |    0.34 |    0.00 |    2.89
seeker_angles |    0.04    0.02 |    0.32    0.33 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0440  0.0192 |  0.3163  0.3272 | -1.0000 -0.9999 |  1.0000  0.9998
optical_flow |  0.0000  0.0000 |  0.0103  0.0108 | -0.4503 -0.1974 |  0.1881  0.1505
v_err    | -0.0174 |  0.0918 | -0.4605 |  1.1150
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  150.77 |  109.82 |    0.93 |  605.63
tracking_rewards |  -84.09 |   19.45 | -146.72 |  -49.13
steps    |     299 |  

attitude |   -0.01   -0.00   -0.14 |    1.23    0.67    1.86 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.06   -0.05 |    0.05    0.05    0.05
a_f      |    0.00   -0.17 |    0.68    1.86 |   -1.54   -3.14 |    1.42    3.09
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.04    0.03    0.04
w_rewards |   -0.00 |    0.01 |   -0.11 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -45.97 |   13.61 |  -50.00 |    0.00
theta_cv |    0.60 |    0.33 |    0.00 |    2.53
seeker_angles |    0.06    0.02 |    0.32    0.32 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0597  0.0153 |  0.3194  0.3153 | -0.9999 -1.0000 |  0.9998  0.9997
optical_flow |  0.0001  0.0001 |  0.0110  0.0105 | -0.4894 -0.3258 |  0.3652  0.1893
v_err    | -0.0215 |  0.0869 | -0.4782 |  0.6641
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  152

w        |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.18 |    0.65    1.82 |   -1.54   -3.14 |    1.51    3.14
w_f      |   -0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.03    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -46.61 |   12.57 |  -50.00 |    0.00
theta_cv |    0.59 |    0.33 |    0.00 |    2.68
seeker_angles |    0.05    0.01 |    0.31    0.31 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0483  0.0149 |  0.3139  0.3076 | -0.9999 -1.0000 |  0.9996  1.0000
optical_flow |  0.0001 -0.0002 |  0.0109  0.0105 | -0.2195 -0.2535 |  0.4467  0.4126
v_err    | -0.0223 |  0.0858 | -0.4557 |  1.1588
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  146.77 |  106.28 |    3.87 |  560.40
tracking_rewards |  -79.93 |   16.46 | -123.92 |  -43.69
steps    |     301 |  

attitude |   -0.00   -0.04   -0.05 |    1.12    0.65    1.84 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.06   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04    0.04 |    0.65    1.84 |   -1.51   -3.13 |    1.50    3.13
w_f      |   -0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.04 |    0.04    0.02    0.04
w_rewards |   -0.00 |    0.01 |   -0.10 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -44.84 |   15.21 |  -50.00 |    0.00
theta_cv |    0.61 |    0.33 |    0.00 |    2.91
seeker_angles |    0.04    0.01 |    0.32    0.31 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0428  0.0072 |  0.3185  0.3092 | -0.9999 -0.9999 |  0.9995  1.0000
optical_flow | -0.0002  0.0003 |  0.0110  0.0107 | -0.4109 -0.6504 |  0.5689  0.3466
v_err    | -0.0226 |  0.0863 | -0.5596 |  0.5948
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  150

norm_thrust |    1.57 |    0.68 |    0.00 |    3.46
fuel     |    4.59 |    0.71 |    2.35 |    5.85
rewards  | -136.18 |   21.53 | -255.59 |  -67.83
fuel_rewards |  -13.13 |    2.04 |  -16.73 |   -6.72
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.43 |   15.31 |    0.01 |  191.34
norm_af  |    1.76 |    0.87 |    0.12 |    3.36
norm_wf  |    0.02 |    0.01 |    0.00 |    0.08
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.13   -0.03    0.14 |    1.21    0.65    1.88 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02    0.23 |    0.68    1.83 |   -1.51   -3.11 |    1.54    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.

ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0340   0.0150   0.0682   6.4661   2.1407   2.4885
Update Cnt = 240    ET =    996.0   Stats:  Mean, Std, Min, Max
r_f      |  -17.46    9.82    6.06 |  244.99  236.20  248.95 | -814.41 -744.01 -806.51 |  549.03  710.59  754.12
v_f      |    0.05   -0.02    0.01 |    0.33    0.36    0.36 |   -0.80   -1.16   -0.90 |    0.90    1.26    1.22
r_i      |  -45.13   25.38  -13.72 |  684.05  694.78  737.20 |-1289.24-1348.94-1314.74 | 1226.96 1274.25 1323.23
v_i      |    0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.10    0.10    0.10
norm_rf  |  133.65 |  105.01 |    8.41 |  554.90
norm_vf  |    0.57 |    0.21 |    0.16 |    1.50
gs_f     |    1.01 |    1.57 |    0.02 |   19.78
thrust   |    0.01   -0.00    0.01 |    0.99    1.00    0.99 |   -3.39   -3.44   -3.37 |    3.46    3.45    3.39
norm_thrust |    1.58 |    0.68 |    0.00 |    3.46
fuel     |    4.62 |    0.69 |    2.27 |    5.80
rewards  | -137.94 |

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3526   0.1207   0.6619   1.3010   0.5878   0.2545
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0271   0.0085   0.0518   6.4661   2.1407   2.4885
***** Episode 7759, Mean R = -137.6  Std R = 18.5  Min R = -172.7
PolicyLoss: -0.00611
Policy_Beta: 0.0667
Policy_Entropy: 0.00578
Policy_KL: 0.00104
Policy_SD: 0.955
Policy_lr_mult: 1
Steps: 9.32e+03
TotalSteps: 2.24e+06
VF_0_ExplainedVarNew: 0.932
VF_0_ExplainedVarOld: 0.906
VF_0_Loss : 0.141


ADV1:  -0.002579745913731668 0.11300176654330513 0.47215004470219446 -0.9753886477152527
ADV2:  0.030466916841207486 0.8147092728093063 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4768   0.1463   0.9007   1.3010   0.5878   0.2545
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0277   0.0086   0.0471   6.4661   2.1407   2.4885
Update Cnt = 250    ET =    909.7   Stats:  Mean, Std, Min, Max
r_f      |  -30.49  -19.65    4.02 |  243.35  231.31  242.11 | -682.25 -837.73 -4

ADV1:  -0.0047702932166656655 0.14093212145482498 2.248818932881336 -0.9562161775601521
ADV2:  -0.002370126922144098 0.7061171076459931 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3974   0.1302   0.6635   1.3298   0.6221   0.2545
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0231   0.0092   0.0380   6.4661   2.1407   2.4885
***** Episode 8038, Mean R = -131.2  Std R = 16.9  Min R = -160.7
PolicyLoss: 0.00301
Policy_Beta: 0.0667
Policy_Entropy: 0.00575
Policy_KL: 0.00104
Policy_SD: 0.954
Policy_lr_mult: 1
Steps: 9.52e+03
TotalSteps: 2.33e+06
VF_0_ExplainedVarNew: 0.906
VF_0_ExplainedVarOld: 0.872
VF_0_Loss : 0.15


ADV1:  -0.0030499336485622125 0.16878039316313517 2.2735746479034424 -1.6679517242417483
ADV2:  -0.009970443506813557 0.6830106386058025 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4732   0.1756   0.8673   1.3298   0.6221   0.2545
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0310   0.0100   0.0491   6.4661   2.1407   2.4885
*

ADV1:  -0.008112180222376468 0.1487159738010508 2.2930814901987713 -0.9464549446105979
ADV2:  -0.02110559529142184 0.6939864741694989 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4518   0.1340   0.7348   1.3298   0.6221   0.2545
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0157   0.0065   0.0346   6.4661   2.1407   2.4885
***** Episode 8317, Mean R = -137.2  Std R = 24.3  Min R = -211.6
PolicyLoss: 0.0251
Policy_Beta: 0.0667
Policy_Entropy: 0.00643
Policy_KL: 0.000919
Policy_SD: 0.955
Policy_lr_mult: 1
Steps: 9.96e+03
TotalSteps: 2.42e+06
VF_0_ExplainedVarNew: 0.879
VF_0_ExplainedVarOld: 0.857
VF_0_Loss : 0.141


ADV1:  -0.010969663802561631 0.1393982343888975 2.0669401558672664 -0.925377100951623
ADV2:  -0.015848988867708486 0.6971063515881274 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4180   0.1324   0.8266   1.3298   0.6221   0.2545
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0246   0.0112   0.0535   6.4661   2.1407   2.4885
*****

ADV1:  -0.0006900399666393304 0.142124476522603 2.1745198345184327 -1.481076094125092
ADV2:  -0.006858215661971001 0.7060042842437739 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4295   0.0957   0.6921   2.0937   0.7178   0.3971
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0316   0.0098   0.0520   6.4661   2.1407   2.4885
***** Episode 8596, Mean R = -135.6  Std R = 17.7  Min R = -184.1
PolicyLoss: 0.00486
Policy_Beta: 0.0667
Policy_Entropy: 0.00665
Policy_KL: 0.00092
Policy_SD: 0.953
Policy_lr_mult: 1
Steps: 9.7e+03
TotalSteps: 2.51e+06
VF_0_ExplainedVarNew: 0.895
VF_0_ExplainedVarOld: 0.874
VF_0_Loss : 0.138


ADV1:  3.988709024846909e-05 0.16978742982640185 2.220130023956299 -1.4615041939417543
ADV2:  -0.02565988832419801 0.6643968828922103 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3091   0.0818   0.5372   2.0937   0.7178   0.3971
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0311   0.0073   0.0450   6.4661   2.1407   2.4885
***** 

Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129319 0.00168267] 0.0027816982941464494
ADV1:  -0.016761726559850063 0.1589980608053896 1.94890602866854 -0.8227999303609699
ADV2:  -0.024080357364298435 0.6956871995299 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.5466   0.2544   1.2453   2.0937   0.7178   0.3971
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0284   0.0123   0.0600   6.4661   2.1407   2.4885
***** Episode 8875, Mean R = -134.6  Std R = 19.4  Min R = -169.0
PolicyLoss: 0.034
Policy_Beta: 0.0667
Policy_Entropy: 0.00689
Policy_KL: 0.000896
Policy_SD: 0.952
Policy_lr_mult: 1
Steps: 1.01e+04
TotalSteps: 2.6e+06
VF_0_ExplainedVarNew: 0.865
VF_0_ExplainedVarOld: 0.828
VF_0_Loss : 0.115


ADV1:  -0.019287908200182623 0.15521664673081945 2.1627286942799886 -1.3548418601353984
ADV2:  0.006440878558293336 0.7330428305661647 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4325   0.1383   0.8289   2.0937   0.7178   0.3971
ValFun  Gradients: u

ADV1:  0.006098038722277928 0.15311283345358312 2.100024668375651 -1.8353400850296042
ADV2:  -0.01317956373850215 0.6709575420501604 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3691   0.0965   0.6969   2.0937   0.7178   0.3971
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0256   0.0059   0.0399   6.4661   2.1407   2.4885
***** Episode 9154, Mean R = -132.1  Std R = 23.2  Min R = -176.9
PolicyLoss: 0.00761
Policy_Beta: 0.0667
Policy_Entropy: 0.00779
Policy_KL: 0.000872
Policy_SD: 0.953
Policy_lr_mult: 1
Steps: 9.81e+03
TotalSteps: 2.69e+06
VF_0_ExplainedVarNew: 0.874
VF_0_ExplainedVarOld: 0.851
VF_0_Loss : 0.113


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129319 0.00168267] 0.0027816982941464494
ADV1:  -0.007696350616436231 0.14958840431672013 1.9126126755280524 -1.2063813829422019
ADV2:  -0.0012270470108189093 0.7320333627572068 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4466   0.1291   0.7319   2.0937   0.7178   0.3971
ValFun  Grad

ADV1:  0.02043747167420177 0.20039488637758973 2.32348695119222 -1.4848330338796
ADV2:  -0.031762316200333165 0.6749172955982469 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3746   0.1194   0.7509   2.0937   0.8026   0.3971
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0359   0.0143   0.0731   6.4661   2.1407   2.4885
***** Episode 9433, Mean R = -123.7  Std R = 29.6  Min R = -168.6
PolicyLoss: 0.0219
Policy_Beta: 0.0667
Policy_Entropy: 0.00781
Policy_KL: 0.0012
Policy_SD: 0.952
Policy_lr_mult: 1
Steps: 9.98e+03
TotalSteps: 2.78e+06
VF_0_ExplainedVarNew: 0.797
VF_0_ExplainedVarOld: 0.714
VF_0_Loss : 0.0834


ADV1:  0.0028802105605978587 0.1794965884857694 2.0827430432976084 -1.736005608713456
ADV2:  -0.018519462143205507 0.7167378614188088 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3862   0.1055   0.5885   2.0937   0.8026   0.3971
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0220   0.0073   0.0390   6.4661   2.1407   2.4885
***** Episo

ADV1:  -0.030647130926222284 0.1435829003569027 1.361883101463318 -1.5236092535654726
ADV2:  0.03359863739211977 0.7805997813815037 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.7980   0.4128   2.0480   2.0937   0.8026   0.4128
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0473   0.0251   0.0971   6.4661   2.1407   2.4885
***** Episode 9712, Mean R = -135.6  Std R = 15.8  Min R = -176.4
PolicyLoss: -0.0197
Policy_Beta: 0.0667
Policy_Entropy: 0.00808
Policy_KL: 0.00101
Policy_SD: 0.949
Policy_lr_mult: 1
Steps: 1.03e+04
TotalSteps: 2.87e+06
VF_0_ExplainedVarNew: 0.925
VF_0_ExplainedVarOld: 0.87
VF_0_Loss : 0.0584


ADV1:  0.019363769043980673 0.19261596295799252 2.280898045160059 -1.2506214619776492
ADV2:  -0.05108622603274336 0.657651149646766 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3737   0.1372   0.6620   2.0937   0.8026   0.4128
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0518   0.0247   0.1021   6.4661   2.1407   2.4885
***** Epi

ADV1:  -0.017011465187516478 0.17553028272898236 2.063206743809943 -1.567807046143293
ADV2:  0.007561407084778342 0.7461196288272945 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4845   0.1532   0.7939   2.0937   0.8026   0.4128
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0325   0.0127   0.0614   6.4661   2.1407   2.4885
***** Episode 9991, Mean R = -129.2  Std R = 21.7  Min R = -186.5
PolicyLoss: -0.00277
Policy_Beta: 0.0667
Policy_Entropy: 0.00868
Policy_KL: 0.001
Policy_SD: 0.95
Policy_lr_mult: 1
Steps: 9.94e+03
TotalSteps: 2.96e+06
VF_0_ExplainedVarNew: 0.852
VF_0_ExplainedVarOld: 0.805
VF_0_Loss : 0.0618


ADV1:  -0.0016797594773009824 0.15904543626802164 1.9719149696910452 -1.1273475615183535
ADV2:  -0.008384013689985731 0.7176410597036781 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.6515   0.2578   1.4117   2.0937   0.8026   0.4128
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0159   0.0058   0.0282   6.4661   2.1407   2.4885
****

cs_angles |  0.0347 -0.0112 |  0.2855  0.2832 | -1.0000 -0.9997 |  1.0000  0.9995
optical_flow |  0.0004  0.0001 |  0.0168  0.0151 | -0.5194 -0.4118 |  1.1183  0.6063
v_err    | -0.0203 |  0.0747 | -0.5009 |  0.5746
landing_rewards |    0.03 |    0.57 |    0.00 |   10.00
landing_margin |   73.10 |   83.47 |   -0.02 |  457.26
tracking_rewards |  -74.97 |   16.73 | -128.27 |  -36.55
steps    |     335 |      38 |     153 |     402
***** Episode 10270, Mean R = -131.2  Std R = 30.5  Min R = -191.7
PolicyLoss: 0.0106
Policy_Beta: 0.0667
Policy_Entropy: 0.00915
Policy_KL: 0.00123
Policy_SD: 0.95
Policy_lr_mult: 1
Steps: 1.03e+04
TotalSteps: 3.06e+06
VF_0_ExplainedVarNew: 0.826
VF_0_ExplainedVarOld: 0.775
VF_0_Loss : 0.066


ADV1:  -0.03221310583968131 0.21146562443354827 2.3367218653361004 -1.5043561784426394
ADV2:  -0.00018542054391893563 0.7200407286075423 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3948   0.0839   0.5780   2.0937   0.8026   0.4128
ValFun  Gradients: u/s

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.07   -0.02 |    0.64    1.84 |   -1.53   -3.14 |    1.48    3.12
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.04 |    0.05    0.05    0.04
w_rewards |   -0.00 |    0.01 |   -0.14 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -42.26 |   18.09 |  -50.00 |    0.00
theta_cv |    0.60 |    0.32 |    0.00 |    2.86
seeker_angles |    0.04   -0.01 |    0.28    0.28 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0354 -0.0124 |  0.2805  0.2813 | -0.9996 -0.9991 |  0.9998  0.9998
optical_flow |  0.0002 -0.0000 |  0.0174  0.0166 | -1.0232 -1.1904 |  0.7561  0.5584
v_err    | -0.0198 |  0.0748 | -0.5104 |  0.4992
landing_rewards |    0.10 |    0.98 |    0.00 |   10.00
landing_margin |   67.98 |   81.68 |   -0.06 |  510.01
tracking_rewards |  -74.18 |   14.18 | -114.24 |  -44.00
steps    |     335 |  

attitude |   -0.05   -0.05    0.18 |    1.12    0.63    1.83 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.03    0.12 |    0.63    1.82 |   -1.50   -3.12 |    1.42    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.05   -0.04 |    0.05    0.04    0.03
w_rewards |   -0.00 |    0.02 |   -0.38 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -43.55 |   16.76 |  -50.00 |    0.00
theta_cv |    0.61 |    0.32 |    0.00 |    3.01
seeker_angles |    0.03   -0.01 |    0.29    0.27 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0318 -0.0081 |  0.2924  0.2651 | -0.9997 -0.9995 |  0.9999  0.9999
optical_flow | -0.0000  0.0002 |  0.0179  0.0150 | -0.6802 -0.9301 |  1.0301  0.5665
v_err    | -0.0190 |  0.0746 | -0.5045 |  0.5201
landing_rewards |    0.06 |    0.80 |    0.00 |   10.00
landing_margin |   60

attitude |    0.07    0.04    0.11 |    1.18    0.69    1.87 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.06 |    0.06    0.06    0.05
a_f      |    0.01    0.12 |    0.69    1.87 |   -1.46   -3.13 |    1.36    3.14
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.07   -0.05   -0.03 |    0.06    0.06    0.04
w_rewards |   -0.00 |    0.03 |   -0.32 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -40.65 |   19.50 |  -50.00 |    0.00
theta_cv |    0.59 |    0.31 |    0.00 |    3.01
seeker_angles |    0.04   -0.00 |    0.27    0.27 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0427 -0.0022 |  0.2697  0.2719 | -1.0000 -1.0000 |  0.9999  0.9995
optical_flow |  0.0002 -0.0000 |  0.0187  0.0174 | -0.8730 -0.5652 |  0.9977  0.7910
v_err    | -0.0188 |  0.0757 | -0.5031 |  1.1563
landing_rewards |    0.23 |    1.49 |    0.00 |   10.00
landing_margin |   51

attitude |    0.05   -0.02    0.06 |    1.18    0.63    1.85 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.06   -0.05 |    0.06    0.06    0.05
a_f      |    0.00    0.08 |    0.65    1.90 |   -1.52   -3.13 |    1.51    3.13
w_f      |   -0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.06   -0.05 |    0.05    0.05    0.05
w_rewards |   -0.00 |    0.01 |   -0.19 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -37.58 |   21.60 |  -50.00 |    0.00
theta_cv |    0.59 |    0.33 |    0.00 |    3.07
seeker_angles |    0.04   -0.00 |    0.28    0.27 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0373 -0.0011 |  0.2800  0.2658 | -0.9997 -0.9999 |  1.0000  0.9994
optical_flow |  0.0004 -0.0001 |  0.0215  0.0189 | -1.0519 -0.7933 |  0.9364  0.9222
v_err    | -0.0188 |  0.0737 | -0.5112 |  0.5070
landing_rewards |    0.29 |    1.68 |    0.00 |   10.00
landing_margin |   48

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.06   -0.05 |    0.06    0.05    0.05
a_f      |    0.10   -0.00 |    0.63    1.87 |   -1.34   -3.14 |    1.47    3.11
w_f      |   -0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.06   -0.04 |    0.06    0.04    0.04
w_rewards |   -0.00 |    0.01 |   -0.11 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -37.58 |   21.60 |  -50.00 |    0.00
theta_cv |    0.58 |    0.32 |    0.00 |    3.11
seeker_angles |    0.03    0.01 |    0.28    0.26 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0345  0.0053 |  0.2767  0.2581 | -0.9996 -0.9991 |  0.9997  0.9990
optical_flow |  0.0005  0.0000 |  0.0231  0.0182 | -1.2367 -1.0211 |  1.2903  0.8007
v_err    | -0.0183 |  0.0735 | -0.5131 |  0.5130
landing_rewards |    0.55 |    2.28 |    0.00 |   10.00
landing_margin |   46.03 |   77.46 |   -0.08 |  538.90
tracking_rewards |  -71.91 |   16.79 | -127.53 |  -37.05
steps    |     344 |  

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.05    0.11 |    0.61    1.87 |   -1.41   -3.14 |    1.51    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.06    0.04    0.03
w_rewards |   -0.00 |    0.01 |   -0.12 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -35.97 |   22.47 |  -50.00 |    0.00
theta_cv |    0.59 |    0.31 |    0.00 |    2.69
seeker_angles |    0.02    0.00 |    0.28    0.25 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0156  0.0043 |  0.2807  0.2521 | -1.0000 -0.9997 |  0.9999  0.9999
optical_flow |  0.0002 -0.0000 |  0.0227  0.0176 | -0.8486 -1.1932 |  1.2280  0.8199
v_err    | -0.0179 |  0.0724 | -0.5192 |  0.5128
landing_rewards |    0.55 |    2.28 |    0.00 |   10.00
landing_margin |   38.08 |   61.69 |   -0.06 |  439.54
tracking_rewards |  -72.41 |   17.15 | -148.37 |  -36.33
steps    |     348 |  

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.06   -0.05 |    0.05    0.06    0.05
a_f      |    0.06   -0.01 |    0.66    1.87 |   -1.52   -3.14 |    1.40    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.04   -0.04 |    0.05    0.06    0.04
w_rewards |   -0.00 |    0.02 |   -0.28 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -32.10 |   23.97 |  -50.00 |    0.00
theta_cv |    0.57 |    0.30 |    0.00 |    3.09
seeker_angles |    0.01    0.00 |    0.27    0.23 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0148  0.0013 |  0.2712  0.2342 | -1.0000 -0.9996 |  0.9998  0.9999
optical_flow |  0.0004  0.0002 |  0.0242  0.0191 | -0.6882 -0.8685 |  1.1502  0.9785
v_err    | -0.0153 |  0.0719 | -0.5032 |  0.4803
landing_rewards |    1.03 |    3.04 |    0.00 |   10.00
landing_margin |   29.40 |   47.75 |   -0.07 |  366.34
tracking_rewards |  -69.63 |   15.75 | -129.20 |  -35.64
steps    |     351 |  

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.07 |    0.06    0.07    0.05
a_f      |    0.04    0.19 |    0.66    1.85 |   -1.40   -3.11 |    1.48    3.13
w_f      |   -0.00   -0.00    0.00 |    0.02    0.02    0.01 |   -0.06   -0.05   -0.04 |    0.06    0.04    0.05
w_rewards |   -0.01 |    0.07 |   -1.25 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -30.97 |   24.28 |  -50.00 |    0.00
theta_cv |    0.56 |    0.30 |    0.00 |    2.91
seeker_angles |    0.01   -0.01 |    0.26    0.23 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0098 -0.0066 |  0.2555  0.2330 | -0.9999 -0.9987 |  0.9996  0.9998
optical_flow |  0.0002 -0.0000 |  0.0255  0.0198 | -1.0910 -0.8191 |  1.2999  0.9223
v_err    | -0.0144 |  0.0742 | -0.5013 |  1.1727
landing_rewards |    1.58 |    3.65 |    0.00 |   10.00
landing_margin |   24.27 |   44.25 |   -0.07 |  461.94
tracking_rewards |  -68.56 |   15.69 | -134.76 |  -36.44
steps    |     353 |  

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.06    0.06
a_f      |    0.04   -0.05 |    0.63    1.82 |   -1.35   -3.13 |    1.42    3.12
w_f      |   -0.00   -0.00    0.00 |    0.02    0.02    0.02 |   -0.05   -0.05   -0.04 |    0.06    0.06    0.05
w_rewards |   -0.00 |    0.02 |   -0.16 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -23.39 |   24.95 |  -50.00 |    0.00
theta_cv |    0.55 |    0.29 |    0.00 |    3.04
seeker_angles |    0.01   -0.01 |    0.25    0.22 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0085 -0.0056 |  0.2454  0.2155 | -0.9996 -0.9968 |  0.9992  0.9991
optical_flow |  0.0000  0.0001 |  0.0258  0.0215 | -0.8628 -0.9996 |  0.8848  0.9800
v_err    | -0.0146 |  0.0708 | -0.5037 |  0.4268
landing_rewards |    2.55 |    4.36 |    0.00 |   10.00
landing_margin |   17.90 |   45.21 |   -0.09 |  529.83
tracking_rewards |  -66.74 |   15.59 | -120.43 |  -32.34
steps    |     360 |  

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.06    0.05    0.07
a_f      |   -0.03   -0.04 |    0.66    1.92 |   -1.55   -3.10 |    1.49    3.13
w_f      |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.06   -0.05   -0.07 |    0.06    0.05    0.07
w_rewards |   -0.01 |    0.03 |   -0.27 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -15.81 |   23.25 |  -50.00 |    0.00
theta_cv |    0.51 |    0.27 |    0.00 |    3.10
seeker_angles |    0.01   -0.00 |    0.22    0.20 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0071 -0.0046 |  0.2226  0.1975 | -0.9999 -0.9983 |  0.9989  0.9992
optical_flow |  0.0000  0.0001 |  0.0280  0.0221 | -1.1135 -0.8554 |  0.8178  0.8346
v_err    | -0.0130 |  0.0700 | -0.5039 |  0.4580
landing_rewards |    4.23 |    4.94 |    0.00 |   10.00
landing_margin |   10.53 |   29.57 |   -0.08 |  429.50
tracking_rewards |  -62.47 |   14.82 | -125.71 |  -32.75
steps    |     364 |  

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.06   -0.05 |    0.06    0.05    0.05
a_f      |    0.00   -0.02 |    0.65    1.88 |   -1.52   -3.12 |    1.45    3.13
w_f      |   -0.00    0.00   -0.00 |    0.02    0.02    0.02 |   -0.07   -0.05   -0.04 |    0.06    0.04    0.05
w_rewards |   -0.01 |    0.05 |   -0.88 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -14.68 |   22.77 |  -50.00 |    0.00
theta_cv |    0.52 |    0.28 |    0.00 |    3.12
seeker_angles |    0.00   -0.00 |    0.22    0.19 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0023 -0.0045 |  0.2247  0.1908 | -0.9972 -0.9994 |  1.0000  0.9997
optical_flow | -0.0001  0.0002 |  0.0279  0.0238 | -1.4222 -0.9321 |  1.1621  1.3203
v_err    | -0.0130 |  0.0700 | -0.5051 |  0.4952
landing_rewards |    4.61 |    4.98 |    0.00 |   10.00
landing_margin |   10.28 |   26.71 |   -0.08 |  337.43
tracking_rewards |  -61.66 |   16.51 | -121.26 |  -26.15
steps    |     363 |  

attitude |   -0.05   -0.04   -0.00 |    1.24    0.68    1.95 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.06 |    0.06    0.05    0.06
a_f      |   -0.02    0.15 |    0.68    1.93 |   -1.51   -3.14 |    1.49    3.13
w_f      |   -0.01    0.00    0.00 |    0.02    0.02    0.02 |   -0.07   -0.05   -0.06 |    0.06    0.05    0.06
w_rewards |   -0.00 |    0.02 |   -0.19 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -9.03 |   19.24 |  -50.00 |    0.00
theta_cv |    0.49 |    0.26 |    0.00 |    2.66
seeker_angles |    0.00    0.00 |    0.20    0.18 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0029  0.0046 |  0.1988  0.1827 | -0.9961 -0.9990 |  0.9995  0.9986
optical_flow |  0.0001  0.0002 |  0.0288  0.0242 | -1.3157 -1.1277 |  1.2355  1.2149
v_err    | -0.0111 |  0.0693 | -0.5032 |  0.3611
landing_rewards |    5.39 |    4.98 |    0.00 |   10.00
landing_margin |    5

attitude |   -0.10   -0.04    0.14 |    1.18    0.66    1.84 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.07   -0.06 |    0.07    0.05    0.06
a_f      |   -0.05    0.12 |    0.66    1.86 |   -1.38   -3.14 |    1.53    3.13
w_f      |   -0.00   -0.00    0.00 |    0.02    0.02    0.02 |   -0.06   -0.07   -0.06 |    0.06    0.04    0.06
w_rewards |   -0.01 |    0.05 |   -0.53 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -4.52 |   14.33 |  -50.00 |    0.00
theta_cv |    0.45 |    0.25 |    0.00 |    2.98
seeker_angles |    0.00   -0.00 |    0.18    0.16 |   -1.00   -0.98 |    1.00    1.00
cs_angles |  0.0027 -0.0011 |  0.1758  0.1574 | -0.9995 -0.9840 |  0.9988  0.9996
optical_flow |  0.0002  0.0001 |  0.0299  0.0254 | -1.2802 -1.1117 |  1.7768  1.3392
v_err    | -0.0093 |  0.0684 | -0.5028 |  0.4045
landing_rewards |    6.39 |    4.80 |    0.00 |   10.00
landing_margin |    2

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.06   -0.05 |    0.06    0.05    0.05
a_f      |   -0.01   -0.10 |    0.64    1.87 |   -1.50   -3.14 |    1.48    3.14
w_f      |    0.00   -0.00    0.00 |    0.02    0.02    0.02 |   -0.06   -0.06   -0.05 |    0.06    0.04    0.05
w_rewards |   -0.00 |    0.02 |   -0.24 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -1.94 |    9.65 |  -50.00 |    0.00
theta_cv |    0.43 |    0.24 |    0.00 |    2.95
seeker_angles |    0.00   -0.00 |    0.16    0.15 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0027 -0.0031 |  0.1614  0.1523 | -0.9986 -0.9983 |  0.9978  0.9995
optical_flow |  0.0002  0.0000 |  0.0308  0.0261 | -1.4139 -0.9284 |  1.2213  1.2988
v_err    | -0.0104 |  0.0671 | -0.5002 |  0.4816
landing_rewards |    7.45 |    4.36 |    0.00 |   10.00
landing_margin |    2.31 |   25.73 |   -0.08 |  446.48
tracking_rewards |  -50.20 |   13.99 | -108.58 |  -28.23
steps    |     373 |  

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.07    0.05    0.07
a_f      |   -0.00    0.16 |    0.65    1.74 |   -1.47   -3.13 |    1.44    3.10
w_f      |   -0.00    0.00    0.00 |    0.02    0.02    0.02 |   -0.05   -0.05   -0.04 |    0.07    0.05    0.07
w_rewards |   -0.00 |    0.01 |   -0.16 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.97 |    6.89 |  -50.00 |    0.00
theta_cv |    0.42 |    0.25 |    0.00 |    2.66
seeker_angles |    0.00   -0.00 |    0.15    0.15 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0027 -0.0030 |  0.1501  0.1453 | -0.9977 -0.9965 |  0.9975  0.9994
optical_flow |  0.0001  0.0001 |  0.0292  0.0261 | -1.2477 -0.8880 |  1.1917  1.0162
v_err    | -0.0091 |  0.0663 | -0.5002 |  0.4723
landing_rewards |    7.45 |    4.36 |    0.00 |   10.00
landing_margin |    1.87 |   22.18 |   -0.10 |  381.64
tracking_rewards |  -47.11 |   13.43 | -108.58 |  -21.58
steps    |     373 |  

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02    0.12 |    0.65    1.84 |   -1.46   -3.14 |    1.55    3.12
w_f      |   -0.00   -0.00    0.00 |    0.03    0.02    0.02 |   -0.06   -0.05   -0.04 |    0.05    0.05    0.05
w_rewards |   -0.00 |    0.01 |   -0.17 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.65 |    5.64 |  -50.00 |    0.00
theta_cv |    0.40 |    0.25 |    0.00 |    2.84
seeker_angles |    0.00   -0.00 |    0.14    0.14 |   -1.00   -0.98 |    1.00    1.00
cs_angles |  0.0026 -0.0010 |  0.1380  0.1368 | -0.9995 -0.9830 |  0.9971  0.9965
optical_flow |  0.0002  0.0001 |  0.0318  0.0271 | -1.1990 -0.9299 |  1.4913  1.1696
v_err    | -0.0092 |  0.0653 | -0.4998 |  0.2569
landing_rewards |    7.65 |    4.24 |    0.00 |   10.00
landing_margin |    0.22 |    2.02 |   -0.09 |   24.12
tracking_rewards |  -43.85 |   12.77 | -105.30 |  -23.90
steps    |     374 |  

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.06    0.05
a_f      |   -0.03    0.14 |    0.66    1.81 |   -1.40   -3.12 |    1.54    3.14
w_f      |   -0.01    0.00    0.00 |    0.02    0.01    0.02 |   -0.06   -0.03   -0.04 |    0.05    0.06    0.05
w_rewards |   -0.00 |    0.01 |   -0.22 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.41 |    0.25 |    0.00 |    1.98
seeker_angles |    0.01   -0.00 |    0.13    0.13 |   -0.99   -0.93 |    1.00    0.98
cs_angles |  0.0073 -0.0045 |  0.1338  0.1277 | -0.9941 -0.9323 |  0.9970  0.9774
optical_flow |  0.0001  0.0002 |  0.0320  0.0253 | -1.1071 -1.1428 |  1.3051  1.1404
v_err    | -0.0097 |  0.0641 | -0.5002 |  0.2129
landing_rewards |    7.97 |    4.02 |    0.00 |   10.00
landing_margin |    0.07 |    1.54 |   -0.07 |   27.05
tracking_rewards |  -42.12 |   11.19 |  -87.83 |  -22.35
steps    |     376 |  

attitude |   -0.00   -0.04    0.11 |    1.25    0.65    1.90 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.07    0.05    0.05
a_f      |   -0.01    0.13 |    0.66    1.87 |   -1.50   -3.13 |    1.45    3.14
w_f      |   -0.00   -0.00    0.00 |    0.02    0.02    0.02 |   -0.06   -0.04   -0.04 |    0.07    0.05    0.05
w_rewards |   -0.00 |    0.02 |   -0.17 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.39 |    0.25 |    0.00 |    2.24
seeker_angles |    0.00   -0.01 |    0.12    0.13 |   -0.99   -0.99 |    1.00    0.99
cs_angles |  0.0044 -0.0078 |  0.1226  0.1252 | -0.9860 -0.9927 |  0.9996  0.9905
optical_flow |  0.0003  0.0001 |  0.0294  0.0238 | -1.1469 -1.1118 |  1.6019  0.8989
v_err    | -0.0096 |  0.0642 | -0.4994 |  0.1650
landing_rewards |    8.16 |    3.87 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.13   -0.02   -0.05 |    1.21    0.66    1.87 |   -3.14   -1.56   -3.14 |    3.14    1.54    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.07    0.05    0.05
a_f      |   -0.05    0.08 |    0.66    1.87 |   -1.52   -3.14 |    1.34    3.13
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.02 |   -0.06   -0.04   -0.04 |    0.07    0.04    0.05
w_rewards |   -0.00 |    0.01 |   -0.22 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.39 |    0.25 |    0.00 |    1.90
seeker_angles |    0.01   -0.01 |    0.12    0.12 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0095 -0.0124 |  0.1227  0.1166 | -0.9965 -0.9990 |  0.9967  0.9973
optical_flow |  0.0002  0.0001 |  0.0303  0.0251 | -0.9796 -1.0407 |  1.4371  1.0203
v_err    | -0.0095 |  0.0633 | -0.4999 |  0.2056
landing_rewards |    7.74 |    4.18 |    0.00 |   10.00
landing_margin |    0

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.05    0.06 |    0.64    1.88 |   -1.49   -3.14 |    1.47    3.13
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.02 |   -0.06   -0.04   -0.05 |    0.05    0.04    0.05
w_rewards |   -0.00 |    0.01 |   -0.14 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.38 |    0.25 |    0.00 |    1.60
seeker_angles |    0.00   -0.01 |    0.12    0.11 |   -1.00   -0.98 |    1.00    1.00
cs_angles |  0.0027 -0.0145 |  0.1194  0.1105 | -0.9999 -0.9796 |  0.9976  0.9977
optical_flow |  0.0003  0.0002 |  0.0310  0.0235 | -1.4125 -0.7840 |  1.6418  1.0410
v_err    | -0.0095 |  0.0621 | -0.4836 |  0.1635
landing_rewards |    7.61 |    4.26 |    0.00 |   10.00
landing_margin |   -0.02 |    0.03 |   -0.08 |    0.07
tracking_rewards |  -36.01 |    9.96 |  -82.44 |  -20.22
steps    |     376 |  

norm_af  |    1.80 |    0.91 |    0.08 |    3.38
norm_wf  |    0.03 |    0.01 |    0.00 |    0.07
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.01   -0.02    0.07 |    1.21    0.68    1.89 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02    0.06 |    0.69    1.89 |   -1.54   -3.14 |    1.52    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.02 |   -0.05   -0.03   -0.05 |    0.05    0.04    0.05
w_rewards |   -0.00 |    0.01 |   -0.07 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.37 |    0.25 |    0.00 |    1.84
seeker_angles |   -0.00   -0.02 |    0.11    0.11 |   -0.99   -0.99 |    1.00    1.00
cs_angles | -0.0019 -0.0161 |  0.1142  0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.06
a_f      |    0.01    0.16 |    0.66    1.85 |   -1.44   -3.12 |    1.49    3.14
w_f      |    0.00    0.00    0.00 |    0.03    0.01    0.02 |   -0.06   -0.04   -0.05 |    0.06    0.05    0.06
w_rewards |   -0.00 |    0.01 |   -0.14 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.37 |    0.26 |    0.00 |    1.60
seeker_angles |   -0.00   -0.01 |    0.11    0.11 |   -1.00   -1.00 |    1.00    0.99
cs_angles | -0.0015 -0.0124 |  0.1137  0.1082 | -0.9980 -0.9975 |  0.9988  0.9916
optical_flow |  0.0002 -0.0001 |  0.0294  0.0258 | -1.1093 -1.1771 |  1.3224  1.2314
v_err    | -0.0090 |  0.0617 | -0.5002 |  0.1561
landing_rewards |    7.71 |    4.20 |    0.00 |   10.00
landing_margin |   -0.01 |    0.02 |   -0.07 |    0.10
tracking_rewards |  -33.54 |    9.23 |  -83.44 |  -18.18
steps    |     375 |  

w        |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.02    0.00 |    0.66    1.81 |   -1.50   -3.14 |    1.41    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.02 |   -0.06   -0.03   -0.04 |    0.06    0.04    0.05
w_rewards |   -0.00 |    0.02 |   -0.24 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.37 |    0.26 |    0.00 |    1.55
seeker_angles |   -0.00   -0.01 |    0.11    0.11 |   -1.00   -0.99 |    0.99    0.99
cs_angles | -0.0007 -0.0136 |  0.1094  0.1100 | -0.9998 -0.9947 |  0.9944  0.9927
optical_flow |  0.0002  0.0001 |  0.0299  0.0261 | -1.1224 -1.5868 |  1.4730  0.9239
v_err    | -0.0090 |  0.0614 | -0.4985 |  0.1634
landing_rewards |    7.71 |    4.20 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.09
tracking_rewards |  -32.71 |    9.33 |  -90.46 |  -17.53
steps    |     374 |  

attitude |    0.13    0.01   -0.03 |    1.20    0.65    1.88 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.01   -0.06 |    0.65    1.90 |   -1.46   -3.14 |    1.40    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.02 |   -0.07   -0.03   -0.04 |    0.06    0.03    0.04
w_rewards |   -0.00 |    0.01 |   -0.20 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.37 |    0.26 |    0.00 |    1.50
seeker_angles |    0.00   -0.01 |    0.11    0.10 |   -0.99   -0.97 |    1.00    1.00
cs_angles |  0.0024 -0.0092 |  0.1104  0.1032 | -0.9910 -0.9679 |  0.9971  0.9977
optical_flow |  0.0001  0.0001 |  0.0300  0.0240 | -1.3090 -0.9468 |  1.0805  1.0104
v_err    | -0.0086 |  0.0616 | -0.5000 |  0.1796
landing_rewards |    7.42 |    4.38 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.00   -0.08 |    0.65    1.85 |   -1.40   -3.13 |    1.39    3.09
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.06   -0.03   -0.05 |    0.06    0.04    0.04
w_rewards |   -0.00 |    0.01 |   -0.08 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.26 |    0.00 |    1.59
seeker_angles |   -0.00   -0.00 |    0.10    0.10 |   -0.99   -1.00 |    1.00    1.00
cs_angles | -0.0023 -0.0037 |  0.0999  0.1020 | -0.9944 -0.9980 |  0.9959  0.9982
optical_flow |  0.0001  0.0001 |  0.0296  0.0252 | -1.2637 -1.1276 |  1.2924  1.1644
v_err    | -0.0093 |  0.0611 | -0.4998 |  0.1390
landing_rewards |    7.84 |    4.12 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.06
tracking_rewards |  -29.89 |    7.77 |  -75.95 |  -18.14
steps    |     377 |  

attitude |   -0.03   -0.00   -0.08 |    1.14    0.64    1.87 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.07    0.05    0.05
a_f      |    0.01   -0.02 |    0.63    1.86 |   -1.36   -3.14 |    1.44    3.14
w_f      |    0.00   -0.00    0.00 |    0.03    0.01    0.02 |   -0.05   -0.04   -0.04 |    0.07    0.03    0.05
w_rewards |   -0.00 |    0.01 |   -0.18 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.35 |    0.26 |    0.00 |    1.59
seeker_angles |    0.00   -0.01 |    0.10    0.10 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0030 -0.0065 |  0.0989  0.1032 | -0.9985 -0.9977 |  0.9972  0.9994
optical_flow |  0.0002 -0.0000 |  0.0284  0.0262 | -1.2436 -1.2988 |  1.1597  1.2919
v_err    | -0.0097 |  0.0604 | -0.5001 |  0.1674
landing_rewards |    7.65 |    4.24 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.04    0.01    0.05 |    1.23    0.68    1.89 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03   -0.10 |    0.68    1.88 |   -1.49   -3.14 |    1.56    3.14
w_f      |   -0.00   -0.00    0.00 |    0.03    0.01    0.02 |   -0.07   -0.03   -0.05 |    0.05    0.04    0.05
w_rewards |   -0.00 |    0.01 |   -0.23 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.26 |    0.00 |    1.79
seeker_angles |   -0.00   -0.00 |    0.10    0.10 |   -0.99   -0.97 |    1.00    0.97
cs_angles | -0.0008 -0.0044 |  0.0993  0.1015 | -0.9935 -0.9738 |  0.9992  0.9744
optical_flow |  0.0002  0.0001 |  0.0299  0.0260 | -1.8088 -0.9924 |  1.5045  1.0767
v_err    | -0.0100 |  0.0602 | -0.4625 |  0.1533
landing_rewards |    7.84 |    4.12 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.02    0.05 |    0.69    1.77 |   -1.53   -3.11 |    1.47    3.14
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.02 |   -0.06   -0.03   -0.04 |    0.06    0.03    0.05
w_rewards |   -0.00 |    0.01 |   -0.10 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.26 |    0.00 |    1.46
seeker_angles |   -0.00    0.00 |    0.10    0.10 |   -1.00   -1.00 |    1.00    0.99
cs_angles | -0.0004  0.0005 |  0.0986  0.1004 | -0.9974 -1.0000 |  0.9971  0.9942
optical_flow | -0.0001 -0.0001 |  0.0304  0.0255 | -1.3290 -1.0528 |  1.6037  1.3634
v_err    | -0.0098 |  0.0598 | -0.4521 |  0.1524
landing_rewards |    7.71 |    4.20 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.05
tracking_rewards |  -28.02 |    8.03 |  -66.78 |  -15.11
steps    |     376 |  

thrust   |   -0.00   -0.00   -0.00 |    0.75    0.77    0.77 |   -3.37   -3.38   -3.46 |    3.39    3.39    3.42
norm_thrust |    1.11 |    0.71 |    0.00 |    3.46
fuel     |    2.17 |    0.30 |    1.63 |    3.45
rewards  |  -25.89 |    8.86 |  -55.16 |  -11.00
fuel_rewards |   -6.22 |    0.85 |   -9.88 |   -4.67
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.95 |   12.95 |    0.01 |  641.49
norm_af  |    1.78 |    0.89 |    0.09 |    3.27
norm_wf  |    0.03 |    0.01 |    0.00 |    0.07
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.07   -0.00    0.11 |    1.16    0.66    1.86 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03    0.06 |    0.66

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0341   0.6955   3.4382  14.0225   7.9763   5.0627
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0009   0.0038   6.4661   2.1407   2.4885
Update Cnt = 630    ET =    877.8   Stats:  Mean, Std, Min, Max
r_f      |   -2.63   18.90    2.68 |  183.31  175.94  197.46 | -389.16 -385.54 -386.26 |  396.59  394.90  395.28
v_f      |    0.00   -0.01   -0.00 |    0.05    0.05    0.06 |   -0.13   -0.12   -0.14 |    0.15    0.14    0.14
r_i      |  -20.41   27.43   27.60 |  675.42  684.67  751.65 |-1236.99-1303.98-1366.23 | 1390.10 1316.53 1308.66
v_i      |    0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.10    0.09    0.09
norm_rf  |    0.46 |    0.21 |    0.03 |    1.46
norm_vf  |    0.09 |    0.02 |    0.04 |    0.18
gs_f     |    1.62 |    9.73 |    0.02 |  170.62
thrust   |    0.00    0.00   -0.00 |    0.76    0.77    0.75 |   -3.36   -3.36   -3.41 |    3.46    3.45    3.46
norm_thrust |    1

ADV1:  -0.0035769704738723854 0.014142521981845025 0.06846648514270787 -0.09943202976124392
ADV2:  0.023104723629164454 0.9354966276861443 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1576   1.2577   6.0894  14.0225   7.9763   5.0627
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0036   0.0022   0.0090   6.4661   2.1407   2.4885
***** Episode 19849, Mean R = -27.9  Std R = 9.7  Min R = -53.4
PolicyLoss: -0.00644
Policy_Beta: 0.0667
Policy_Entropy: 0.0819
Policy_KL: 0.000657
Policy_SD: 0.66
Policy_lr_mult: 1
Steps: 1.17e+04
TotalSteps: 6.56e+06
VF_0_ExplainedVarNew: 0.926
VF_0_ExplainedVarOld: 0.923
VF_0_Loss : 0.0759


ADV1:  -0.0016717390874783121 0.015063141666103692 0.12288824596735654 -0.1253940406157356
ADV2:  0.011934482746700996 0.9126233173652071 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3975   0.6480   3.3630  14.0225   7.9763   5.0627
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0012   0.0043   6.4661   2.1407   2.48

ADV1:  -0.0020609730643697116 0.015961776498845406 0.08390971961565755 -0.11852554308973612
ADV2:  0.013207922087516219 0.9431185925665141 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9218   0.4053   1.8907  14.0225   7.9763   5.0627
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0014   0.0051   6.4661   2.1407   2.4885
***** Episode 20128, Mean R = -28.8  Std R = 9.0  Min R = -46.5
PolicyLoss: -0.00809
Policy_Beta: 0.0667
Policy_Entropy: 0.0854
Policy_KL: 0.000743
Policy_SD: 0.658
Policy_lr_mult: 1
Steps: 1.15e+04
TotalSteps: 6.66e+06
VF_0_ExplainedVarNew: 0.909
VF_0_ExplainedVarOld: 0.905
VF_0_Loss : 0.0651


ADV1:  -0.0001434498240677361 0.015700812695105534 0.07582928987743431 -0.08645751492398203
ADV2:  0.004839938233978336 0.9411204422013667 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.6579   0.2773   1.6030  14.0225   7.9763   5.0627
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0020   6.4661   2.1407   2.

ADV1:  0.001247762661391032 0.013988622679422053 0.07727684885263447 -0.09278587745106642
ADV2:  -0.006524483400936827 0.9390421628831936 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2983   0.5988   3.1491  14.0225   7.9763   5.0627
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0011   0.0043   6.4661   2.1407   2.4885
***** Episode 20407, Mean R = -22.9  Std R = 7.6  Min R = -40.1
PolicyLoss: -0.00302
Policy_Beta: 0.0667
Policy_Entropy: 0.0897
Policy_KL: 0.000733
Policy_SD: 0.622
Policy_lr_mult: 1
Steps: 1.16e+04
TotalSteps: 6.77e+06
VF_0_ExplainedVarNew: 0.917
VF_0_ExplainedVarOld: 0.907
VF_0_Loss : 0.066


ADV1:  -0.0007430218654036141 0.014904276703875978 0.060045269259175575 -0.10870997494051748
ADV2:  0.009294635417009069 0.9339451379125195 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.1941   2.7012   9.7960  14.0225   7.9763   5.0627
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0019   6.4661   2.1407   2.4

ADV1:  -0.0016561517132574579 0.01469246935715065 0.0791191241347853 -0.0800489240357799
ADV2:  0.011819821962465206 0.9426017966824258 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2127   1.5021   4.9256  14.0225   7.9763   5.0627
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0011   0.0041   6.4661   2.1407   2.4885
***** Episode 20686, Mean R = -24.1  Std R = 8.5  Min R = -53.3
PolicyLoss: -0.00725
Policy_Beta: 0.0667
Policy_Entropy: 0.0905
Policy_KL: 0.000997
Policy_SD: 0.633
Policy_lr_mult: 1
Steps: 1.15e+04
TotalSteps: 6.87e+06
VF_0_ExplainedVarNew: 0.906
VF_0_ExplainedVarOld: 0.903
VF_0_Loss : 0.0584


ADV1:  -0.00011014721771073315 0.014258524176177933 0.06229606330394749 -0.08055399590806045
ADV2:  0.006681444427794974 0.9364048649708011 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.0530   1.4193   5.8835  14.0225   7.9763   5.0627
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0011   6.4661   2.1407   2.48

ADV1:  -0.0019552140809305555 0.013847176134270636 0.07212434575335872 -0.09394588931621131
ADV2:  0.02136139526042026 0.9089000760022806 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8272   0.4156   2.2324  14.0225   7.9763   5.0627
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0011   0.0050   6.4661   2.1407   2.4885
***** Episode 20965, Mean R = -21.9  Std R = 5.9  Min R = -34.2
PolicyLoss: -0.0147
Policy_Beta: 0.0667
Policy_Entropy: 0.0932
Policy_KL: 0.000739
Policy_SD: 0.616
Policy_lr_mult: 1
Steps: 1.16e+04
TotalSteps: 6.98e+06
VF_0_ExplainedVarNew: 0.909
VF_0_ExplainedVarOld: 0.902
VF_0_Loss : 0.0724


ADV1:  0.0015620064554706893 0.012581547179725268 0.0810666737018324 -0.07577219127970061
ADV2:  -0.004831725738658351 0.9222487714106299 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8518   0.4968   2.6666  14.0225   7.9763   5.0627
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0009   0.0041   6.4661   2.1407   2.488

ADV1:  -0.004212126905137304 0.01535431076859211 0.10072565119530516 -0.08446795131557933
ADV2:  0.016104188910843996 0.9479971945775231 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1425   0.6355   3.5271  14.0225   7.9763   5.0627
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0044   0.0025   0.0108   6.4661   2.1407   2.4885
***** Episode 21244, Mean R = -25.8  Std R = 8.0  Min R = -43.0
PolicyLoss: -0.000243
Policy_Beta: 0.0667
Policy_Entropy: 0.0966
Policy_KL: 0.000728
Policy_SD: 0.629
Policy_lr_mult: 1
Steps: 1.15e+04
TotalSteps: 7.08e+06
VF_0_ExplainedVarNew: 0.92
VF_0_ExplainedVarOld: 0.912
VF_0_Loss : 0.0731


ADV1:  0.0009120138726939381 0.013549547046757841 0.13435585856437687 -0.11821682810135081
ADV2:  -0.00500980142677494 0.9332726166823377 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.7426   0.2756   1.4877  14.0225   7.9763   5.0627
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0024   6.4661   2.1407   2.488

ADV1:  -3.8174859378079994e-05 0.012999142607733882 0.0658174715165076 -0.10702692273771808
ADV2:  0.009120398820780244 0.909147075469606 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.8701   2.8248   8.7608  14.0225   7.9763   5.0627
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0003   6.4661   2.1407   2.4885
***** Episode 21523, Mean R = -22.4  Std R = 7.8  Min R = -39.7
PolicyLoss: -0.0121
Policy_Beta: 0.0667
Policy_Entropy: 0.0997
Policy_KL: 0.00127
Policy_SD: 0.621
Policy_lr_mult: 1
Steps: 1.17e+04
TotalSteps: 7.19e+06
VF_0_ExplainedVarNew: 0.932
VF_0_ExplainedVarOld: 0.928
VF_0_Loss : 0.0805


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  -0.0008711739287179879 0.013180077559649773 0.07615170800904761 -0.09091833316938536
ADV2:  0.013356013706418443 0.914816588338355 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.6841   1.8550   7.8839  14.0225   7.9763   5.0627
ValFun  G

ADV1:  -0.0005145339065508165 0.012806152882359147 0.10685837381212654 -0.09289616059042213
ADV2:  0.008080231410813647 0.9275835867630227 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0940   0.3832   2.1812  14.0225   7.9763   5.0627
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0013   6.4661   2.1407   2.4885
***** Episode 21802, Mean R = -23.1  Std R = 8.0  Min R = -42.2
PolicyLoss: -0.0091
Policy_Beta: 0.0667
Policy_Entropy: 0.102
Policy_KL: 0.000674
Policy_SD: 0.625
Policy_lr_mult: 1
Steps: 1.16e+04
TotalSteps: 7.29e+06
VF_0_ExplainedVarNew: 0.943
VF_0_ExplainedVarOld: 0.94
VF_0_Loss : 0.058


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  0.0023012215293805593 0.01209630164973729 0.093664089177046 -0.07493597534003216
ADV2:  -0.004738785282394125 0.908987474223165 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.7785   0.2811   1.6728  14.0225   7.9763   5.0627
ValFun  Gradi

ADV1:  -0.003700248308107274 0.014552957151149324 0.05580199416754944 -0.08577960651400979
ADV2:  0.02792981789127572 0.9305813788471072 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0858   0.5667   3.0643  14.0225   7.9763   5.0627
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0039   0.0027   0.0096   6.4661   2.1407   2.4885
***** Episode 22081, Mean R = -23.5  Std R = 8.0  Min R = -39.6
PolicyLoss: -0.013
Policy_Beta: 0.0667
Policy_Entropy: 0.108
Policy_KL: 0.000811
Policy_SD: 0.605
Policy_lr_mult: 1
Steps: 1.17e+04
TotalSteps: 7.4e+06
VF_0_ExplainedVarNew: 0.923
VF_0_ExplainedVarOld: 0.914
VF_0_Loss : 0.0757


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  0.0035641154089184383 0.013976202960091081 0.06378784188262285 -0.09143826352482703
ADV2:  -0.012010189053692307 0.9363215432727651 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.5839   2.2625   8.1093  14.0225   7.9763   5.0627
ValFun  Gra

seeker_angles |   -0.00    0.00 |    0.09    0.09 |   -0.99   -1.00 |    0.98    1.00
cs_angles | -0.0027  0.0012 |  0.0895  0.0922 | -0.9879 -0.9980 |  0.9811  0.9959
optical_flow |  0.0000 -0.0000 |  0.0278  0.0260 | -1.2299 -1.2258 |  1.0991  1.4083
v_err    | -0.0086 |  0.0586 | -0.4530 |  0.1604
landing_rewards |    7.58 |    4.28 |    0.00 |   10.00
landing_margin |   -0.01 |    0.02 |   -0.06 |    0.08
tracking_rewards |  -23.92 |    6.60 |  -79.81 |  -13.59
steps    |     375 |      20 |     333 |     416
***** Episode 22360, Mean R = -22.8  Std R = 10.2  Min R = -53.4
PolicyLoss: -0.00974
Policy_Beta: 0.0667
Policy_Entropy: 0.111
Policy_KL: 0.000668
Policy_SD: 0.593
Policy_lr_mult: 1
Steps: 1.17e+04
TotalSteps: 7.5e+06
VF_0_ExplainedVarNew: 0.92
VF_0_ExplainedVarOld: 0.916
VF_0_Loss : 0.0654


ADV1:  -0.0006871064676672218 0.015545508276314667 0.08654832373883714 -0.0660380925656241
ADV2:  0.003960337392418513 0.9490943989070341 3.0 -3.0
 *** BROKE ***   8 0.004425862338393927

w        |   -0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.04    0.09 |    0.64    1.92 |   -1.33   -3.14 |    1.53    3.12
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.06   -0.03   -0.04 |    0.06    0.03    0.04
w_rewards |   -0.00 |    0.01 |   -0.08 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.26 |    0.00 |    1.49
seeker_angles |   -0.00   -0.00 |    0.09    0.09 |   -0.99   -0.98 |    0.99    1.00
cs_angles | -0.0024 -0.0008 |  0.0897  0.0930 | -0.9908 -0.9833 |  0.9867  0.9989
optical_flow | -0.0000  0.0001 |  0.0295  0.0252 | -1.4187 -1.0714 |  1.2906  1.1175
v_err    | -0.0087 |  0.0591 | -0.4520 |  0.1341
landing_rewards |    8.23 |    3.82 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.06
tracking_rewards |  -24.23 |    5.87 |  -52.65 |  -12.83
steps    |     375 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.06   -0.09 |    0.69    1.80 |   -1.49   -3.12 |    1.42    3.14
w_f      |   -0.00    0.00    0.00 |    0.03    0.01    0.01 |   -0.06   -0.03   -0.04 |    0.05    0.03    0.03
w_rewards |   -0.00 |    0.01 |   -0.13 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.26 |    0.00 |    1.54
seeker_angles |   -0.00   -0.00 |    0.09    0.09 |   -0.99   -0.99 |    1.00    0.99
cs_angles | -0.0014 -0.0010 |  0.0890  0.0911 | -0.9881 -0.9906 |  0.9981  0.9915
optical_flow |  0.0000 -0.0001 |  0.0287  0.0249 | -1.1073 -1.0738 |  1.4006  1.0663
v_err    | -0.0083 |  0.0582 | -0.4531 |  0.1466
landing_rewards |    8.39 |    3.68 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.07
tracking_rewards |  -23.66 |    5.70 |  -44.83 |  -12.66
steps    |     375 |  

attitude |    0.15   -0.02   -0.04 |    1.15    0.64    1.78 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.03   -0.08 |    0.64    1.76 |   -1.38   -3.14 |    1.50    3.14
w_f      |   -0.00   -0.00    0.00 |    0.03    0.01    0.01 |   -0.05   -0.03   -0.03 |    0.06    0.03    0.04
w_rewards |   -0.00 |    0.01 |   -0.07 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.26 |    0.00 |    1.64
seeker_angles |   -0.00   -0.00 |    0.09    0.09 |   -1.00   -0.99 |    1.00    0.98
cs_angles | -0.0015 -0.0014 |  0.0931  0.0880 | -0.9956 -0.9932 |  0.9962  0.9770
optical_flow |  0.0001 -0.0000 |  0.0276  0.0261 | -1.1261 -0.9943 |  1.3219  1.0765
v_err    | -0.0091 |  0.0590 | -0.4523 |  0.1284
landing_rewards |    8.13 |    3.90 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.03   -0.04    0.01 |    1.16    0.67    1.84 |   -3.14   -1.54   -3.14 |    3.14    1.55    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.06    0.00 |    0.69    1.83 |   -1.47   -3.13 |    1.48    3.14
w_f      |    0.00   -0.00    0.00 |    0.03    0.01    0.01 |   -0.06   -0.04   -0.04 |    0.06    0.03    0.04
w_rewards |   -0.00 |    0.01 |   -0.08 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.25 |    0.00 |    1.81
seeker_angles |    0.00   -0.00 |    0.09    0.09 |   -0.99   -0.99 |    1.00    1.00
cs_angles |  0.0006 -0.0030 |  0.0871  0.0889 | -0.9949 -0.9905 |  0.9990  0.9986
optical_flow |  0.0001 -0.0002 |  0.0271  0.0248 | -1.2249 -1.5958 |  1.0790  0.9523
v_err    | -0.0093 |  0.0592 | -0.4530 |  0.1418
landing_rewards |    7.58 |    4.28 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.02   -0.07 |    0.66    1.86 |   -1.54   -3.14 |    1.46    3.12
w_f      |    0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.04   -0.03 |    0.06    0.03    0.04
w_rewards |   -0.00 |    0.01 |   -0.08 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.26 |    0.00 |    1.40
seeker_angles |    0.00   -0.00 |    0.09    0.10 |   -0.99   -0.99 |    1.00    0.99
cs_angles |  0.0016 -0.0021 |  0.0857  0.0953 | -0.9863 -0.9896 |  0.9954  0.9903
optical_flow | -0.0000 -0.0001 |  0.0275  0.0268 | -1.0928 -1.3594 |  1.1722  1.3595
v_err    | -0.0095 |  0.0591 | -0.4529 |  0.1274
landing_rewards |    8.45 |    3.62 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.05
tracking_rewards |  -23.51 |    6.01 |  -49.66 |  -13.03
steps    |     374 |  

w        |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.03   -0.25 |    0.65    1.89 |   -1.52   -3.12 |    1.41    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.02   -0.03 |    0.06    0.04    0.03
w_rewards |   -0.00 |    0.01 |   -0.14 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.26 |    0.00 |    1.57
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -1.00 |    0.98    1.00
cs_angles |  0.0005  0.0006 |  0.0879  0.0919 | -0.9860 -0.9969 |  0.9833  0.9969
optical_flow | -0.0000  0.0001 |  0.0272  0.0261 | -1.4930 -1.0171 |  1.1745  1.2917
v_err    | -0.0095 |  0.0578 | -0.4937 |  0.1427
landing_rewards |    8.19 |    3.85 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.06
tracking_rewards |  -23.33 |    6.31 |  -76.89 |  -14.36
steps    |     377 |  

attitude |   -0.03   -0.01    0.12 |    1.13    0.61    1.83 |   -3.14   -1.51   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01   -0.04 |    0.63    1.84 |   -1.41   -3.14 |    1.49    3.11
w_f      |    0.00   -0.00    0.00 |    0.03    0.01    0.01 |   -0.06   -0.04   -0.03 |    0.05    0.03    0.03
w_rewards |   -0.00 |    0.01 |   -0.10 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.26 |    0.00 |    1.55
seeker_angles |   -0.00   -0.00 |    0.09    0.10 |   -1.00   -0.98 |    1.00    0.99
cs_angles | -0.0000 -0.0018 |  0.0851  0.0951 | -1.0000 -0.9782 |  0.9959  0.9928
optical_flow | -0.0000 -0.0000 |  0.0282  0.0255 | -1.3836 -0.9098 |  1.1185  1.2393
v_err    | -0.0093 |  0.0583 | -0.4522 |  0.1470
landing_rewards |    8.19 |    3.85 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04   -0.06 |    0.63    1.83 |   -1.49   -3.14 |    1.49    3.10
w_f      |   -0.00    0.00   -0.00 |    0.03    0.01    0.01 |   -0.05   -0.03   -0.03 |    0.05    0.03    0.04
w_rewards |   -0.00 |    0.01 |   -0.08 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.25 |    0.00 |    1.59
seeker_angles |    0.00   -0.00 |    0.09    0.09 |   -0.99   -0.99 |    1.00    1.00
cs_angles |  0.0024 -0.0016 |  0.0858  0.0887 | -0.9940 -0.9933 |  0.9997  0.9963
optical_flow | -0.0001 -0.0000 |  0.0272  0.0256 | -1.2578 -1.2764 |  1.2347  1.0028
v_err    | -0.0095 |  0.0587 | -0.4529 |  0.1320
landing_rewards |    8.71 |    3.35 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.05
tracking_rewards |  -22.74 |    5.36 |  -43.19 |  -13.26
steps    |     376 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.05   -0.11 |    0.66    1.82 |   -1.43   -3.12 |    1.48    3.14
w_f      |   -0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.03 |    0.06    0.03    0.04
w_rewards |   -0.00 |    0.01 |   -0.09 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.26 |    0.00 |    1.57
seeker_angles |    0.00   -0.00 |    0.09    0.09 |   -0.99   -0.99 |    0.99    1.00
cs_angles |  0.0019 -0.0003 |  0.0857  0.0900 | -0.9927 -0.9926 |  0.9891  0.9959
optical_flow |  0.0001 -0.0001 |  0.0266  0.0265 | -1.1599 -1.0236 |  1.1493  1.2796
v_err    | -0.0095 |  0.0591 | -0.4521 |  0.1336
landing_rewards |    8.26 |    3.79 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.05
tracking_rewards |  -22.69 |    5.42 |  -56.43 |  -13.97
steps    |     377 |  

w        |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.02   -0.32 |    0.64    1.89 |   -1.46   -3.11 |    1.49    3.10
w_f      |    0.00    0.00   -0.00 |    0.03    0.01    0.01 |   -0.05   -0.03   -0.03 |    0.06    0.04    0.04
w_rewards |   -0.00 |    0.01 |   -0.12 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.26 |    0.00 |    1.47
seeker_angles |   -0.00    0.00 |    0.09    0.09 |   -0.99   -1.00 |    0.97    1.00
cs_angles | -0.0005  0.0001 |  0.0865  0.0896 | -0.9907 -0.9968 |  0.9730  0.9990
optical_flow | -0.0000 -0.0001 |  0.0265  0.0262 | -0.9570 -1.3918 |  1.0364  1.4301
v_err    | -0.0093 |  0.0584 | -0.4522 |  0.1304
landing_rewards |    8.55 |    3.52 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.06
tracking_rewards |  -22.51 |    5.36 |  -44.77 |  -13.14
steps    |     375 |  

attitude |    0.03    0.06    0.02 |    1.19    0.66    1.87 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.08    0.12 |    0.68    1.84 |   -1.50   -3.13 |    1.49    3.13
w_f      |   -0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.03 |    0.06    0.03    0.04
w_rewards |   -0.00 |    0.01 |   -0.07 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.27 |    0.00 |    1.51
seeker_angles |    0.00   -0.00 |    0.09    0.09 |   -0.99   -0.99 |    1.00    1.00
cs_angles |  0.0000 -0.0006 |  0.0885  0.0929 | -0.9872 -0.9912 |  0.9971  0.9985
optical_flow |  0.0000  0.0001 |  0.0275  0.0255 | -1.1310 -0.9246 |  1.0299  1.1831
v_err    | -0.0100 |  0.0585 | -0.4988 |  0.1362
landing_rewards |    8.48 |    3.59 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.07    0.02   -0.17 |    1.18    0.64    1.90 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.17 |    0.65    1.89 |   -1.56   -3.14 |    1.52    3.11
w_f      |   -0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.04 |    0.05    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.06 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.26 |    0.00 |    1.53
seeker_angles |   -0.01    0.00 |    0.08    0.09 |   -0.99   -1.00 |    0.99    0.98
cs_angles | -0.0059  0.0004 |  0.0846  0.0905 | -0.9921 -0.9994 |  0.9855  0.9812
optical_flow | -0.0000 -0.0000 |  0.0279  0.0261 | -1.1394 -0.9681 |  1.0809  1.1873
v_err    | -0.0096 |  0.0582 | -0.4525 |  0.1175
landing_rewards |    8.74 |    3.32 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.06 |    0.67    1.80 |   -1.54   -3.14 |    1.53    3.11
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.02   -0.04 |    0.05    0.03    0.03
w_rewards |   -0.00 |    0.01 |   -0.06 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.26 |    0.00 |    1.43
seeker_angles |   -0.00   -0.00 |    0.09    0.09 |   -0.99   -0.95 |    1.00    0.99
cs_angles | -0.0005 -0.0002 |  0.0855  0.0904 | -0.9949 -0.9532 |  0.9958  0.9888
optical_flow | -0.0000  0.0000 |  0.0288  0.0255 | -1.2304 -1.0498 |  1.4703  0.9739
v_err    | -0.0100 |  0.0587 | -0.4844 |  0.1257
landing_rewards |    9.10 |    2.87 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.05
tracking_rewards |  -22.12 |    5.52 |  -45.85 |  -11.71
steps    |     375 |  

w        |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03   -0.07 |    0.67    1.82 |   -1.45   -3.14 |    1.40    3.10
w_f      |    0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.03 |    0.05    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.25 |    0.00 |    1.62
seeker_angles |   -0.00   -0.00 |    0.08    0.09 |   -0.99   -0.98 |    0.97    0.99
cs_angles | -0.0002 -0.0016 |  0.0848  0.0851 | -0.9868 -0.9803 |  0.9749  0.9889
optical_flow |  0.0000 -0.0001 |  0.0270  0.0258 | -1.1381 -1.3376 |  1.5766  1.1370
v_err    | -0.0098 |  0.0590 | -0.4526 |  0.1202
landing_rewards |    8.55 |    3.52 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.04
tracking_rewards |  -21.72 |    4.90 |  -42.90 |  -13.31
steps    |     375 |  

attitude |   -0.06    0.10    0.05 |    1.24    0.65    1.88 |   -3.14   -1.57   -3.14 |    3.14    1.52    3.14
w        |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.10    0.09 |    0.66    1.86 |   -1.53   -3.13 |    1.46    3.11
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.03 |    0.05    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.27 |    0.00 |    1.63
seeker_angles |   -0.00    0.00 |    0.08    0.10 |   -0.99   -1.00 |    0.99    1.00
cs_angles | -0.0022  0.0005 |  0.0848  0.0973 | -0.9947 -0.9985 |  0.9919  0.9961
optical_flow | -0.0001  0.0001 |  0.0274  0.0258 | -1.1251 -1.0916 |  1.1689  0.9960
v_err    | -0.0100 |  0.0590 | -0.4520 |  0.1441
landing_rewards |    8.65 |    3.42 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.04   -0.02   -0.05 |    1.16    0.66    1.84 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |   -0.02   -0.14 |    0.65    1.82 |   -1.40   -3.14 |    1.35    3.14
w_f      |   -0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.03 |    0.05    0.03    0.03
w_rewards |   -0.00 |    0.01 |   -0.10 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.26 |    0.00 |    1.78
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -0.99 |    0.99    0.93
cs_angles |  0.0036  0.0007 |  0.0866  0.0891 | -0.9859 -0.9919 |  0.9926  0.9314
optical_flow |  0.0000  0.0000 |  0.0270  0.0243 | -1.0065 -0.9035 |  1.1270  0.9479
v_err    | -0.0103 |  0.0585 | -0.4530 |  0.1202
landing_rewards |    8.58 |    3.49 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01   -0.03 |    0.67    1.75 |   -1.41   -3.14 |    1.43    3.10
w_f      |    0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.06   -0.03   -0.03 |    0.05    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.06 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.26 |    0.00 |    1.61
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -1.00 |    0.99    0.97
cs_angles |  0.0015  0.0022 |  0.0857  0.0895 | -0.9944 -0.9977 |  0.9894  0.9724
optical_flow | -0.0000 -0.0001 |  0.0272  0.0266 | -1.1322 -1.4876 |  1.2259  1.1248
v_err    | -0.0099 |  0.0586 | -0.4520 |  0.1327
landing_rewards |    8.52 |    3.55 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.06
tracking_rewards |  -21.88 |    5.09 |  -45.20 |  -12.39
steps    |     375 |  

attitude |    0.01    0.00   -0.01 |    1.17    0.68    1.84 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.01   -0.02 |    0.68    1.84 |   -1.44   -3.13 |    1.46    3.14
w_f      |    0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.03   -0.03 |    0.06    0.03    0.03
w_rewards |   -0.00 |    0.01 |   -0.07 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.25 |    0.00 |    1.54
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    1.00    0.99
cs_angles |  0.0020  0.0032 |  0.0818  0.0846 | -0.9936 -0.9885 |  0.9986  0.9880
optical_flow | -0.0000 -0.0000 |  0.0272  0.0245 | -1.0580 -0.9061 |  1.1959  1.1460
v_err    | -0.0096 |  0.0587 | -0.4521 |  0.1216
landing_rewards |    8.81 |    3.24 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.00    0.01   -0.01 |    1.23    0.65    1.90 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.01 |   -0.05   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.01   -0.04 |    0.67    1.90 |   -1.43   -3.14 |    1.42    3.13
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.04 |    0.06    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.06 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.26 |    0.00 |    1.60
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.99   -0.99 |    0.99    1.00
cs_angles |  0.0035  0.0031 |  0.0848  0.0899 | -0.9872 -0.9851 |  0.9882  0.9965
optical_flow | -0.0001 -0.0000 |  0.0268  0.0255 | -0.8789 -0.9359 |  0.8476  1.0114
v_err    | -0.0100 |  0.0584 | -0.4530 |  0.1286
landing_rewards |    9.06 |    2.91 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00   -0.00    0.00 |    0.01    0.00    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00   -0.04 |    0.63    1.91 |   -1.45   -3.11 |    1.44    3.07
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.02   -0.02 |    0.05    0.03    0.03
w_rewards |   -0.00 |    0.01 |   -0.14 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.26 |    0.00 |    1.62
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.98   -0.99 |    0.99    1.00
cs_angles |  0.0016  0.0023 |  0.0835  0.0875 | -0.9849 -0.9943 |  0.9937  0.9994
optical_flow | -0.0001 -0.0001 |  0.0273  0.0257 | -1.1350 -0.9818 |  1.1339  1.0880
v_err    | -0.0096 |  0.0582 | -0.4513 |  0.1177
landing_rewards |    9.00 |    3.00 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.04
tracking_rewards |  -21.37 |    4.75 |  -39.05 |  -12.41
steps    |     377 |  

w        |    0.00   -0.00    0.00 |    0.01    0.00    0.01 |   -0.05   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.03   -0.04 |    0.74    1.93 |   -1.43   -3.14 |    1.54    3.14
w_f      |   -0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.06    0.02    0.03
w_rewards |   -0.00 |    0.01 |   -0.08 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.24 |    0.00 |    1.60
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -1.00 |    1.00    0.98
cs_angles |  0.0023  0.0033 |  0.0796  0.0832 | -0.9997 -0.9998 |  0.9999  0.9796
optical_flow |  0.0001  0.0000 |  0.0264  0.0247 | -1.1419 -1.3010 |  1.1943  0.9827
v_err    | -0.0093 |  0.0585 | -0.4531 |  0.1413
landing_rewards |    9.03 |    2.96 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.05
tracking_rewards |  -20.37 |    4.36 |  -41.27 |  -11.57
steps    |     376 |  

w        |    0.00    0.00    0.00 |    0.01    0.00    0.01 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.05 |    0.65    1.86 |   -1.52   -3.13 |    1.45    3.13
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.02   -0.03 |    0.05    0.03    0.03
w_rewards |   -0.00 |    0.01 |   -0.08 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.26 |    0.00 |    1.63
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.99   -0.99 |    0.99    1.00
cs_angles |  0.0028  0.0043 |  0.0849  0.0871 | -0.9937 -0.9854 |  0.9907  0.9993
optical_flow | -0.0000 -0.0000 |  0.0268  0.0255 | -1.1901 -1.0049 |  1.0005  0.8700
v_err    | -0.0096 |  0.0590 | -0.4894 |  0.1188
landing_rewards |    8.84 |    3.20 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.03
tracking_rewards |  -21.40 |    4.91 |  -38.66 |  -12.11
steps    |     375 |  

w        |   -0.00    0.00    0.00 |    0.01    0.00    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.05    0.17 |    0.66    1.87 |   -1.44   -3.11 |    1.46    3.13
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.05    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.25 |    0.00 |    1.53
seeker_angles |    0.00    0.01 |    0.08    0.09 |   -0.99   -0.99 |    1.00    1.00
cs_angles |  0.0025  0.0066 |  0.0797  0.0879 | -0.9922 -0.9945 |  0.9994  1.0000
optical_flow | -0.0000  0.0001 |  0.0265  0.0241 | -1.0266 -0.9616 |  1.3148  1.2221
v_err    | -0.0094 |  0.0583 | -0.4525 |  0.1187
landing_rewards |    9.03 |    2.96 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.03
tracking_rewards |  -20.93 |    4.74 |  -36.87 |  -11.29
steps    |     377 |  

attitude |    0.11   -0.03    0.08 |    1.21    0.69    1.91 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04    0.12 |    0.68    1.87 |   -1.44   -3.12 |    1.49    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.02 |    0.05    0.03    0.04
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.25 |    0.00 |    1.49
seeker_angles |    0.01    0.00 |    0.08    0.09 |   -1.00   -0.99 |    1.00    0.98
cs_angles |  0.0060  0.0049 |  0.0815  0.0851 | -0.9965 -0.9949 |  0.9992  0.9830
optical_flow |  0.0000 -0.0001 |  0.0251  0.0251 | -1.0567 -1.2450 |  0.9926  1.0884
v_err    | -0.0096 |  0.0585 | -0.4533 |  0.1404
landing_rewards |    9.23 |    2.67 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.09    0.00   -0.02 |    1.18    0.68    1.81 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00   -0.20 |    0.68    1.79 |   -1.53   -3.13 |    1.46    3.14
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.03 |    0.05    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.25 |    0.00 |    1.51
seeker_angles |    0.01    0.00 |    0.08    0.09 |   -0.99   -0.98 |    1.00    0.99
cs_angles |  0.0077  0.0041 |  0.0807  0.0855 | -0.9945 -0.9839 |  0.9994  0.9923
optical_flow |  0.0001  0.0000 |  0.0272  0.0245 | -1.2147 -1.1033 |  1.2266  1.2069
v_err    | -0.0095 |  0.0583 | -0.4525 |  0.1127
landing_rewards |    9.10 |    2.87 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.11    0.00   -0.08 |    1.10    0.66    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.05 |    0.67    1.84 |   -1.49   -3.14 |    1.50    3.10
w_f      |    0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.05    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.25 |    0.00 |    1.60
seeker_angles |    0.01    0.00 |    0.08    0.09 |   -0.99   -1.00 |    1.00    0.99
cs_angles |  0.0052  0.0030 |  0.0835  0.0857 | -0.9897 -0.9966 |  0.9957  0.9857
optical_flow | -0.0002 -0.0001 |  0.0281  0.0264 | -1.5340 -0.9929 |  1.5986  1.3847
v_err    | -0.0091 |  0.0584 | -0.4522 |  0.1138
landing_rewards |    9.10 |    2.87 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00   -0.00    0.00 |    0.01    0.00    0.01 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.00 |    0.68    1.85 |   -1.46   -3.14 |    1.54    3.14
w_f      |    0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.02 |    0.05    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.24 |    0.00 |    1.59
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    1.00    0.99
cs_angles |  0.0032  0.0023 |  0.0785  0.0825 | -0.9996 -0.9915 |  0.9984  0.9894
optical_flow |  0.0001 -0.0000 |  0.0267  0.0259 | -1.2957 -1.1403 |  1.1723  1.0629
v_err    | -0.0090 |  0.0585 | -0.4997 |  0.1231
landing_rewards |    9.13 |    2.82 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.04
tracking_rewards |  -19.80 |    4.34 |  -44.83 |  -11.91
steps    |     378 |  

thrust   |   -0.00    0.00    0.00 |    0.68    0.69    0.68 |   -3.33   -3.45   -3.46 |    3.46    3.35    3.38
norm_thrust |    0.92 |    0.75 |    0.00 |    3.46
fuel     |    1.61 |    0.21 |    1.16 |    2.51
rewards  |  -15.93 |    6.47 |  -65.23 |   -6.11
fuel_rewards |   -4.61 |    0.61 |   -7.19 |   -3.33
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.83 |   12.60 |    0.00 |  261.68
norm_af  |    1.75 |    0.89 |    0.09 |    3.23
norm_wf  |    0.02 |    0.01 |    0.00 |    0.06
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.04    0.00   -0.16 |    1.20    0.64    1.87 |   -3.14   -1.56   -3.14 |    3.14    1.54    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.14 |    0.64

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   5.9301   3.2219  11.1734  21.2416  12.7737   7.7427
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0004   0.0016   6.4661   2.1407   2.4885
Update Cnt = 1010    ET =   1082.5   Stats:  Mean, Std, Min, Max
r_f      |    2.77  -10.21   -9.87 |  195.53  163.67  198.53 | -395.84 -360.92 -391.19 |  393.28  374.68  371.22
v_f      |   -0.00    0.00    0.00 |    0.05    0.04    0.05 |   -0.11   -0.12   -0.10 |    0.11    0.10    0.09
r_i      |    9.03  -30.85  -64.26 |  725.15  633.17  749.72 |-1342.07-1318.93-1311.36 | 1320.68 1249.36 1217.01
v_i      |   -0.00    0.00    0.00 |    0.05    0.04    0.05 |   -0.10   -0.09   -0.09 |    0.09    0.09    0.09
norm_rf  |    0.26 |    0.10 |    0.03 |    0.54
norm_vf  |    0.08 |    0.01 |    0.04 |    0.14
gs_f     |    1.13 |    1.47 |    0.02 |   12.09
thrust   |   -0.00    0.00   -0.00 |    0.67    0.69    0.67 |   -3.45   -3.46   -3.46 |    3.46    3.36    3.44
norm_thrust |    

ADV1:  -0.003465845517049415 0.011138208976119654 0.04780384586791231 -0.07858166514157014
ADV2:  0.04524095717918448 0.8663526355214978 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1283   1.3449   6.3872  21.2416  12.7737   7.7427
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0040   0.0023   0.0089   6.4661   2.1407   2.4885
***** Episode 31629, Mean R = -18.0  Std R = 6.7  Min R = -37.4
PolicyLoss: -0.029
Policy_Beta: 0.1
Policy_Entropy: 0.138
Policy_KL: 0.00111
Policy_SD: 0.577
Policy_lr_mult: 0.444
Steps: 1.15e+04
TotalSteps: 1.1e+07
VF_0_ExplainedVarNew: 0.961
VF_0_ExplainedVarOld: 0.957
VF_0_Loss : 0.000192


ADV1:  -0.001363986952271042 0.01206897295159869 0.052325631015909535 -0.07726361581669458
ADV2:  0.023763997719316473 0.8979889304898813 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   7.2691   4.1616  13.5765  21.2416  12.7737   7.7427
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0015   0.0055   6.4661   2.1407   2.4885


***** Episode 31877, Mean R = -16.7  Std R = 5.7  Min R = -35.0
PolicyLoss: -0.0173
Policy_Beta: 0.0667
Policy_Entropy: 0.142
Policy_KL: 0.000692
Policy_SD: 0.559
Policy_lr_mult: 0.444
Steps: 1.17e+04
TotalSteps: 1.11e+07
VF_0_ExplainedVarNew: 0.955
VF_0_ExplainedVarOld: 0.949
VF_0_Loss : 0.000407


ADV1:  -0.001204493521384316 0.010606172380517944 0.04735363413890207 -0.06794961032166158
ADV2:  0.02229868892352102 0.905596298989456 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.1830   2.1033   7.9307  21.2416  12.7737   7.7427
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0033   6.4661   2.1407   2.4885
***** Episode 31908, Mean R = -16.4  Std R = 6.2  Min R = -29.6
PolicyLoss: -0.017
Policy_Beta: 0.0667
Policy_Entropy: 0.14
Policy_KL: 0.000699
Policy_SD: 0.566
Policy_lr_mult: 0.444
Steps: 1.17e+04
TotalSteps: 1.11e+07
VF_0_ExplainedVarNew: 0.957
VF_0_ExplainedVarOld: 0.952
VF_0_Loss : 0.000319


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5410   1.3200   6.2367  21.2416  12.7737   7.7427
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0004   0.0018   6.4661   2.1407   2.4885
***** Episode 32156, Mean R = -15.7  Std R = 5.9  Min R = -30.5
PolicyLoss: -0.0239
Policy_Beta: 0.0667
Policy_Entropy: 0.141
Policy_KL: 0.000669
Policy_SD: 0.557
Policy_lr_mult: 0.444
Steps: 1.18e+04
TotalSteps: 1.12e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.963
VF_0_Loss : 0.00101


ADV1:  0.0006678486782365794 0.00696899198861332 0.04641127982469101 -0.057443648101006994
ADV2:  0.011032033141581703 0.8630730380500004 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.7562   2.4165   8.1223  21.2416  12.7737   7.7427
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0004   0.0017   6.4661   2.1407   2.4885
***** Episode 32187, Mean R = -14.8  Std R = 5.4  Min R = -30.6
PolicyLoss: -0.0205
Policy_Beta: 0.0667
Policy_Entropy: 0.142
Policy_KL: 0.00

ADV1:  0.0030796962765622963 0.008787567897231289 0.04349913345804585 -0.09437627923736558
ADV2:  -0.006216756790736294 0.8497821110908635 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9327   1.2217   4.9609  21.2416  12.7737   7.7427
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0033   0.0021   0.0080   6.4661   2.1407   2.4885
***** Episode 32435, Mean R = -16.3  Std R = 6.0  Min R = -34.1
PolicyLoss: -0.0268
Policy_Beta: 0.0667
Policy_Entropy: 0.142
Policy_KL: 0.000594
Policy_SD: 0.57
Policy_lr_mult: 0.444
Steps: 1.17e+04
TotalSteps: 1.13e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.97
VF_0_Loss : 0.0135


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  -0.0020594522508190507 0.010024192468480351 0.039547558999361576 -0.07322878687462114
ADV2:  0.036930271765987746 0.8700384555332255 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.4301   1.7341   7.2301  21.2416  12.7737   7.7427
ValF

ADV1:  0.002297265999722204 0.010473845369722862 0.05580525061104885 -0.08813047987998329
ADV2:  -0.00282715952996821 0.8859519694157014 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5222   0.5403   2.5366  21.2416  12.7737   7.7427
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0017   0.0061   6.4661   2.1407   2.4885
***** Episode 32714, Mean R = -15.8  Std R = 5.8  Min R = -27.9
PolicyLoss: -0.0213
Policy_Beta: 0.1
Policy_Entropy: 0.144
Policy_KL: 0.00127
Policy_SD: 0.556
Policy_lr_mult: 0.444
Steps: 1.17e+04
TotalSteps: 1.14e+07
VF_0_ExplainedVarNew: 0.954
VF_0_ExplainedVarOld: 0.95
VF_0_Loss : 0.00329


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  0.0009502867493882261 0.008677385846126944 0.0672760868081913 -0.046615071203324344
ADV2:  0.006920307656107053 0.9043758696648189 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5974   0.7098   3.3486  21.2416  12.7737   7.7427
ValFun  Gr

Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  -0.0006121568298921118 0.00928658149846835 0.04601775565052213 -0.08820061355839542
ADV2:  0.027713215405125762 0.8531218859180955 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5333   1.1055   5.7862  21.2416  12.7737   7.7427
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0016   6.4661   2.1407   2.4885
***** Episode 32993, Mean R = -14.8  Std R = 5.2  Min R = -28.2
PolicyLoss: -0.0278
Policy_Beta: 0.1
Policy_Entropy: 0.144
Policy_KL: 0.00108
Policy_SD: 0.547
Policy_lr_mult: 0.444
Steps: 1.18e+04
TotalSteps: 1.15e+07
VF_0_ExplainedVarNew: 0.962
VF_0_ExplainedVarOld: 0.959
VF_0_Loss : 0.000308


ADV1:  0.00042165906524765906 0.009192694351663151 0.06665040917593107 -0.07087234346936568
ADV2:  0.01607217131460359 0.8285776164946411 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5338   0.8091   3.8749  21.2416  12.7737   7.7427
ValFun 

ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0017   0.0062   6.4661   2.1407   2.4885
***** Episode 33241, Mean R = -15.5  Std R = 6.0  Min R = -31.8
PolicyLoss: -0.0146
Policy_Beta: 0.0198
Policy_Entropy: 0.146
Policy_KL: 0.00592
Policy_SD: 0.548
Policy_lr_mult: 0.296
Steps: 1.18e+04
TotalSteps: 1.16e+07
VF_0_ExplainedVarNew: 0.951
VF_0_ExplainedVarOld: 0.944
VF_0_Loss : 0.00203


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  0.0020576158514446674 0.007498562069112092 0.05944378763155883 -0.0768374645709991
ADV2:  -0.00842323743088129 0.8773336464383411 3.0 -3.0
 *** BROKE ***   1 0.005267000291496515
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :  14.4224  12.6669  27.0893  27.0893  14.4224  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0013   0.0054   6.4661   2.1407   2.4885
***** Episode 33272, Mean R = -15.2  Std R = 5.6  Min R = -30.6
PolicyLoss: 0.00192
Policy_Beta: 0.0132
Policy_En

cs_angles |  0.0036 -0.0028 |  0.0814  0.0860 | -0.9895 -0.9939 |  0.9944  0.9743
optical_flow | -0.0000 -0.0001 |  0.0268  0.0244 | -1.2812 -0.9476 |  1.1160  1.3413
v_err    | -0.0096 |  0.0586 | -0.4520 |  0.1133
landing_rewards |    9.35 |    2.46 |    0.00 |   10.00
landing_margin |   -0.03 |    0.02 |   -0.07 |    0.03
tracking_rewards |  -20.12 |    4.43 |  -37.44 |  -11.60
steps    |     376 |      20 |     328 |     418
***** Episode 33520, Mean R = -15.7  Std R = 6.6  Min R = -33.4
PolicyLoss: -0.0215
Policy_Beta: 0.114
Policy_Entropy: 0.145
Policy_KL: 0.000458
Policy_SD: 0.565
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.17e+07
VF_0_ExplainedVarNew: 0.956
VF_0_ExplainedVarOld: 0.953
VF_0_Loss : 0.00443


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  0.005362675596301796 0.008724806100391443 0.04740611895737884 -0.055397662603194675
ADV2:  -0.03486288833453262 0.9200664419211377 3.0 -3.0
Policy  Gradients: u/sd/Max/

w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.05 |    0.68    1.93 |   -1.45   -3.14 |    1.40    3.14
w_f      |    0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.05    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.24 |    0.00 |    1.73
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.97   -0.99 |    0.99    0.98
cs_angles |  0.0009  0.0025 |  0.0785  0.0835 | -0.9719 -0.9903 |  0.9875  0.9849
optical_flow | -0.0000 -0.0002 |  0.0256  0.0243 | -1.6778 -1.3267 |  1.0384  1.1377
v_err    | -0.0092 |  0.0585 | -0.4524 |  0.1166
landing_rewards |    9.13 |    2.82 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -19.48 |    4.12 |  -34.60 |  -12.14
steps    |     376 |  

thrust   |   -0.00   -0.00   -0.00 |    0.67    0.68    0.69 |   -3.46   -3.46   -3.36 |    3.45    3.33    3.34
norm_thrust |    0.90 |    0.75 |    0.00 |    3.46
fuel     |    1.57 |    0.19 |    1.13 |    2.25
rewards  |  -14.94 |    5.59 |  -36.92 |   -6.48
fuel_rewards |   -4.51 |    0.55 |   -6.44 |   -3.24
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.87 |   12.68 |    0.01 |  280.17
norm_af  |    1.71 |    0.87 |    0.01 |    3.22
norm_wf  |    0.02 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.02    0.03    0.03 |    1.13    0.65    1.80 |   -3.14   -1.50   -3.14 |    3.14    1.55    3.14
w        |   -0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03   -0.06 |    0.64

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4538   0.4858   2.9085  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0015   0.0057   6.4661   2.1407   2.4885
Update Cnt = 1110    ET =   1150.3   Stats:  Mean, Std, Min, Max
r_f      |   -5.67  -14.16  -15.44 |  186.11  181.72  202.14 | -393.66 -390.79 -382.83 |  381.09  397.07  362.78
v_f      |    0.01    0.00    0.00 |    0.04    0.04    0.05 |   -0.08   -0.09   -0.12 |    0.10    0.10    0.11
r_i      |  -31.14  -46.94  -54.37 |  690.03  660.29  766.49 |-1279.23-1342.95-1337.64 | 1333.39 1249.74 1361.37
v_i      |    0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.10    0.10
norm_rf  |    0.24 |    0.10 |    0.02 |    0.54
norm_vf  |    0.07 |    0.01 |    0.04 |    0.12
gs_f     |    1.25 |    1.77 |    0.01 |   17.45
thrust   |   -0.00   -0.01   -0.01 |    0.67    0.68    0.68 |   -3.44   -3.42   -3.35 |    3.45    3.38    3.44
norm_thrust |    

ADV1:  -0.00012116089752409234 0.011662308169308593 0.05361540845949814 -0.0724859529781226
ADV2:  0.013371727305155325 0.9125959017402095 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.7250   0.1908   1.2468  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0004   0.0016   6.4661   2.1407   2.4885
***** Episode 34729, Mean R = -16.3  Std R = 5.4  Min R = -27.7
PolicyLoss: -0.0155
Policy_Beta: 0.114
Policy_Entropy: 0.145
Policy_KL: 0.000702
Policy_SD: 0.555
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 1.22e+07
VF_0_ExplainedVarNew: 0.958
VF_0_ExplainedVarOld: 0.946
VF_0_Loss : 0.000359


ADV1:  -0.0019228905895694105 0.009393406007942902 0.061611331388165935 -0.07521564453840252
ADV2:  0.03378847419422082 0.8646611322493044 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7444   0.7061   3.1790  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0014   0.0050   6.4661   2.1407  

***** Episode 34977, Mean R = -15.1  Std R = 5.9  Min R = -31.1
PolicyLoss: -0.0157
Policy_Beta: 0.114
Policy_Entropy: 0.145
Policy_KL: 0.00135
Policy_SD: 0.548
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.22e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.962
VF_0_Loss : 0.000845


ADV1:  0.002307837183810015 0.00844134865480658 0.05796463420309461 -0.05648570822968706
ADV2:  0.0012147642645616295 0.8568939115815605 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3829   0.5666   2.8791  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0030   0.0018   0.0064   6.4661   2.1407   2.4885
***** Episode 35008, Mean R = -15.3  Std R = 5.6  Min R = -31.1
PolicyLoss: -0.025
Policy_Beta: 0.114
Policy_Entropy: 0.144
Policy_KL: 0.00116
Policy_SD: 0.565
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.23e+07
VF_0_ExplainedVarNew: 0.973
VF_0_ExplainedVarOld: 0.97
VF_0_Loss : 0.000245


ADV1:  -0.0015235002636313426 0.007220850074461698 0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8065   0.8964   4.4511  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0012   0.0042   6.4661   2.1407   2.4885
***** Episode 35256, Mean R = -17.4  Std R = 7.7  Min R = -42.9
PolicyLoss: -0.0101
Policy_Beta: 0.114
Policy_Entropy: 0.147
Policy_KL: 0.00103
Policy_SD: 0.556
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 1.24e+07
VF_0_ExplainedVarNew: 0.956
VF_0_ExplainedVarOld: 0.952
VF_0_Loss : 0.000883


ADV1:  0.0035367428992154567 0.010403388591432108 0.056192996984040955 -0.0768935044685915
ADV2:  -0.00956188884593638 0.893970206891621 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2676   0.5413   2.4159  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0044   0.0027   0.0097   6.4661   2.1407   2.4885
***** Episode 35287, Mean R = -16.0  Std R = 5.7  Min R = -30.1
PolicyLoss: -0.02
Policy_Beta: 0.114
Policy_Entropy: 0.146
Policy_KL: 0.000911


ADV1:  -0.0019988457261774575 0.008878312872340581 0.06138693182596114 -0.07869117349407644
ADV2:  0.03552675419960261 0.8341529423647565 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9182   0.3826   2.1434  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0014   0.0053   6.4661   2.1407   2.4885
***** Episode 35535, Mean R = -14.5  Std R = 4.9  Min R = -25.9
PolicyLoss: -0.0226
Policy_Beta: 0.114
Policy_Entropy: 0.144
Policy_KL: 0.0013
Policy_SD: 0.553
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 1.25e+07
VF_0_ExplainedVarNew: 0.969
VF_0_ExplainedVarOld: 0.963
VF_0_Loss : 0.0058


ADV1:  0.003426363172430152 0.006713567703555438 0.04290751511088587 -0.05389263645638903
ADV2:  -0.027283422233161634 0.9137614426057027 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6528   0.9889   4.7022  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0022   0.0089   6.4661   2.1407   2.488

***** Episode 35783, Mean R = -14.7  Std R = 5.5  Min R = -31.0
PolicyLoss: -0.0272
Policy_Beta: 0.114
Policy_Entropy: 0.148
Policy_KL: 0.000959
Policy_SD: 0.541
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 1.26e+07
VF_0_ExplainedVarNew: 0.971
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 0.00228


ADV1:  5.072498306918018e-06 0.005979179230110457 0.041448886208690236 -0.06283356897986092
ADV2:  0.0030009933908280682 0.9062354058121207 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2360   0.5153   2.5881  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0004   6.4661   2.1407   2.4885
***** Episode 35814, Mean R = -13.3  Std R = 3.8  Min R = -20.9
PolicyLoss: -0.00565
Policy_Beta: 0.114
Policy_Entropy: 0.15
Policy_KL: 0.000934
Policy_SD: 0.536
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 1.26e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.00434


ADV1:  0.00028772071875203325 0.0083056420127119

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8622   0.9638   5.5884  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0022   6.4661   2.1407   2.4885
***** Episode 36062, Mean R = -13.2  Std R = 5.1  Min R = -34.0
PolicyLoss: -0.0231
Policy_Beta: 0.114
Policy_Entropy: 0.149
Policy_KL: 0.00115
Policy_SD: 0.538
Policy_lr_mult: 0.132
Steps: 1.15e+04
TotalSteps: 1.27e+07
VF_0_ExplainedVarNew: 0.962
VF_0_ExplainedVarOld: 0.958
VF_0_Loss : 0.00274


ADV1:  0.0003231686740439643 0.007082742797698258 0.054564020538324653 -0.047612386346671705
ADV2:  0.003957194716472338 0.8845905785440545 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8161   1.0094   4.1786  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0008   6.4661   2.1407   2.4885
***** Episode 36093, Mean R = -13.9  Std R = 4.4  Min R = -27.8
PolicyLoss: -0.00949
Policy_Beta: 0.114
Policy_Entropy: 0.148
Policy_KL: 0.00

ADV1:  0.0006929308099871926 0.009358447165121499 0.03660358083380941 -0.07971805642552103
ADV2:  0.01717756785826377 0.8632451464345879 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3066   0.6816   3.5498  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0018   6.4661   2.1407   2.4885
***** Episode 36341, Mean R = -15.0  Std R = 5.3  Min R = -27.1
PolicyLoss: -0.0262
Policy_Beta: 0.114
Policy_Entropy: 0.15
Policy_KL: 0.000765
Policy_SD: 0.543
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.28e+07
VF_0_ExplainedVarNew: 0.963
VF_0_ExplainedVarOld: 0.959
VF_0_Loss : 0.00468


ADV1:  -0.00029137593897924063 0.007731603815823366 0.06281562719158168 -0.05907054173687806
ADV2:  0.014762179242346891 0.8673506968340035 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9206   0.4568   2.2738  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0009   6.4661   2.1407   2.

theta_cv |    0.26 |    0.24 |    0.00 |    1.63
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -0.98 |    0.99    0.99
cs_angles |  0.0033  0.0010 |  0.0808  0.0828 | -0.9778 -0.9809 |  0.9926  0.9861
optical_flow |  0.0001 -0.0001 |  0.0277  0.0255 | -1.1641 -1.2153 |  1.1079  1.0931
v_err    | -0.0094 |  0.0583 | -0.4522 |  0.1182
landing_rewards |    9.52 |    2.15 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.04
tracking_rewards |  -19.60 |    4.19 |  -41.26 |  -11.82
steps    |     377 |      21 |     338 |     415
***** Episode 36620, Mean R = -15.1  Std R = 4.8  Min R = -28.4
PolicyLoss: -0.0017
Policy_Beta: 0.114
Policy_Entropy: 0.15
Policy_KL: 0.00087
Policy_SD: 0.541
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 1.29e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 0.00459


ADV1:  -0.00018181426749342878 0.009559243129159036 0.04970534726247147 -0.061211191929852984
ADV2:  0.021734605800028155 0.86370456691

theta_cv |    0.26 |    0.25 |    0.00 |    1.54
seeker_angles |    0.00   -0.00 |    0.08    0.09 |   -1.00   -1.00 |    0.96    1.00
cs_angles |  0.0015 -0.0006 |  0.0788  0.0897 | -0.9996 -0.9998 |  0.9622  0.9955
optical_flow |  0.0000  0.0000 |  0.0261  0.0251 | -0.9874 -1.0251 |  1.0718  1.3003
v_err    | -0.0096 |  0.0589 | -0.4530 |  0.1206
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.03
tracking_rewards |  -19.83 |    5.05 |  -37.69 |  -10.93
steps    |     375 |      20 |     328 |     416
***** Episode 36930, Mean R = -14.3  Std R = 6.9  Min R = -31.9
PolicyLoss: -0.0266
Policy_Beta: 0.114
Policy_Entropy: 0.149
Policy_KL: 0.00114
Policy_SD: 0.545
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.3e+07
VF_0_ExplainedVarNew: 0.968
VF_0_ExplainedVarOld: 0.962
VF_0_Loss : 0.00167


ADV1:  -0.001335523100789544 0.010344669600956065 0.0420360563019669 -0.06991903942830979
ADV2:  0.03203350576730134 0.865632274422296 

attitude |    0.02    0.04   -0.15 |    1.04    0.63    1.76 |   -3.14   -1.55   -3.14 |    3.14    1.53    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03   -0.15 |    0.62    1.76 |   -1.52   -3.13 |    1.44    3.09
w_f      |    0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.05    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.25 |    0.00 |    1.55
seeker_angles |    0.00   -0.00 |    0.08    0.08 |   -1.00   -1.00 |    1.00    0.99
cs_angles |  0.0024 -0.0007 |  0.0830  0.0825 | -0.9981 -0.9967 |  0.9962  0.9893
optical_flow |  0.0000 -0.0001 |  0.0257  0.0246 | -0.9753 -1.1629 |  0.8787  1.1747
v_err    | -0.0095 |  0.0584 | -0.4533 |  0.1296
landing_rewards |    9.26 |    2.62 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00    0.00   -0.00 |    0.67    0.68    0.67 |   -3.43   -3.33   -3.27 |    3.44    3.44    3.44
norm_thrust |    0.90 |    0.75 |    0.00 |    3.46
fuel     |    1.56 |    0.20 |    1.07 |    2.18
rewards  |  -14.35 |    5.23 |  -37.33 |   -5.13
fuel_rewards |   -4.46 |    0.56 |   -6.24 |   -3.09
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.78 |   12.30 |    0.01 |  272.37
norm_af  |    1.65 |    0.91 |    0.09 |    3.33
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.01    0.03    0.04 |    1.10    0.64    1.77 |   -3.14   -1.57   -3.14 |    3.14    1.49    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03    0.10 |    0.64

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0698   1.2195   6.3226  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0038   6.4661   2.1407   2.4885
Update Cnt = 1220    ET =   1116.3   Stats:  Mean, Std, Min, Max
r_f      |   11.31   -9.36   -9.56 |  187.23  163.16  200.37 | -387.51 -375.81 -397.89 |  397.37  363.69  385.12
v_f      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.10    0.10    0.10
r_i      |   28.17  -37.45  -30.93 |  687.45  627.39  782.25 |-1294.99-1214.56-1332.70 | 1371.84 1274.28 1324.83
v_i      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.10 |    0.10    0.09    0.09
norm_rf  |    0.23 |    0.09 |    0.04 |    0.62
norm_vf  |    0.07 |    0.01 |    0.03 |    0.13
gs_f     |    1.63 |    5.16 |    0.01 |   86.19
thrust   |   -0.00   -0.00   -0.00 |    0.67    0.68    0.67 |   -3.32   -3.33   -3.42 |    3.38    3.34    3.18
norm_thrust |    

ADV1:  -0.0020192614930901734 0.00899680274842571 0.053457198930250194 -0.05506409112412326
ADV2:  0.03572482352674838 0.8575919649998581 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3294   1.2176   5.4595  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0015   0.0053   6.4661   2.1407   2.4885
***** Episode 38139, Mean R = -13.5  Std R = 4.9  Min R = -27.6
PolicyLoss: -0.0217
Policy_Beta: 0.114
Policy_Entropy: 0.148
Policy_KL: 0.00124
Policy_SD: 0.551
Policy_lr_mult: 0.132
Steps: 1.15e+04
TotalSteps: 1.34e+07
VF_0_ExplainedVarNew: 0.965
VF_0_ExplainedVarOld: 0.955
VF_0_Loss : 0.000247


ADV1:  0.0018072563833177672 0.006103798098004137 0.034130388213649526 -0.05783026069995195
ADV2:  -0.01697098001118482 0.9064398162825476 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6383   1.3066   6.8800  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0012   0.0047   6.4661   2.1407   2

***** Episode 38387, Mean R = -14.7  Std R = 6.3  Min R = -33.3
PolicyLoss: -0.0245
Policy_Beta: 0.114
Policy_Entropy: 0.149
Policy_KL: 0.000911
Policy_SD: 0.55
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.35e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.972
VF_0_Loss : 6.45e-05


ADV1:  -0.001021164155614191 0.008838849518114545 0.042195976420230596 -0.08109117890004325
ADV2:  0.038970799188090086 0.8080235632990735 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5328   0.5347   2.5777  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0026   6.4661   2.1407   2.4885
***** Episode 38418, Mean R = -14.2  Std R = 4.7  Min R = -28.3
PolicyLoss: -0.0347
Policy_Beta: 0.114
Policy_Entropy: 0.147
Policy_KL: 0.00113
Policy_SD: 0.558
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.35e+07
VF_0_ExplainedVarNew: 0.964
VF_0_ExplainedVarOld: 0.962
VF_0_Loss : 0.000111


ADV1:  0.0009772609784797059 0.00752508854869558

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3126   0.6323   2.8012  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0055   0.0034   0.0132   6.4661   2.1407   2.4885
***** Episode 38666, Mean R = -13.1  Std R = 3.5  Min R = -21.0
PolicyLoss: -0.0174
Policy_Beta: 0.114
Policy_Entropy: 0.15
Policy_KL: 0.00113
Policy_SD: 0.542
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.36e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 0.00109


ADV1:  -0.002699354271870256 0.0092114581478605 0.04742639237603308 -0.06287084308974034
ADV2:  0.03526666428566776 0.8876881786503958 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0356   0.5749   2.7099  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0017   0.0069   6.4661   2.1407   2.4885
***** Episode 38697, Mean R = -15.0  Std R = 6.5  Min R = -31.8
PolicyLoss: -0.0212
Policy_Beta: 0.114
Policy_Entropy: 0.152
Policy_KL: 0.00104
Pol

ADV1:  -0.00114085962884808 0.009051093903830422 0.03805320549018315 -0.07095640251108731
ADV2:  0.035970272425933425 0.8359299988349606 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4668   1.0348   5.3589  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0006   0.0029   6.4661   2.1407   2.4885
***** Episode 38945, Mean R = -14.6  Std R = 5.1  Min R = -30.2
PolicyLoss: -0.0326
Policy_Beta: 0.114
Policy_Entropy: 0.148
Policy_KL: 0.000872
Policy_SD: 0.543
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.37e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.963
VF_0_Loss : 0.000119


ADV1:  0.0011345067901136474 0.0072366643686728105 0.060173174430888265 -0.050593692319707284
ADV2:  -0.015453353656100415 0.897799039739569 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6661   0.6520   3.6870  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0007   0.0030   6.4661   2.1407  

***** Episode 39193, Mean R = -14.1  Std R = 5.2  Min R = -26.7
PolicyLoss: -0.0145
Policy_Beta: 0.114
Policy_Entropy: 0.155
Policy_KL: 0.00104
Policy_SD: 0.523
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 1.38e+07
VF_0_ExplainedVarNew: 0.92
VF_0_ExplainedVarOld: 0.916
VF_0_Loss : 0.000148


ADV1:  0.0007343454331952492 0.00935397449150678 0.03804282022899652 -0.07470229819202157
ADV2:  0.01866436752209678 0.837435451047154 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2299   0.5284   2.4100  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0020   6.4661   2.1407   2.4885
***** Episode 39224, Mean R = -13.9  Std R = 5.0  Min R = -27.8
PolicyLoss: -0.0298
Policy_Beta: 0.114
Policy_Entropy: 0.151
Policy_KL: 0.000965
Policy_SD: 0.549
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.38e+07
VF_0_ExplainedVarNew: 0.96
VF_0_ExplainedVarOld: 0.954
VF_0_Loss : 0.000403


ADV1:  0.0008212142081925142 0.008912945955485965 0.0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1757   1.1074   5.9150  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0007   6.4661   2.1407   2.4885
***** Episode 39472, Mean R = -13.7  Std R = 4.8  Min R = -29.7
PolicyLoss: -0.0181
Policy_Beta: 0.114
Policy_Entropy: 0.149
Policy_KL: 0.00138
Policy_SD: 0.543
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.39e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.97
VF_0_Loss : 0.000356


ADV1:  0.0015896842119739367 0.005994025210851821 0.042062863744053214 -0.0611644283952327
ADV2:  -0.0038753791100678728 0.8827839985497747 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3655   0.6600   2.8508  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0012   0.0043   6.4661   2.1407   2.4885
***** Episode 39503, Mean R = -13.1  Std R = 4.8  Min R = -27.6
PolicyLoss: -0.015
Policy_Beta: 0.114
Policy_Entropy: 0.151
Policy_KL: 0.0007

ADV1:  -0.0006990854061297459 0.008308646149926926 0.06154015146114572 -0.06624153818981804
ADV2:  0.022695528901862043 0.8591335637586496 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1793   1.1721   5.4370  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0019   6.4661   2.1407   2.4885
***** Episode 39751, Mean R = -14.9  Std R = 7.0  Min R = -36.3
PolicyLoss: -0.0208
Policy_Beta: 0.114
Policy_Entropy: 0.15
Policy_KL: 0.000802
Policy_SD: 0.549
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.4e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.97
VF_0_Loss : 6.49e-05


ADV1:  -0.0005244260899148374 0.008087086276144934 0.0390176637967428 -0.06143518257969492
ADV2:  0.02709046674374186 0.8598895978687052 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3975   0.4735   2.4890  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0004   0.0014   6.4661   2.1407   2.48

theta_cv |    0.25 |    0.25 |    0.00 |    1.56
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.99   -0.99 |    0.99    0.98
cs_angles |  0.0001  0.0004 |  0.0782  0.0857 | -0.9926 -0.9945 |  0.9857  0.9841
optical_flow |  0.0001 -0.0001 |  0.0252  0.0248 | -1.2960 -1.0377 |  1.2475  1.1066
v_err    | -0.0099 |  0.0584 | -0.4529 |  0.1179
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.07 |    0.04
tracking_rewards |  -19.21 |    4.62 |  -39.83 |  -12.19
steps    |     377 |      20 |     331 |     415
***** Episode 40030, Mean R = -12.8  Std R = 4.9  Min R = -26.8
PolicyLoss: -0.0161
Policy_Beta: 0.114
Policy_Entropy: 0.153
Policy_KL: 0.000926
Policy_SD: 0.534
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 1.42e+07
VF_0_ExplainedVarNew: 0.971
VF_0_ExplainedVarOld: 0.966
VF_0_Loss : 0.000719


ADV1:  0.0015881200214738723 0.008419050008226214 0.05329396170169087 -0.056052495537513236
ADV2:  0.0032502685648961626 0.888440687

attitude |    0.03   -0.01    0.12 |    1.23    0.65    1.92 |   -3.14   -1.51   -3.14 |    3.14    1.57    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01    0.14 |    0.65    1.93 |   -1.36   -3.12 |    1.50    3.13
w_f      |   -0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.06   -0.02   -0.02 |    0.05    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.06 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.25 |    0.00 |    1.58
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.98   -0.99 |    0.99    0.99
cs_angles |  0.0001  0.0003 |  0.0809  0.0872 | -0.9791 -0.9947 |  0.9930  0.9895
optical_flow |  0.0001  0.0000 |  0.0261  0.0247 | -1.1559 -0.9980 |  1.0574  1.0318
v_err    | -0.0097 |  0.0583 | -0.4523 |  0.1088
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.01    0.00   -0.00 |    0.68    0.68    0.68 |   -3.42   -3.41   -3.36 |    3.39    3.28    3.37
norm_thrust |    0.90 |    0.75 |    0.00 |    3.46
fuel     |    1.56 |    0.21 |    1.08 |    2.34
rewards  |  -14.67 |    6.14 |  -53.69 |   -4.33
fuel_rewards |   -4.48 |    0.60 |   -6.72 |   -3.14
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.94 |   12.94 |    0.01 |  594.37
norm_af  |    1.65 |    0.90 |    0.11 |    3.28
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.04    0.02    0.11 |    1.18    0.67    1.77 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.00 |    0.67

ADV1:  0.004348039823743192 0.008416644067887289 0.04779213311115274 -0.07574991710580038
ADV2:  -0.011833041759905226 0.8807375160777188 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7131   1.0088   5.4882  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0050   0.0030   0.0111   6.4661   2.1407   2.4885
Update Cnt = 1320    ET =   1043.1   Stats:  Mean, Std, Min, Max
r_f      |  -11.13    4.30   -4.56 |  185.87  175.29  203.81 | -398.57 -391.43 -393.49 |  384.08  379.68  395.84
v_f      |    0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.10 |    0.10    0.11    0.11
r_i      |  -35.92   -1.47  -55.45 |  667.51  668.31  781.96 |-1340.07-1310.93-1315.06 | 1259.94 1339.31 1314.21
v_i      |    0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.10    0.10    0.10
norm_rf  |    0.23 |    0.09 |    0.03 |    0.57
norm_vf  |    0.07 |    0.01 |    0.04 |    0.12
gs_f     |    1.48 |    2.65 |  

Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  -0.0006437964171945136 0.011544310226326657 0.061748347496970335 -0.08137683261701513
ADV2:  0.02660779865099369 0.8582179559343189 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3328   0.7862   4.2863  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0006   0.0021   6.4661   2.1407   2.4885
***** Episode 41239, Mean R = -14.4  Std R = 5.9  Min R = -30.1
PolicyLoss: -0.0268
Policy_Beta: 0.114
Policy_Entropy: 0.151
Policy_KL: 0.00118
Policy_SD: 0.554
Policy_lr_mult: 0.132
Steps: 1.15e+04
TotalSteps: 1.46e+07
VF_0_ExplainedVarNew: 0.94
VF_0_ExplainedVarOld: 0.934
VF_0_Loss : 0.000125


ADV1:  0.0023655238839477544 0.0076261452425150054 0.04242608929223775 -0.06746550092931483
ADV2:  -0.011817820658884643 0.879282854097903 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1819   0.6536   3.6437  27.0893  20.3031  12.6669
ValF

***** Episode 41487, Mean R = -14.8  Std R = 6.7  Min R = -40.4
PolicyLoss: -0.0279
Policy_Beta: 0.114
Policy_Entropy: 0.151
Policy_KL: 0.00149
Policy_SD: 0.542
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 1.47e+07
VF_0_ExplainedVarNew: 0.972
VF_0_ExplainedVarOld: 0.963
VF_0_Loss : 0.00048


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  -0.0007890685591331632 0.009309124421060126 0.04145695671385652 -0.07604661261397061
ADV2:  0.02149877071630914 0.8944011535147491 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1819   1.2985   6.2868  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0007   0.0028   6.4661   2.1407   2.4885
***** Episode 41518, Mean R = -15.7  Std R = 7.1  Min R = -37.9
PolicyLoss: -0.0189
Policy_Beta: 0.114
Policy_Entropy: 0.148
Policy_KL: 0.000885
Policy_SD: 0.564
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.47e+07
VF_0_ExplainedVarNew: 0.972
VF_0_Ex

ADV1:  -0.0014795209529482095 0.009653135368511595 0.04131558318899009 -0.0635445715542504
ADV2:  0.033578400966027676 0.8677417747662374 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8664   0.9506   5.1258  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0010   0.0038   6.4661   2.1407   2.4885
***** Episode 41766, Mean R = -14.3  Std R = 4.8  Min R = -32.1
PolicyLoss: -0.0264
Policy_Beta: 0.114
Policy_Entropy: 0.153
Policy_KL: 0.00104
Policy_SD: 0.539
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 1.48e+07
VF_0_ExplainedVarNew: 0.955
VF_0_ExplainedVarOld: 0.951
VF_0_Loss : 0.000523


ADV1:  0.004555910392008507 0.0068543174073932575 0.048345384149233256 -0.07287012911727803
ADV2:  -0.03809609601696464 0.8762241141627832 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5611   1.2235   5.7445  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0056   0.0035   0.0121   6.4661   2.1407   2

Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  -0.0017507919036938585 0.009349327524491278 0.03252493770985576 -0.06656233686573754
ADV2:  0.03984436989193836 0.848358275145782 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2919   0.9543   4.9389  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0013   0.0050   6.4661   2.1407   2.4885
***** Episode 42045, Mean R = -14.3  Std R = 6.4  Min R = -31.4
PolicyLoss: -0.0326
Policy_Beta: 0.114
Policy_Entropy: 0.153
Policy_KL: 0.00128
Policy_SD: 0.54
Policy_lr_mult: 0.132
Steps: 1.14e+04
TotalSteps: 1.49e+07
VF_0_ExplainedVarNew: 0.968
VF_0_ExplainedVarOld: 0.964
VF_0_Loss : 0.00111


ADV1:  0.000466275045020021 0.008764718603249478 0.058539349930172846 -0.06626807011002106
ADV2:  0.005458826890068736 0.8898416445020294 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0348   0.4136   2.1733  27.0893  20.3031  12.6669
ValFun  

***** Episode 42293, Mean R = -13.5  Std R = 4.9  Min R = -26.3
PolicyLoss: -0.0291
Policy_Beta: 0.114
Policy_Entropy: 0.155
Policy_KL: 0.000772
Policy_SD: 0.534
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 1.5e+07
VF_0_ExplainedVarNew: 0.953
VF_0_ExplainedVarOld: 0.949
VF_0_Loss : 0.00013


ADV1:  0.0022653230775756166 0.007941121155016165 0.04167262024030202 -0.06269385954587268
ADV2:  0.005524135541345265 0.8365952073550689 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5688   1.0745   5.8748  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0016   0.0061   6.4661   2.1407   2.4885
***** Episode 42324, Mean R = -14.6  Std R = 5.9  Min R = -26.9
PolicyLoss: -0.0292
Policy_Beta: 0.114
Policy_Entropy: 0.155
Policy_KL: 0.000786
Policy_SD: 0.531
Policy_lr_mult: 0.132
Steps: 1.19e+04
TotalSteps: 1.5e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 8.18e-05


ADV1:  -0.0002509914874860817 0.007327173899859189

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8064   0.9395   4.6041  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0013   0.0046   6.4661   2.1407   2.4885
***** Episode 42572, Mean R = -15.4  Std R = 4.5  Min R = -28.5
PolicyLoss: -0.031
Policy_Beta: 0.114
Policy_Entropy: 0.153
Policy_KL: 0.000891
Policy_SD: 0.54
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 1.51e+07
VF_0_ExplainedVarNew: 0.959
VF_0_ExplainedVarOld: 0.956
VF_0_Loss : 0.000516


ADV1:  0.0008546146965720585 0.00934690987075332 0.056366530977355445 -0.06897571731604768
ADV2:  0.013277784161158488 0.8735487800173986 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.7581   0.3418   2.0976  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0025   6.4661   2.1407   2.4885
***** Episode 42603, Mean R = -12.7  Std R = 5.9  Min R = -34.4
PolicyLoss: -0.0231
Policy_Beta: 0.114
Policy_Entropy: 0.153
Policy_KL: 0.00097

ADV1:  -0.002084324903369624 0.00934683596223796 0.052012611750970245 -0.08586513541595003
ADV2:  0.034879743740323446 0.875830045137031 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3140   0.7139   3.9013  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0014   0.0054   6.4661   2.1407   2.4885
***** Episode 42851, Mean R = -16.1  Std R = 5.4  Min R = -30.9
PolicyLoss: -0.0227
Policy_Beta: 0.114
Policy_Entropy: 0.153
Policy_KL: 0.000941
Policy_SD: 0.546
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 1.52e+07
VF_0_ExplainedVarNew: 0.97
VF_0_ExplainedVarOld: 0.966
VF_0_Loss : 0.000152


ADV1:  0.003294969942405952 0.007438779970047864 0.07066250180689554 -0.12808786434354452
ADV2:  -0.01781630598483706 0.8234916771859402 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1354   0.7413   4.1005  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0042   0.0026   0.0093   6.4661   2.1407   2.48

seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.94 |    0.99    0.99
cs_angles |  0.0037  0.0046 |  0.0836  0.0837 | -0.9925 -0.9381 |  0.9870  0.9903
optical_flow |  0.0000  0.0001 |  0.0264  0.0255 | -0.9908 -1.0709 |  1.0337  1.2805
v_err    | -0.0101 |  0.0582 | -0.4523 |  0.1164
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.05 |    0.02
tracking_rewards |  -19.44 |    5.00 |  -43.76 |  -11.70
steps    |     377 |      21 |     331 |     419
***** Episode 43130, Mean R = -14.1  Std R = 6.6  Min R = -39.5
PolicyLoss: -0.0278
Policy_Beta: 0.114
Policy_Entropy: 0.154
Policy_KL: 0.00135
Policy_SD: 0.536
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 1.53e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 4.31e-05


ADV1:  -0.0007768528749671863 0.00745670370254278 0.04929481964123339 -0.04971092854500324
ADV2:  0.02038571173053075 0.8695145399547942 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Ma

attitude |    0.07    0.03   -0.02 |    1.14    0.68    1.72 |   -3.14   -1.54   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03   -0.04 |    0.67    1.72 |   -1.46   -3.14 |    1.41    3.14
w_f      |    0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.05    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.24 |    0.00 |    1.61
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    1.00    0.98
cs_angles |  0.0031  0.0046 |  0.0779  0.0831 | -0.9890 -0.9936 |  0.9999  0.9806
optical_flow |  0.0000 -0.0002 |  0.0255  0.0254 | -1.1653 -0.9556 |  1.1530  1.0200
v_err    | -0.0103 |  0.0586 | -0.4533 |  0.1028
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.17   -0.04    0.09 |    1.16    0.67    1.84 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03    0.09 |    0.67    1.84 |   -1.54   -3.11 |    1.48    3.12
w_f      |   -0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.02 |    0.05    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.25 |    0.00 |    1.61
seeker_angles |    0.01    0.00 |    0.08    0.08 |   -1.00   -0.96 |    0.99    0.99
cs_angles |  0.0053  0.0017 |  0.0794  0.0825 | -0.9953 -0.9649 |  0.9945  0.9938
optical_flow | -0.0001  0.0000 |  0.0256  0.0247 | -1.1328 -1.0737 |  1.1778  1.0316
v_err    | -0.0099 |  0.0583 | -0.4530 |  0.1067
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.04    0.01    0.03 |    1.18    0.65    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.09 |    0.66    1.81 |   -1.52   -3.12 |    1.56    3.12
w_f      |   -0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.05    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.25 |    0.00 |    1.62
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -1.00   -0.99 |    0.98    0.97
cs_angles |  0.0002  0.0028 |  0.0753  0.0885 | -0.9978 -0.9949 |  0.9757  0.9659
optical_flow |  0.0002  0.0000 |  0.0260  0.0243 | -1.0843 -1.0115 |  1.1606  1.1398
v_err    | -0.0096 |  0.0586 | -0.4531 |  0.1051
landing_rewards |    9.19 |    2.72 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.00 |    0.64    1.90 |   -1.38   -3.13 |    1.53    3.14
w_f      |    0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.02 |    0.05    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.25 |    0.00 |    1.70
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.98   -0.99 |    0.97    0.99
cs_angles | -0.0003  0.0035 |  0.0784  0.0832 | -0.9826 -0.9902 |  0.9663  0.9924
optical_flow |  0.0001 -0.0001 |  0.0255  0.0249 | -1.2761 -1.2992 |  1.3741  0.9531
v_err    | -0.0099 |  0.0578 | -0.4531 |  0.1230
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.04
tracking_rewards |  -18.89 |    4.59 |  -40.20 |  -10.45
steps    |     379 |  

w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04    0.01 |    0.64    1.83 |   -1.42   -3.12 |    1.55    3.10
w_f      |    0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.05    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.25 |    0.00 |    1.44
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    0.98    1.00
cs_angles | -0.0021  0.0038 |  0.0805  0.0807 | -0.9956 -0.9936 |  0.9832  0.9968
optical_flow | -0.0001 -0.0001 |  0.0248  0.0248 | -1.1606 -1.1221 |  1.1077  1.1276
v_err    | -0.0102 |  0.0582 | -0.4525 |  0.0997
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.03
tracking_rewards |  -18.86 |    4.29 |  -39.26 |  -11.74
steps    |     378 |  

attitude |   -0.03    0.06   -0.07 |    1.15    0.66    1.89 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.07   -0.01 |    0.66    1.90 |   -1.37   -3.10 |    1.51    3.14
w_f      |    0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.02 |    0.05    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.25 |    0.00 |    1.54
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    0.99    0.99
cs_angles |  0.0018  0.0006 |  0.0777  0.0833 | -0.9938 -0.9948 |  0.9935  0.9942
optical_flow |  0.0001 -0.0000 |  0.0267  0.0249 | -1.0736 -1.0065 |  1.2494  1.2744
v_err    | -0.0099 |  0.0588 | -0.4524 |  0.1109
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.11    0.03    0.06 |    1.18    0.65    1.86 |   -3.14   -1.56   -3.14 |    3.14    1.54    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04    0.06 |    0.64    1.85 |   -1.47   -3.14 |    1.43    3.12
w_f      |    0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.02 |    0.05    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.25 |    0.00 |    1.52
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -0.96 |    0.94    0.98
cs_angles |  0.0022  0.0035 |  0.0763  0.0828 | -0.9833 -0.9612 |  0.9442  0.9783
optical_flow | -0.0000 -0.0001 |  0.0245  0.0254 | -1.0436 -1.2336 |  0.8895  1.2398
v_err    | -0.0096 |  0.0588 | -0.4531 |  0.1062
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.00    0.02 |    0.66    1.82 |   -1.56   -3.11 |    1.55    3.11
w_f      |    0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.25 |    0.00 |    1.47
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -1.00 |    0.99    0.97
cs_angles |  0.0028  0.0037 |  0.0818  0.0797 | -0.9955 -0.9976 |  0.9907  0.9736
optical_flow | -0.0001 -0.0001 |  0.0251  0.0249 | -1.2684 -0.9983 |  1.0635  1.3079
v_err    | -0.0094 |  0.0588 | -0.4527 |  0.1078
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -18.77 |    4.03 |  -31.23 |   -9.87
steps    |     375 |  

w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.14 |    0.69    1.89 |   -1.43   -3.14 |    1.51    3.11
w_f      |    0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.05    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.25 |    0.00 |    1.65
seeker_angles |   -0.00    0.00 |    0.08    0.09 |   -1.00   -0.96 |    0.99    0.99
cs_angles | -0.0004  0.0027 |  0.0775  0.0861 | -0.9959 -0.9637 |  0.9935  0.9895
optical_flow | -0.0000 -0.0001 |  0.0259  0.0238 | -1.1426 -1.1093 |  1.2316  1.0062
v_err    | -0.0092 |  0.0582 | -0.4524 |  0.1110
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.03
tracking_rewards |  -18.96 |    4.38 |  -34.51 |  -10.82
steps    |     377 |  

attitude |    0.05    0.05    0.03 |    1.08    0.63    1.85 |   -3.14   -1.55   -3.14 |    3.14    1.54    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04   -0.01 |    0.63    1.85 |   -1.41   -3.14 |    1.46    3.13
w_f      |    0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.25 |    0.00 |    1.84
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.96 |    1.00    1.00
cs_angles |  0.0012  0.0023 |  0.0788  0.0837 | -0.9914 -0.9639 |  0.9955  0.9956
optical_flow |  0.0000 -0.0000 |  0.0248  0.0251 | -0.8908 -1.2633 |  1.2790  1.1057
v_err    | -0.0092 |  0.0583 | -0.4514 |  0.1306
landing_rewards |    9.19 |    2.72 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00    0.00   -0.00 |    0.67    0.70    0.68 |   -3.38   -3.44   -3.43 |    3.36    3.31    3.36
norm_thrust |    0.91 |    0.75 |    0.00 |    3.46
fuel     |    1.59 |    0.20 |    1.07 |    2.20
rewards  |  -13.94 |    5.23 |  -34.18 |   -4.54
fuel_rewards |   -4.55 |    0.58 |   -6.31 |   -3.06
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.73 |   12.46 |    0.01 |  176.07
norm_af  |    1.72 |    0.89 |    0.13 |    3.32
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.06    0.02    0.07 |    1.20    0.64    1.81 |   -3.14   -1.57   -3.14 |    3.14    1.48    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01    0.03 |    0.65

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3570   0.5594   2.7641  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0017   6.4661   2.1407   2.4885
Update Cnt = 1510    ET =    967.7   Stats:  Mean, Std, Min, Max
r_f      |   -7.53    5.52   20.08 |  184.11  168.41  195.82 | -368.87 -384.67 -392.80 |  397.36  385.38  390.09
v_f      |    0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.11   -0.10 |    0.11    0.10    0.09
r_i      |  -50.60   32.66   48.37 |  683.76  664.99  753.84 |-1272.49-1170.58-1316.23 | 1333.53 1292.20 1306.63
v_i      |    0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.10   -0.10 |    0.10    0.09    0.09
norm_rf  |    0.22 |    0.08 |    0.04 |    0.55
norm_vf  |    0.08 |    0.01 |    0.04 |    0.12
gs_f     |    1.19 |    1.59 |    0.02 |   11.70
thrust   |    0.00   -0.00   -0.00 |    0.68    0.69    0.68 |   -3.33   -3.37   -3.46 |    3.40    3.46    3.44
norm_thrust |    

ADV1:  0.004390271428692487 0.006782527926743512 0.07424791964599392 -0.08065717216044532
ADV2:  -0.03578563812222187 0.8714123570175114 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.7537   0.3740   2.1440  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0047   0.0029   0.0114   6.4661   2.1407   2.4885
***** Episode 47129, Mean R = -12.9  Std R = 4.1  Min R = -20.2
PolicyLoss: -0.0159
Policy_Beta: 0.114
Policy_Entropy: 0.152
Policy_KL: 0.000813
Policy_SD: 0.547
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 1.68e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 0.000664


ADV1:  -0.003012189957553298 0.008392372061876603 0.03887652347371273 -0.057538969122523764
ADV2:  0.04523452178360018 0.8791501412606374 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9507   1.1734   6.1546  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0030   0.0019   0.0079   6.4661   2.1407   2.

***** Episode 47377, Mean R = -14.6  Std R = 4.4  Min R = -26.9
PolicyLoss: -0.0292
Policy_Beta: 0.114
Policy_Entropy: 0.151
Policy_KL: 0.000763
Policy_SD: 0.554
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.69e+07
VF_0_ExplainedVarNew: 0.967
VF_0_ExplainedVarOld: 0.965
VF_0_Loss : 0.000713


ADV1:  8.04528821448409e-05 0.00927614004893373 0.04574519683241024 -0.05197730555876329
ADV2:  0.01182058027534759 0.905470303434209 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6942   0.6549   3.5314  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0007   6.4661   2.1407   2.4885
***** Episode 47408, Mean R = -14.1  Std R = 4.7  Min R = -27.3
PolicyLoss: -0.0163
Policy_Beta: 0.114
Policy_Entropy: 0.151
Policy_KL: 0.00118
Policy_SD: 0.555
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.69e+07
VF_0_ExplainedVarNew: 0.964
VF_0_ExplainedVarOld: 0.96
VF_0_Loss : 0.00039


ADV1:  0.00037156996543053134 0.007997600622140263 0.0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0278   0.3837   1.9598  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0007   0.0028   6.4661   2.1407   2.4885
***** Episode 47656, Mean R = -13.4  Std R = 4.2  Min R = -25.2
PolicyLoss: -0.0185
Policy_Beta: 0.114
Policy_Entropy: 0.155
Policy_KL: 0.000862
Policy_SD: 0.538
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 1.7e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.00032


ADV1:  0.00016244398945829087 0.008519761893505784 0.047448897982631355 -0.06907250903860451
ADV2:  0.024616540930448162 0.8295992692824379 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0769   1.0042   4.2811  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0001   0.0001   0.0005   6.4661   2.1407   2.4885
***** Episode 47687, Mean R = -14.5  Std R = 6.9  Min R = -33.0
PolicyLoss: -0.0311
Policy_Beta: 0.114
Policy_Entropy: 0.154
Policy_KL: 0.001

ADV1:  0.001214212873957449 0.008184658968722383 0.04930050551145995 -0.11364545320611402
ADV2:  0.015204723809987178 0.804819225069694 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2715   1.1081   6.2159  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0010   0.0036   6.4661   2.1407   2.4885
***** Episode 47935, Mean R = -12.9  Std R = 5.0  Min R = -25.3
PolicyLoss: -0.031
Policy_Beta: 0.114
Policy_Entropy: 0.154
Policy_KL: 0.000972
Policy_SD: 0.55
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 1.71e+07
VF_0_ExplainedVarNew: 0.973
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 0.000291


ADV1:  -0.0013439741213895485 0.00837297107352355 0.05885363412555178 -0.0640998149628399
ADV2:  0.03803637660269754 0.8251325277879001 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7427   0.7857   3.8163  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0009   0.0034   6.4661   2.1407   2.4885


***** Episode 48183, Mean R = -12.7  Std R = 5.8  Min R = -28.6
PolicyLoss: -0.0287
Policy_Beta: 0.114
Policy_Entropy: 0.155
Policy_KL: 0.000909
Policy_SD: 0.533
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 1.72e+07
VF_0_ExplainedVarNew: 0.956
VF_0_ExplainedVarOld: 0.951
VF_0_Loss : 0.000472


ADV1:  -0.00019013001956365609 0.009743462655185425 0.07839087596840322 -0.08730412355682221
ADV2:  0.01347358165129223 0.8764356986279637 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4781   1.1518   5.8912  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0012   6.4661   2.1407   2.4885
***** Episode 48214, Mean R = -13.7  Std R = 6.1  Min R = -30.1
PolicyLoss: -0.0162
Policy_Beta: 0.114
Policy_Entropy: 0.155
Policy_KL: 0.00112
Policy_SD: 0.543
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.72e+07
VF_0_ExplainedVarNew: 0.964
VF_0_ExplainedVarOld: 0.956
VF_0_Loss : 0.000382


ADV1:  -0.0027341847409355162 0.010710996607065

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9928   0.4293   2.1130  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0003   0.0011   6.4661   2.1407   2.4885
***** Episode 48462, Mean R = -14.6  Std R = 5.4  Min R = -27.5
PolicyLoss: -0.0162
Policy_Beta: 0.114
Policy_Entropy: 0.155
Policy_KL: 0.000843
Policy_SD: 0.55
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 1.73e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.000208


ADV1:  0.0010646280033867318 0.009428788301789717 0.04108515731788692 -0.08556033451341888
ADV2:  0.011437397893235236 0.8738637854791246 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1492   0.8639   4.7467  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0008   0.0028   6.4661   2.1407   2.4885
***** Episode 48493, Mean R = -14.7  Std R = 6.4  Min R = -31.5
PolicyLoss: -0.0234
Policy_Beta: 0.114
Policy_Entropy: 0.156
Policy_KL: 0.00108

ADV1:  0.0016318030072353692 0.0064799454727259035 0.04147529296594196 -0.048639032386879
ADV2:  -0.0039035003051040283 0.8827207669209859 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2821   0.7228   3.9610  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0011   0.0042   6.4661   2.1407   2.4885
***** Episode 48741, Mean R = -13.1  Std R = 4.2  Min R = -22.7
PolicyLoss: -0.019
Policy_Beta: 0.114
Policy_Entropy: 0.153
Policy_KL: 0.00114
Policy_SD: 0.555
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 1.74e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.000323


ADV1:  -0.0023316840856229554 0.007997980644758481 0.0517438126575851 -0.07861585977700736
ADV2:  0.04098516192538893 0.8592483927668794 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4741   0.8305   4.4625  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0016   0.0059   6.4661   2.1407   2.48

seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    1.00    0.98
cs_angles |  0.0007  0.0011 |  0.0817  0.0827 | -0.9931 -0.9911 |  0.9968  0.9822
optical_flow |  0.0001  0.0000 |  0.0256  0.0237 | -1.1093 -1.0410 |  1.3284  1.1397
v_err    | -0.0093 |  0.0577 | -0.4512 |  0.1132
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -18.63 |    4.76 |  -43.29 |  -10.75
steps    |     379 |      20 |     330 |     416
***** Episode 49020, Mean R = -13.7  Std R = 5.7  Min R = -30.0
PolicyLoss: -0.0292
Policy_Beta: 0.114
Policy_Entropy: 0.154
Policy_KL: 0.000999
Policy_SD: 0.543
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 1.75e+07
VF_0_ExplainedVarNew: 0.973
VF_0_ExplainedVarOld: 0.968
VF_0_Loss : 0.000114


ADV1:  0.00026959825581775485 0.006928310425072318 0.04084082752466206 -0.04727186552499104
ADV2:  0.016557018493825165 0.8542027402300587 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max

att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.00    0.01    0.06 |    1.18    0.66    1.88 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01    0.15 |    0.68    1.89 |   -1.53   -3.14 |    1.43    3.13
w_f      |   -0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.04    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.66
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -0.99 |    1.00    1.00
cs_angles |  0.0002  0.0028 |  0.0757  0.0795 | -0.9812 -0.9850 |  0.9998  0.9993
optical_flow |  0.0000 -0.0001 |  0.0248  0.0251 | -1.2371 -1.0745 |  1.0006  1.0415
v_err    | -0.0096 |  

w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.00   -0.11 |    0.64    1.82 |   -1.42   -3.14 |    1.43    3.13
w_f      |    0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.02 |    0.05    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.61
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -0.97 |    0.98    0.99
cs_angles |  0.0005  0.0030 |  0.0782  0.0809 | -0.9781 -0.9719 |  0.9779  0.9893
optical_flow |  0.0001 -0.0001 |  0.0250  0.0245 | -0.9483 -1.1668 |  1.0865  0.9218
v_err    | -0.0098 |  0.0581 | -0.4529 |  0.1267
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.04
tracking_rewards |  -18.00 |    4.30 |  -35.96 |  -10.62
steps    |     376 |  

w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03   -0.13 |    0.60    1.85 |   -1.39   -3.13 |    1.35    3.12
w_f      |    0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.24 |    0.00 |    1.62
seeker_angles |    0.00   -0.00 |    0.08    0.08 |   -1.00   -1.00 |    0.98    0.99
cs_angles |  0.0009 -0.0002 |  0.0751  0.0775 | -0.9998 -0.9972 |  0.9812  0.9850
optical_flow |  0.0000 -0.0002 |  0.0250  0.0244 | -1.0670 -1.0374 |  1.1226  0.9413
v_err    | -0.0097 |  0.0580 | -0.4521 |  0.1085
landing_rewards |    9.32 |    2.51 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -17.72 |    3.52 |  -31.75 |  -11.20
steps    |     377 |  

attitude |   -0.02    0.02    0.10 |    1.19    0.64    1.90 |   -3.14   -1.54   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01    0.18 |    0.65    1.87 |   -1.43   -3.14 |    1.47    3.14
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.05    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.25 |    0.00 |    1.64
seeker_angles |    0.00   -0.00 |    0.08    0.08 |   -0.99   -0.97 |    0.98    1.00
cs_angles |  0.0008 -0.0020 |  0.0798  0.0820 | -0.9949 -0.9699 |  0.9769  0.9974
optical_flow |  0.0001 -0.0001 |  0.0243  0.0238 | -1.1570 -0.8899 |  0.9807  1.3636
v_err    | -0.0100 |  0.0583 | -0.4529 |  0.1142
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01    0.13 |    0.67    1.83 |   -1.51   -3.14 |    1.42    3.13
w_f      |    0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.44
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.93   -0.99 |    0.99    0.99
cs_angles | -0.0014  0.0021 |  0.0778  0.0814 | -0.9324 -0.9914 |  0.9933  0.9928
optical_flow |  0.0000 -0.0001 |  0.0255  0.0242 | -1.0828 -1.4282 |  1.1868  1.0700
v_err    | -0.0094 |  0.0576 | -0.4525 |  0.1094
landing_rewards |    9.19 |    2.72 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.04
tracking_rewards |  -18.11 |    4.30 |  -44.49 |  -10.24
steps    |     378 |  

attitude |    0.09    0.05    0.09 |    1.21    0.65    1.86 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04    0.06 |    0.65    1.87 |   -1.52   -3.11 |    1.45    3.14
w_f      |    0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.25 |    0.00 |    1.52
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -1.00 |    1.00    0.97
cs_angles |  0.0041  0.0014 |  0.0769  0.0833 | -0.9814 -0.9974 |  0.9996  0.9704
optical_flow | -0.0000  0.0000 |  0.0262  0.0246 | -1.4068 -1.0514 |  0.9060  1.1480
v_err    | -0.0099 |  0.0584 | -0.4534 |  0.1107
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.01    0.00   -0.00 |    0.67    0.67    0.66 |   -3.45   -3.40   -3.26 |    3.35    3.40    3.43
norm_thrust |    0.88 |    0.75 |    0.00 |    3.46
fuel     |    1.52 |    0.20 |    1.10 |    2.17
rewards  |  -13.20 |    5.06 |  -39.45 |   -4.59
fuel_rewards |   -4.36 |    0.56 |   -6.20 |   -3.15
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.01 |   13.44 |    0.01 |  608.61
norm_af  |    1.80 |    0.92 |    0.05 |    3.39
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.08   -0.03   -0.00 |    1.28    0.68    1.90 |   -3.14   -1.54   -3.14 |    3.14    1.55    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04   -0.02 |    0.69

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.2369   1.7099   9.3472  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0007   0.0025   6.4661   2.1407   2.4885
Update Cnt = 1660    ET =    910.4   Stats:  Mean, Std, Min, Max
r_f      |   -2.70   -3.07   -6.27 |  181.80  177.58  200.42 | -383.12 -380.15 -394.06 |  381.09  379.33  382.16
v_f      |    0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.08   -0.09   -0.10 |    0.10    0.09    0.10
r_i      |  -10.35    6.76  -33.74 |  690.19  651.05  767.17 |-1320.69-1320.53-1326.17 | 1285.62 1308.29 1318.01
v_i      |    0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.08   -0.10 |    0.09    0.10    0.09
norm_rf  |    0.21 |    0.09 |    0.04 |    0.49
norm_vf  |    0.07 |    0.01 |    0.04 |    0.12
gs_f     |    1.74 |    5.36 |    0.01 |   81.39
thrust   |    0.00   -0.01    0.00 |    0.67    0.67    0.67 |   -3.35   -3.29   -3.39 |    3.46    3.30    3.39
norm_thrust |    

ADV1:  0.003998267163968466 0.007249651943790339 0.03750418735821939 -0.11342611393847901
ADV2:  -0.014929164742484608 0.853829188898057 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8724   0.9867   5.2139  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0035   0.0025   0.0105   6.4661   2.1407   2.4885
***** Episode 51779, Mean R = -14.5  Std R = 5.7  Min R = -32.0
PolicyLoss: -0.0277
Policy_Beta: 0.114
Policy_Entropy: 0.157
Policy_KL: 0.000969
Policy_SD: 0.546
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 1.86e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.000177


ADV1:  -0.002084896476492153 0.008291417424755055 0.04872415262807156 -0.0939692154767926
ADV2:  0.04103471717248527 0.8609109604290346 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7569   0.9126   5.2671  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0014   0.0053   6.4661   2.1407   2.488

***** Episode 52027, Mean R = -12.0  Std R = 4.7  Min R = -26.0
PolicyLoss: -0.0276
Policy_Beta: 0.114
Policy_Entropy: 0.159
Policy_KL: 0.000878
Policy_SD: 0.522
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 1.87e+07
VF_0_ExplainedVarNew: 0.968
VF_0_ExplainedVarOld: 0.964
VF_0_Loss : 0.000135


ADV1:  -0.0037545001741112276 0.009725847272667915 0.037137429391618515 -0.05232158154544814
ADV2:  0.0442963459750634 0.915827986287061 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3359   1.4120   7.0912  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0040   0.0025   0.0097   6.4661   2.1407   2.4885
***** Episode 52058, Mean R = -14.0  Std R = 4.9  Min R = -24.0
PolicyLoss: -0.0163
Policy_Beta: 0.114
Policy_Entropy: 0.157
Policy_KL: 0.000819
Policy_SD: 0.546
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 1.87e+07
VF_0_ExplainedVarNew: 0.958
VF_0_ExplainedVarOld: 0.952
VF_0_Loss : 0.000184


ADV1:  0.0026440480456520784 0.00858207528691260

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0655   0.6774   3.7220  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0027   6.4661   2.1407   2.4885
***** Episode 52306, Mean R = -12.6  Std R = 5.4  Min R = -26.6
PolicyLoss: -0.0256
Policy_Beta: 0.114
Policy_Entropy: 0.157
Policy_KL: 0.000947
Policy_SD: 0.545
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.88e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 0.000496


ADV1:  -0.0023311199370014916 0.008903425055262442 0.03553140875718417 -0.05956236391184875
ADV2:  0.03705927220604137 0.8915367409353135 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3329   0.6992   3.6882  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0025   0.0016   0.0060   6.4661   2.1407   2.4885
***** Episode 52337, Mean R = -13.6  Std R = 4.5  Min R = -25.3
PolicyLoss: -0.0218
Policy_Beta: 0.114
Policy_Entropy: 0.16
Policy_KL: 0.0009

ADV1:  -0.0013728957577775435 0.006910572301339774 0.03249352494641006 -0.05837491340657269
ADV2:  0.03543512856580251 0.8583003211935505 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3528   0.6205   3.6598  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0010   0.0036   6.4661   2.1407   2.4885
***** Episode 52585, Mean R = -13.1  Std R = 5.7  Min R = -30.9
PolicyLoss: -0.0271
Policy_Beta: 0.114
Policy_Entropy: 0.157
Policy_KL: 0.0012
Policy_SD: 0.538
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 1.89e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 0.000522


ADV1:  0.0005190507127085557 0.006849040600166415 0.04985301323978411 -0.04838681920199523
ADV2:  0.0071876536949615835 0.8776247482763097 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9379   1.1574   6.5291  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0004   0.0013   6.4661   2.1407   2.

***** Episode 52833, Mean R = -12.6  Std R = 4.4  Min R = -22.5
PolicyLoss: -0.0242
Policy_Beta: 0.114
Policy_Entropy: 0.156
Policy_KL: 0.000922
Policy_SD: 0.538
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 1.9e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.00027


ADV1:  -0.000162688551189435 0.008591144375084436 0.03371668060956173 -0.05053040107952637
ADV2:  0.027328901767186164 0.85601834417166 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4890   0.6179   2.9121  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0004   0.0014   6.4661   2.1407   2.4885
***** Episode 52864, Mean R = -12.1  Std R = 4.2  Min R = -26.6
PolicyLoss: -0.0302
Policy_Beta: 0.114
Policy_Entropy: 0.158
Policy_KL: 0.000955
Policy_SD: 0.526
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.9e+07
VF_0_ExplainedVarNew: 0.961
VF_0_ExplainedVarOld: 0.957
VF_0_Loss : 0.000353


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.2067   1.3487   6.6248  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0005   6.4661   2.1407   2.4885
***** Episode 53112, Mean R = -13.4  Std R = 5.7  Min R = -30.0
PolicyLoss: -0.022
Policy_Beta: 0.114
Policy_Entropy: 0.159
Policy_KL: 0.00178
Policy_SD: 0.531
Policy_lr_mult: 0.132
Steps: 1.19e+04
TotalSteps: 1.91e+07
VF_0_ExplainedVarNew: 0.972
VF_0_ExplainedVarOld: 0.966
VF_0_Loss : 0.000454


ADV1:  -0.002193288728225069 0.009151721839347727 0.04965269692401242 -0.06094132320575589
ADV2:  0.03228152713800553 0.895181321046573 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0427   1.3932   7.1204  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0016   0.0057   6.4661   2.1407   2.4885
***** Episode 53143, Mean R = -13.3  Std R = 4.7  Min R = -23.2
PolicyLoss: -0.0181
Policy_Beta: 0.114
Policy_Entropy: 0.157
Policy_KL: 0.000987


ADV1:  0.0004866773664529118 0.007662714842946957 0.039535291616837914 -0.07165018180233246
ADV2:  0.020960548749904547 0.8262504690472147 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0659   0.9258   4.3497  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0024   6.4661   2.1407   2.4885
***** Episode 53391, Mean R = -12.5  Std R = 3.6  Min R = -22.7
PolicyLoss: -0.0309
Policy_Beta: 0.114
Policy_Entropy: 0.157
Policy_KL: 0.0011
Policy_SD: 0.541
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 1.92e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.97
VF_0_Loss : 0.000411


ADV1:  -0.0021017345785478104 0.008157474636391646 0.05885385709714552 -0.05671790225009692
ADV2:  0.03656687579585964 0.859441587720243 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8676   0.8647   4.1125  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0014   0.0055   6.4661   2.1407   2.48

cs_angles |  0.0002  0.0024 |  0.0753  0.0805 | -0.9892 -0.9982 |  0.9976  0.9916
optical_flow |  0.0001 -0.0001 |  0.0256  0.0246 | -1.1697 -1.2385 |  1.0768  1.0210
v_err    | -0.0094 |  0.0577 | -0.4534 |  0.1037
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -18.00 |    3.71 |  -31.30 |  -10.18
steps    |     379 |      20 |     332 |     417
***** Episode 53670, Mean R = -13.2  Std R = 4.9  Min R = -27.2
PolicyLoss: -0.0271
Policy_Beta: 0.114
Policy_Entropy: 0.158
Policy_KL: 0.00111
Policy_SD: 0.538
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.93e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.972
VF_0_Loss : 0.000288


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  0.00022415649955724465 0.00790189605851987 0.04388667369862059 -0.05430929458765582
ADV2:  0.017755300158709676 0.8782695344065302 3.0 -3.0
Policy  Gradients: u/sd/Max/

attitude |   -0.03    0.07    0.08 |    1.26    0.66    1.91 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.06    0.05 |    0.66    1.93 |   -1.40   -3.12 |    1.52    3.13
w_f      |    0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.70
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.98   -1.00 |    0.99    0.99
cs_angles |  0.0036  0.0012 |  0.0742  0.0825 | -0.9815 -0.9957 |  0.9872  0.9932
optical_flow | -0.0000 -0.0001 |  0.0253  0.0248 | -1.1186 -1.2410 |  1.0120  1.3512
v_err    | -0.0101 |  0.0579 | -0.4532 |  0.1099
landing_rewards |    9.52 |    2.15 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00   -0.00   -0.00 |    0.67    0.67    0.68 |   -3.40   -3.31   -3.40 |    3.45    3.19    3.40
norm_thrust |    0.89 |    0.75 |    0.00 |    3.46
fuel     |    1.52 |    0.21 |    1.04 |    2.18
rewards  |  -12.82 |    5.09 |  -31.97 |   -4.31
fuel_rewards |   -4.35 |    0.59 |   -6.26 |   -3.00
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.97 |   20.26 |    0.01 | 5426.96
norm_af  |    1.80 |    0.92 |    0.04 |    3.42
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.03   -0.01   -0.07 |    1.23    0.64    1.91 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00   -0.08 |    0.64

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1779   0.9412   5.7987  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0025   0.0016   0.0063   6.4661   2.1407   2.4885
Update Cnt = 1760    ET =   1047.6   Stats:  Mean, Std, Min, Max
r_f      |    0.37   -2.89  -10.90 |  187.23  169.48  200.32 | -388.54 -368.23 -391.51 |  389.23  387.06  394.79
v_f      |   -0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.14   -0.10   -0.11 |    0.09    0.10    0.10
r_i      |   10.52   14.25  -27.21 |  712.28  650.83  747.50 |-1276.20-1197.99-1262.78 | 1247.75 1363.19 1308.58
v_i      |   -0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.10   -0.09 |    0.10    0.09    0.09
norm_rf  |    0.21 |    0.08 |    0.04 |    0.55
norm_vf  |    0.08 |    0.01 |    0.04 |    0.17
gs_f     |    1.19 |    1.71 |    0.01 |   15.94
thrust   |   -0.00   -0.00    0.00 |    0.67    0.68    0.67 |   -3.45   -3.36   -3.40 |    3.39    3.43    3.44
norm_thrust |    

ADV1:  -0.00014184423841208998 0.006366133999338127 0.047889876261164394 -0.10554743702612457
ADV2:  0.004625003591187802 0.8246323294094345 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3284   0.4657   2.0995  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0004   6.4661   2.1407   2.4885
***** Episode 54879, Mean R = -13.8  Std R = 5.3  Min R = -24.5
PolicyLoss: -0.00572
Policy_Beta: 0.114
Policy_Entropy: 0.158
Policy_KL: 0.00121
Policy_SD: 0.551
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 1.98e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.000615


ADV1:  -0.0008896825596089491 0.006926803321219799 0.03862893984684518 -0.06983630623684367
ADV2:  0.028093038363384528 0.8496578977030123 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0318   0.4071   2.5755  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0008   0.0028   6.4661   2.1407 

***** Episode 55127, Mean R = -13.2  Std R = 4.1  Min R = -24.1
PolicyLoss: -0.00378
Policy_Beta: 0.114
Policy_Entropy: 0.159
Policy_KL: 0.00116
Policy_SD: 0.54
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 1.98e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.000259


ADV1:  -0.0008368539265140859 0.006152615254480233 0.03436683716299663 -0.0533835795061923
ADV2:  0.031171040429698874 0.8374107533722901 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4390   1.4875   6.2402  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0006   0.0021   6.4661   2.1407   2.4885
***** Episode 55158, Mean R = -12.3  Std R = 4.0  Min R = -22.9
PolicyLoss: -0.0263
Policy_Beta: 0.114
Policy_Entropy: 0.158
Policy_KL: 0.00111
Policy_SD: 0.528
Policy_lr_mult: 0.132
Steps: 1.19e+04
TotalSteps: 1.99e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 0.000215


ADV1:  -0.0003538419485869858 0.00561481494622463

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.7287   0.2455   1.3308  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0013   0.0055   6.4661   2.1407   2.4885
***** Episode 55406, Mean R = -13.6  Std R = 5.1  Min R = -24.4
PolicyLoss: -0.0291
Policy_Beta: 0.114
Policy_Entropy: 0.158
Policy_KL: 0.000827
Policy_SD: 0.546
Policy_lr_mult: 0.132
Steps: 1.19e+04
TotalSteps: 2e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 0.000265


ADV1:  0.0003426315050044271 0.007385559902647296 0.04195473205446468 -0.052924116870738336
ADV2:  0.01747588376395907 0.8522931374785937 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8850   0.3266   1.5127  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0009   6.4661   2.1407   2.4885
***** Episode 55437, Mean R = -10.9  Std R = 3.1  Min R = -18.9
PolicyLoss: -0.0244
Policy_Beta: 0.114
Policy_Entropy: 0.159
Policy_KL: 0.000825

ADV1:  -0.0023042009655518145 0.008185636812302178 0.07059522264007495 -0.0636138594280722
ADV2:  0.04949033709192297 0.8198391201168167 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2765   0.6542   3.7663  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0014   0.0060   6.4661   2.1407   2.4885
***** Episode 55685, Mean R = -12.4  Std R = 4.9  Min R = -23.2
PolicyLoss: -0.0305
Policy_Beta: 0.114
Policy_Entropy: 0.16
Policy_KL: 0.000973
Policy_SD: 0.544
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.01e+07
VF_0_ExplainedVarNew: 0.97
VF_0_ExplainedVarOld: 0.966
VF_0_Loss : 0.000726


ADV1:  -0.0018386622906371726 0.008810938076461723 0.034960140768535236 -0.07616161967962143
ADV2:  0.04045145916558942 0.8527677894238038 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2593   0.9508   4.7172  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0013   0.0047   6.4661   2.1407   2.4

***** Episode 55933, Mean R = -10.9  Std R = 3.5  Min R = -19.8
PolicyLoss: -0.00787
Policy_Beta: 0.114
Policy_Entropy: 0.157
Policy_KL: 0.00105
Policy_SD: 0.54
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 2.01e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.000181


ADV1:  0.0008672315542880268 0.007060215993294552 0.035663284081159596 -0.06205658130051017
ADV2:  0.008887134573025559 0.8972664120466037 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8916   0.6259   3.3822  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0023   6.4661   2.1407   2.4885
***** Episode 55964, Mean R = -14.7  Std R = 6.6  Min R = -31.2
PolicyLoss: -0.0191
Policy_Beta: 0.114
Policy_Entropy: 0.156
Policy_KL: 0.00102
Policy_SD: 0.548
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.02e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 8.8e-05


ADV1:  -0.0012118836830326686 0.00917437475667813 

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4271   0.8003   3.5672  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0030   0.0017   0.0068   6.4661   2.1407   2.4885
***** Episode 56212, Mean R = -14.1  Std R = 6.2  Min R = -33.0
PolicyLoss: -0.0263
Policy_Beta: 0.114
Policy_Entropy: 0.159
Policy_KL: 0.00102
Policy_SD: 0.544
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.03e+07
VF_0_ExplainedVarNew: 0.969
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 0.000852


ADV1:  -0.0018253014114275009 0.01103706266186693 0.05282666612339221 -0.07744197999527502
ADV2:  0.029606295631252503 0.8865980286752293 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4312   0.6173   2.9660  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0012   0.0047   6.4661   2.1407   2.4885
***** Episode 56243, Mean R = -15.8  Std R = 6.6  Min R = -36.3
PolicyLoss: -0.0213
Policy_Beta: 0.114
Policy_Entropy: 0.159
Policy_KL: 0.0008

ADV1:  0.0011128578187095688 0.008561794520566716 0.04334033075619234 -0.047077111875969205
ADV2:  0.0029712285665671094 0.9033179979610011 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1646   0.4835   2.2998  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0009   0.0034   6.4661   2.1407   2.4885
***** Episode 56491, Mean R = -14.4  Std R = 7.5  Min R = -36.7
PolicyLoss: -0.0172
Policy_Beta: 0.114
Policy_Entropy: 0.157
Policy_KL: 0.000953
Policy_SD: 0.563
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 2.04e+07
VF_0_ExplainedVarNew: 0.976
VF_0_ExplainedVarOld: 0.972
VF_0_Loss : 0.00275


ADV1:  0.0023298006459519464 0.006986473809995153 0.034264622248351695 -0.05395761984796074
ADV2:  -0.004520394338335301 0.8772773418430931 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9742   0.5701   2.4150  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0031   0.0018   0.0064   6.4661   2.1407 

seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    1.00    0.99
cs_angles |  0.0000  0.0035 |  0.0777  0.0847 | -0.9993 -0.9938 |  0.9959  0.9868
optical_flow |  0.0001 -0.0000 |  0.0252  0.0242 | -1.0825 -1.0756 |  1.1345  1.0867
v_err    | -0.0099 |  0.0585 | -0.4534 |  0.1134
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.05
tracking_rewards |  -18.31 |    4.40 |  -35.92 |   -9.48
steps    |     377 |      20 |     333 |     418
***** Episode 56770, Mean R = -12.2  Std R = 5.5  Min R = -32.3
PolicyLoss: -0.0204
Policy_Beta: 0.114
Policy_Entropy: 0.154
Policy_KL: 0.00127
Policy_SD: 0.551
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.05e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.000405


ADV1:  -0.0004903356973719533 0.007050284860590551 0.05777372952145454 -0.0741721808450958
ADV2:  0.024165356232969535 0.8147673959815535 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/M

w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04    0.15 |    0.69    1.76 |   -1.51   -3.13 |    1.49    3.10
w_f      |    0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.02   -0.03 |    0.05    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.26 |    0.00 |    1.60
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.96   -0.99 |    0.99    1.00
cs_angles |  0.0033  0.0038 |  0.0796  0.0809 | -0.9597 -0.9933 |  0.9936  0.9962
optical_flow | -0.0001 -0.0001 |  0.0248  0.0239 | -0.9985 -0.9378 |  1.1977  1.1288
v_err    | -0.0098 |  0.0577 | -0.4513 |  0.1198
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.03
tracking_rewards |  -18.08 |    4.21 |  -33.71 |  -11.09
steps    |     378 |  

thrust   |    0.00   -0.00   -0.00 |    0.67    0.69    0.67 |   -3.33   -3.41   -3.40 |    3.44    3.46    3.39
norm_thrust |    0.90 |    0.75 |    0.00 |    3.46
fuel     |    1.57 |    0.20 |    1.14 |    2.25
rewards  |  -12.49 |    4.59 |  -27.94 |   -4.69
fuel_rewards |   -4.51 |    0.56 |   -6.42 |   -3.27
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.85 |   12.87 |    0.00 |  295.72
norm_af  |    1.75 |    0.89 |    0.06 |    3.31
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.00   -0.03    0.10 |    1.17    0.65    1.83 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04    0.07 |    0.66

ADV1:  -0.0006288984138770949 0.006235294284762855 0.042836410672915326 -0.08346193320909634
ADV2:  0.01964525909075863 0.8753558032650876 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2572   0.7699   4.2387  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0025   6.4661   2.1407   2.4885
Update Cnt = 1860    ET =   1207.7   Stats:  Mean, Std, Min, Max
r_f      |  -10.23   -0.94  -22.63 |  182.21  160.65  196.22 | -392.13 -375.13 -395.94 |  377.30  388.64  364.53
v_f      |    0.00   -0.00    0.01 |    0.04    0.04    0.05 |   -0.09   -0.11   -0.09 |    0.10    0.09    0.09
r_i      |  -45.32  -10.05  -80.19 |  664.36  633.50  778.96 |-1373.71-1293.24-1288.11 | 1229.33 1256.52 1309.74
v_i      |    0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.08   -0.09   -0.10 |    0.10    0.09    0.10
norm_rf  |    0.20 |    0.08 |    0.03 |    0.45
norm_vf  |    0.07 |    0.01 |    0.04 |    0.12
gs_f     |    1.59 |    2.29 | 

***** Episode 57948, Mean R = -12.1  Std R = 4.0  Min R = -22.2
PolicyLoss: -0.0149
Policy_Beta: 0.114
Policy_Entropy: 0.159
Policy_KL: 0.000908
Policy_SD: 0.545
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.09e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.000251


ADV1:  -0.0005876857336951142 0.009256757584837627 0.0334331089515178 -0.0616719586831016
ADV2:  0.025523031177778245 0.8745800060593437 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1969   0.6097   2.9076  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0004   0.0015   6.4661   2.1407   2.4885
***** Episode 57979, Mean R = -13.0  Std R = 5.6  Min R = -28.2
PolicyLoss: -0.0247
Policy_Beta: 0.114
Policy_Entropy: 0.16
Policy_KL: 0.00102
Policy_SD: 0.541
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 2.09e+07
VF_0_ExplainedVarNew: 0.96
VF_0_ExplainedVarOld: 0.957
VF_0_Loss : 0.000303


ADV1:  0.0013014980026612001 0.0056718549012261445 0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0414   0.6699   3.5931  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0013   0.0047   6.4661   2.1407   2.4885
***** Episode 58227, Mean R = -13.4  Std R = 5.6  Min R = -27.7
PolicyLoss: -0.019
Policy_Beta: 0.114
Policy_Entropy: 0.159
Policy_KL: 0.000854
Policy_SD: 0.555
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 2.1e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.000425


ADV1:  0.00040338317648361147 0.007382242246470335 0.03905180529590646 -0.06029260002748566
ADV2:  0.020088221705536473 0.8398152388582092 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0958   1.1987   6.4037  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0026   6.4661   2.1407   2.4885
***** Episode 58258, Mean R = -13.4  Std R = 4.5  Min R = -22.7
PolicyLoss: -0.0281
Policy_Beta: 0.114
Policy_Entropy: 0.158
Policy_KL: 0.0012

ADV1:  -0.0014381080902500574 0.009153896271654966 0.030245743183996365 -0.09125870360177668
ADV2:  0.031129324567288646 0.8803077825000941 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7879   1.3553   7.1068  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0009   0.0036   6.4661   2.1407   2.4885
***** Episode 58506, Mean R = -13.5  Std R = 6.5  Min R = -34.4
PolicyLoss: -0.0237
Policy_Beta: 0.114
Policy_Entropy: 0.16
Policy_KL: 0.00105
Policy_SD: 0.538
Policy_lr_mult: 0.132
Steps: 1.19e+04
TotalSteps: 2.11e+07
VF_0_ExplainedVarNew: 0.964
VF_0_ExplainedVarOld: 0.961
VF_0_Loss : 0.000298


ADV1:  0.002818824672130457 0.0075040227053028066 0.05513216004990745 -0.05255391337389202
ADV2:  -0.008662583118710036 0.8696167339846484 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4599   1.3441   6.2054  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0022   0.0080   6.4661   2.1407   

***** Episode 58754, Mean R = -13.6  Std R = 5.2  Min R = -24.5
PolicyLoss: -0.0287
Policy_Beta: 0.114
Policy_Entropy: 0.16
Policy_KL: 0.000949
Policy_SD: 0.543
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 2.12e+07
VF_0_ExplainedVarNew: 0.97
VF_0_ExplainedVarOld: 0.965
VF_0_Loss : 0.000543


ADV1:  -0.0018024482549518742 0.007912560147644934 0.041457294826504065 -0.05913253959302241
ADV2:  0.0450166296250338 0.8264251185783953 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7635   0.8703   4.0472  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0013   0.0047   6.4661   2.1407   2.4885
***** Episode 58785, Mean R = -12.8  Std R = 5.3  Min R = -27.2
PolicyLoss: -0.0323
Policy_Beta: 0.114
Policy_Entropy: 0.16
Policy_KL: 0.00137
Policy_SD: 0.542
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.12e+07
VF_0_ExplainedVarNew: 0.97
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 0.000365


ADV1:  0.0017164858686189173 0.01088712755315817 0.0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1848   0.5835   2.3965  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0010   6.4661   2.1407   2.4885
***** Episode 59033, Mean R = -13.1  Std R = 4.8  Min R = -28.2
PolicyLoss: -0.0211
Policy_Beta: 0.114
Policy_Entropy: 0.159
Policy_KL: 0.000876
Policy_SD: 0.536
Policy_lr_mult: 0.132
Steps: 1.19e+04
TotalSteps: 2.13e+07
VF_0_ExplainedVarNew: 0.971
VF_0_ExplainedVarOld: 0.965
VF_0_Loss : 0.000234


ADV1:  -0.0035158542737193364 0.010156874286209547 0.03697221872992887 -0.06702093128771966
ADV2:  0.04074910911102598 0.8937722055957774 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8256   0.3432   1.4777  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0036   0.0023   0.0091   6.4661   2.1407   2.4885
***** Episode 59064, Mean R = -13.3  Std R = 5.7  Min R = -31.5
PolicyLoss: -0.0224
Policy_Beta: 0.114
Policy_Entropy: 0.162
Policy_KL: 0.000

ADV1:  -0.0007241412424816047 0.0061568719171742085 0.05854540816069659 -0.058725408047673316
ADV2:  0.011420138721556242 0.9061496668375384 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0216   1.1837   5.8322  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0019   6.4661   2.1407   2.4885
***** Episode 59312, Mean R = -12.7  Std R = 5.3  Min R = -31.1
PolicyLoss: -0.00674
Policy_Beta: 0.114
Policy_Entropy: 0.159
Policy_KL: 0.00139
Policy_SD: 0.543
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.14e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 8.62e-05


ADV1:  0.0022088903531695334 0.006847439017763598 0.07748161036367063 -0.05591478017677831
ADV2:  -0.013805819582635478 0.889077197680575 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5296   0.6319   2.6291  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0015   0.0058   6.4661   2.1407 

***** Episode 59560, Mean R = -13.9  Std R = 6.0  Min R = -32.5
PolicyLoss: -0.0149
Policy_Beta: 0.114
Policy_Entropy: 0.162
Policy_KL: 0.000985
Policy_SD: 0.558
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.15e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.000127


ADV1:  0.0005052551190729888 0.007629040910883255 0.04045186941595724 -0.06309921069977552
ADV2:  0.02592646746423651 0.818911941467299 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9790   0.5141   2.7915  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0004   0.0014   6.4661   2.1407   2.4885
***** Episode 59591, Mean R = -13.6  Std R = 5.8  Min R = -31.2
PolicyLoss: -0.035
Policy_Beta: 0.114
Policy_Entropy: 0.161
Policy_KL: 0.0011
Policy_SD: 0.544
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 2.15e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.000115


ADV1:  0.0009448528350809522 0.007001040619403367 0.

cs_angles |  0.0038  0.0021 |  0.0755  0.0804 | -0.9618 -0.9741 |  0.9910  0.9777
optical_flow |  0.0001 -0.0000 |  0.0249  0.0249 | -1.2423 -1.0729 |  1.0688  1.1233
v_err    | -0.0102 |  0.0580 | -0.4524 |  0.1106
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.03
tracking_rewards |  -17.89 |    4.17 |  -36.26 |  -10.76
steps    |     379 |      21 |     330 |     419
***** Episode 59870, Mean R = -12.5  Std R = 4.3  Min R = -23.2
PolicyLoss: -0.0255
Policy_Beta: 0.114
Policy_Entropy: 0.16
Policy_KL: 0.000984
Policy_SD: 0.533
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 2.16e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 0.000162


ADV1:  -0.0009742070779783673 0.015070987343276181 0.04287424243849347 -0.12171582356771393
ADV2:  0.038320802693809164 0.7848867447664994 2.8225066801112755 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2676   0.6634   3.8286  27.0893  20.3031  12.6669
Va

theta_cv |    0.25 |    0.25 |    0.00 |    1.73
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    1.00    0.98
cs_angles |  0.0024  0.0035 |  0.0768  0.0834 | -0.9980 -0.9884 |  0.9998  0.9845
optical_flow |  0.0000 -0.0000 |  0.0261  0.0250 | -1.0771 -1.1998 |  1.1127  1.1619
v_err    | -0.0100 |  0.0578 | -0.4515 |  0.1165
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.03
tracking_rewards |  -17.99 |    5.46 |  -78.64 |  -10.40
steps    |     376 |      20 |     333 |     419
***** Episode 60180, Mean R = -12.3  Std R = 3.9  Min R = -22.6
PolicyLoss: -0.0164
Policy_Beta: 0.114
Policy_Entropy: 0.16
Policy_KL: 0.000968
Policy_SD: 0.538
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 2.18e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.000232


ADV1:  -0.0008534480963951938 0.005836808957243586 0.044722839923927005 -0.07037512753932346
ADV2:  0.01863553961626622 0.88882507150

attitude |    0.14    0.02   -0.03 |    1.16    0.64    1.79 |   -3.14   -1.57   -3.14 |    3.14    1.52    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02   -0.06 |    0.65    1.78 |   -1.49   -3.12 |    1.46    3.13
w_f      |    0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.85
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.98 |    1.00    0.99
cs_angles |  0.0013  0.0018 |  0.0804  0.0803 | -0.9971 -0.9779 |  0.9960  0.9877
optical_flow | -0.0001 -0.0002 |  0.0247  0.0240 | -1.0957 -1.0985 |  0.9793  1.1391
v_err    | -0.0103 |  0.0582 | -0.4527 |  0.1164
landing_rewards |    9.81 |    1.38 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.04    0.02   -0.01 |    1.18    0.62    1.86 |   -3.14   -1.56   -3.14 |    3.14    1.53    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.03 |    0.62    1.85 |   -1.41   -3.12 |    1.51    3.13
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.58
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.98 |    0.96    0.96
cs_angles |  0.0022  0.0037 |  0.0763  0.0809 | -0.9860 -0.9813 |  0.9624  0.9609
optical_flow |  0.0000 -0.0000 |  0.0243  0.0227 | -0.9901 -1.2289 |  1.1011  1.0835
v_err    | -0.0095 |  0.0582 | -0.4517 |  0.1107
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.00   -0.02    0.03 |    1.09    0.67    1.75 |   -3.14   -1.53   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01   -0.01 |    0.66    1.75 |   -1.36   -3.13 |    1.46    3.07
w_f      |   -0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.04    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.26 |    0.00 |    1.59
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.94   -0.99 |    0.98    0.97
cs_angles |  0.0037  0.0036 |  0.0802  0.0809 | -0.9354 -0.9874 |  0.9849  0.9724
optical_flow | -0.0000 -0.0000 |  0.0257  0.0233 | -1.1294 -1.1302 |  1.0846  1.0813
v_err    | -0.0096 |  0.0575 | -0.4528 |  0.1086
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00    0.00   -0.00 |    0.67    0.68    0.69 |   -3.45   -3.40   -3.30 |    3.30    3.43    3.44
norm_thrust |    0.90 |    0.75 |    0.00 |    3.46
fuel     |    1.56 |    0.19 |    1.16 |    2.21
rewards  |  -12.72 |    5.01 |  -39.51 |   -3.29
fuel_rewards |   -4.48 |    0.54 |   -6.33 |   -3.33
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.94 |   17.04 |    0.01 | 3599.81
norm_af  |    1.85 |    0.90 |    0.07 |    3.25
norm_wf  |    0.02 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.04   -0.06    0.14 |    1.30    0.70    1.92 |   -3.14   -1.56   -3.14 |    3.14    1.53    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.06    0.18 |    0.71

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9119   1.1030   5.9543  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0014   0.0054   6.4661   2.1407   2.4885
Update Cnt = 1990    ET =   1053.0   Stats:  Mean, Std, Min, Max
r_f      |   -9.27   15.21   -1.37 |  185.29  182.05  192.26 | -393.27 -393.97 -390.40 |  380.07  382.42  373.16
v_f      |   -0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.10   -0.08 |    0.10    0.09    0.11
r_i      |   10.09   28.73    8.36 |  658.11  693.47  753.68 |-1318.20-1345.53-1282.86 | 1318.50 1325.36 1268.71
v_i      |   -0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.09    0.09
norm_rf  |    0.20 |    0.08 |    0.03 |    0.50
norm_vf  |    0.07 |    0.01 |    0.04 |    0.12
gs_f     |    1.30 |    2.39 |    0.01 |   23.99
thrust   |   -0.00   -0.00    0.01 |    0.68    0.68    0.69 |   -3.39   -3.42   -3.37 |    3.22    3.45    3.46
norm_thrust |    

ADV1:  -0.0012296526036504475 0.008801066196605216 0.03333715826757089 -0.06784739626522374
ADV2:  0.03528479420932787 0.8508480270028574 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2123   0.6893   3.9215  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0008   0.0031   6.4661   2.1407   2.4885
***** Episode 62009, Mean R = -13.3  Std R = 5.5  Min R = -26.8
PolicyLoss: -0.0297
Policy_Beta: 0.114
Policy_Entropy: 0.161
Policy_KL: 0.000892
Policy_SD: 0.536
Policy_lr_mult: 0.132
Steps: 1.19e+04
TotalSteps: 2.24e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.964
VF_0_Loss : 0.000169


ADV1:  0.0007935515185322928 0.006553699466575488 0.043616973454735364 -0.05192106949393122
ADV2:  0.013477201528907697 0.8315680582054903 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7396   1.4724   7.2826  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0024   6.4661   2.1407   

***** Episode 62257, Mean R = -13.6  Std R = 6.0  Min R = -37.8
PolicyLoss: -0.00436
Policy_Beta: 0.114
Policy_Entropy: 0.162
Policy_KL: 0.00083
Policy_SD: 0.551
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.25e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.000476


ADV1:  -0.0012695024614288852 0.009552930415894197 0.04228946979625364 -0.07618966143556422
ADV2:  0.03075050810981586 0.86537343999106 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3051   0.6287   3.0383  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0009   0.0032   6.4661   2.1407   2.4885
***** Episode 62288, Mean R = -13.5  Std R = 5.6  Min R = -28.9
PolicyLoss: -0.0275
Policy_Beta: 0.114
Policy_Entropy: 0.161
Policy_KL: 0.000954
Policy_SD: 0.543
Policy_lr_mult: 0.132
Steps: 1.15e+04
TotalSteps: 2.25e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.962
VF_0_Loss : 0.000521


ADV1:  -0.00033972072989358004 0.00654294854288527

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1860   0.5232   2.3208  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0017   0.0069   6.4661   2.1407   2.4885
***** Episode 62536, Mean R = -14.2  Std R = 6.0  Min R = -30.7
PolicyLoss: -0.0273
Policy_Beta: 0.114
Policy_Entropy: 0.16
Policy_KL: 0.00105
Policy_SD: 0.55
Policy_lr_mult: 0.132
Steps: 1.19e+04
TotalSteps: 2.26e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.000275


ADV1:  0.00044834115434465045 0.007250440158489243 0.04326025441872433 -0.05688559467174509
ADV2:  0.022200906838170574 0.8374884375924065 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5690   0.8263   3.8239  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0012   6.4661   2.1407   2.4885
***** Episode 62567, Mean R = -13.6  Std R = 6.2  Min R = -34.0
PolicyLoss: -0.0314
Policy_Beta: 0.114
Policy_Entropy: 0.161
Policy_KL: 0.000978

ADV1:  -0.000982527372365387 0.007077534676990775 0.03464684088279135 -0.04711600508660618
ADV2:  0.029671366491471257 0.8726621228285526 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8286   1.2676   6.3427  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0008   0.0028   6.4661   2.1407   2.4885
***** Episode 62815, Mean R = -13.1  Std R = 5.0  Min R = -23.4
PolicyLoss: -0.0246
Policy_Beta: 0.114
Policy_Entropy: 0.158
Policy_KL: 0.0012
Policy_SD: 0.562
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 2.27e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 0.000347


ADV1:  0.00124970405459552 0.009222603452046894 0.04256198221529206 -0.057274762124970895
ADV2:  0.013190370825303763 0.8581068505997415 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1244   0.9966   4.9033  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0033   6.4661   2.1407   2.48

***** Episode 63063, Mean R = -11.7  Std R = 5.0  Min R = -22.7
PolicyLoss: -0.0262
Policy_Beta: 0.114
Policy_Entropy: 0.163
Policy_KL: 0.000977
Policy_SD: 0.541
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 2.28e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.000586


ADV1:  -0.0022806661900145043 0.0055910046822301345 0.03118827476648478 -0.045620114914584675
ADV2:  0.04227956441169832 0.8904626503118841 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3626   1.0548   4.8662  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0014   0.0059   6.4661   2.1407   2.4885
***** Episode 63094, Mean R = -11.5  Std R = 4.1  Min R = -25.7
PolicyLoss: -0.0166
Policy_Beta: 0.114
Policy_Entropy: 0.16
Policy_KL: 0.00127
Policy_SD: 0.543
Policy_lr_mult: 0.132
Steps: 1.19e+04
TotalSteps: 2.28e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.000351


ADV1:  0.0012932434476736092 0.00684913702551136

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0640   0.9682   5.1646  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0013   0.0056   6.4661   2.1407   2.4885
***** Episode 63342, Mean R = -12.5  Std R = 6.2  Min R = -28.6
PolicyLoss: -0.0247
Policy_Beta: 0.114
Policy_Entropy: 0.161
Policy_KL: 0.00121
Policy_SD: 0.533
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 2.29e+07
VF_0_ExplainedVarNew: 0.962
VF_0_ExplainedVarOld: 0.958
VF_0_Loss : 0.000205


ADV1:  0.003090214287802597 0.009266974751845002 0.03448304431441044 -0.07491206494079014
ADV2:  -0.008014477796283606 0.9140918791376205 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9642   0.7269   4.4620  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0022   0.0080   6.4661   2.1407   2.4885
***** Episode 63373, Mean R = -13.9  Std R = 5.2  Min R = -27.7
PolicyLoss: -0.0176
Policy_Beta: 0.114
Policy_Entropy: 0.161
Policy_KL: 0.0014

ADV1:  0.0013805290269698705 0.008587049011362006 0.06749212606551819 -0.05943127284538212
ADV2:  0.01168974700611518 0.8436039309788788 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6006   1.0400   5.5827  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0010   0.0037   6.4661   2.1407   2.4885
***** Episode 63621, Mean R = -12.6  Std R = 4.9  Min R = -21.9
PolicyLoss: -0.0268
Policy_Beta: 0.114
Policy_Entropy: 0.163
Policy_KL: 0.0013
Policy_SD: 0.537
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 2.3e+07
VF_0_ExplainedVarNew: 0.969
VF_0_ExplainedVarOld: 0.966
VF_0_Loss : 0.000184


ADV1:  -0.000566081997186396 0.004955772646849796 0.030468476205073702 -0.04920714300397336
ADV2:  0.013159907193744977 0.8968223292547397 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8079   1.0948   5.8579  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0004   0.0015   6.4661   2.1407   2.48

theta_cv |    0.24 |    0.25 |    0.00 |    1.75
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    1.00    1.00
cs_angles |  0.0022  0.0030 |  0.0754  0.0802 | -0.9904 -0.9988 |  0.9962  1.0000
optical_flow |  0.0000 -0.0000 |  0.0240  0.0241 | -1.3053 -1.1810 |  0.8810  1.1183
v_err    | -0.0097 |  0.0574 | -0.4530 |  0.1076
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -17.45 |    4.60 |  -61.01 |  -10.46
steps    |     376 |      20 |     337 |     416
***** Episode 63900, Mean R = -12.4  Std R = 5.4  Min R = -27.6
PolicyLoss: -0.0266
Policy_Beta: 0.114
Policy_Entropy: 0.162
Policy_KL: 0.00126
Policy_SD: 0.55
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.32e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 0.000181


ADV1:  -0.000991501456049909 0.006760482010368106 0.05520753621489771 -0.05410547928121986
ADV2:  0.030222423732778173 0.8391786166241

w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.07 |    0.63    1.86 |   -1.49   -3.12 |    1.51    3.14
w_f      |   -0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.26 |    0.00 |    1.56
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.97   -1.00 |    1.00    0.99
cs_angles |  0.0012  0.0018 |  0.0761  0.0823 | -0.9741 -0.9981 |  0.9980  0.9931
optical_flow | -0.0001  0.0001 |  0.0248  0.0240 | -1.2219 -1.0980 |  1.1295  1.1765
v_err    | -0.0099 |  0.0578 | -0.4536 |  0.1093
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -17.84 |    4.05 |  -32.35 |  -10.59
steps    |     378 |  

attitude |    0.01    0.03    0.04 |    1.20    0.68    1.92 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03    0.07 |    0.68    1.93 |   -1.41   -3.10 |    1.45    3.14
w_f      |    0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.04    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.49
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.96 |    0.98    1.00
cs_angles |  0.0028  0.0043 |  0.0783  0.0795 | -0.9989 -0.9622 |  0.9845  0.9989
optical_flow |  0.0002 -0.0000 |  0.0233  0.0236 | -1.0008 -1.2057 |  1.0150  1.0563
v_err    | -0.0097 |  0.0580 | -0.4534 |  0.1040
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.06    0.02   -0.07 |    1.13    0.63    1.79 |   -3.14   -1.50   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02   -0.03 |    0.64    1.79 |   -1.49   -3.12 |    1.33    3.11
w_f      |   -0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.04    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.52
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    0.99    0.99
cs_angles |  0.0046  0.0045 |  0.0765  0.0798 | -0.9933 -0.9967 |  0.9853  0.9876
optical_flow | -0.0001  0.0000 |  0.0238  0.0242 | -1.0885 -0.9693 |  0.9940  1.0130
v_err    | -0.0095 |  0.0577 | -0.4523 |  0.1035
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.03    0.02    0.07 |    1.08    0.65    1.81 |   -3.14   -1.54   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.00 |    0.65    1.83 |   -1.43   -3.13 |    1.46    3.14
w_f      |    0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.24 |    0.00 |    1.56
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -0.99 |    1.00    1.00
cs_angles |  0.0022  0.0029 |  0.0749  0.0807 | -0.9935 -0.9933 |  0.9979  0.9987
optical_flow | -0.0001 -0.0001 |  0.0248  0.0246 | -1.3245 -1.2072 |  1.0831  1.0709
v_err    | -0.0097 |  0.0577 | -0.4525 |  0.0963
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.06    0.07    0.05 |    1.17    0.64    1.88 |   -3.14   -1.54   -3.14 |    3.14    1.54    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.06    0.05    0.05
a_f      |    0.06    0.09 |    0.64    1.87 |   -1.49   -3.11 |    1.43    3.12
w_f      |    0.00   -0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.04    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.06 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.26 |    0.00 |    1.62
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    0.96    0.99
cs_angles | -0.0001  0.0007 |  0.0796  0.0848 | -0.9982 -0.9864 |  0.9598  0.9899
optical_flow |  0.0001 -0.0001 |  0.0240  0.0234 | -1.0886 -1.1251 |  1.3238  1.1542
v_err    | -0.0099 |  0.0576 | -0.4515 |  0.1087
landing_rewards |    9.52 |    2.15 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.08    0.03    0.00 |    1.24    0.66    1.91 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03   -0.09 |    0.67    1.91 |   -1.52   -3.14 |    1.40    3.11
w_f      |    0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.48
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -1.00   -0.99 |    1.00    0.98
cs_angles |  0.0027  0.0031 |  0.0749  0.0804 | -0.9987 -0.9855 |  0.9970  0.9768
optical_flow |  0.0000  0.0000 |  0.0245  0.0237 | -1.1603 -0.9989 |  1.2262  1.1106
v_err    | -0.0101 |  0.0577 | -0.4516 |  0.1069
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.08   -0.01   -0.02 |    1.22    0.67    1.93 |   -3.14   -1.55   -3.14 |    3.14    1.54    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.01 |    0.66    1.93 |   -1.43   -3.14 |    1.47    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.02 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.24 |    0.00 |    1.65
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.97   -1.00 |    1.00    0.99
cs_angles |  0.0015  0.0028 |  0.0733  0.0798 | -0.9728 -0.9976 |  0.9957  0.9935
optical_flow |  0.0001 -0.0001 |  0.0247  0.0250 | -1.0623 -1.1716 |  1.0823  1.0121
v_err    | -0.0100 |  0.0577 | -0.4531 |  0.1213
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.05   -0.05 |    0.64    1.84 |   -1.50   -3.13 |    1.45    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.66
seeker_angles |    0.00    0.01 |    0.07    0.08 |   -0.95   -0.99 |    0.99    1.00
cs_angles |  0.0014  0.0053 |  0.0748  0.0815 | -0.9497 -0.9950 |  0.9905  0.9983
optical_flow |  0.0001 -0.0001 |  0.0227  0.0237 | -1.1249 -1.0318 |  0.9903  1.1264
v_err    | -0.0100 |  0.0577 | -0.4524 |  0.1115
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.07 |    0.03
tracking_rewards |  -17.68 |    4.25 |  -43.04 |  -10.84
steps    |     376 |  

w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03    0.18 |    0.64    1.85 |   -1.53   -3.11 |    1.50    3.11
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.76
seeker_angles |    0.01    0.00 |    0.07    0.08 |   -0.98   -1.00 |    0.98    0.99
cs_angles |  0.0052  0.0041 |  0.0747  0.0817 | -0.9845 -0.9961 |  0.9789  0.9854
optical_flow | -0.0002 -0.0002 |  0.0246  0.0228 | -1.1808 -1.1152 |  1.0863  1.0162
v_err    | -0.0103 |  0.0580 | -0.4511 |  0.1170
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.03
tracking_rewards |  -17.84 |    4.38 |  -41.24 |  -10.92
steps    |     380 |  

attitude |   -0.10    0.02    0.01 |    1.11    0.64    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.01 |    0.64    1.82 |   -1.42   -3.10 |    1.53    3.10
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.26 |    0.00 |    1.52
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.97   -1.00 |    1.00    1.00
cs_angles |  0.0002  0.0035 |  0.0777  0.0833 | -0.9680 -0.9987 |  0.9972  0.9984
optical_flow |  0.0001 -0.0000 |  0.0227  0.0237 | -1.0087 -1.1136 |  1.0405  1.1170
v_err    | -0.0106 |  0.0579 | -0.4529 |  0.1122
landing_rewards |    9.52 |    2.15 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.15    0.04   -0.14 |    1.17    0.66    1.88 |   -3.14   -1.53   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.05   -0.13 |    0.66    1.88 |   -1.49   -3.13 |    1.46    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.05 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.54
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    0.99    0.99
cs_angles |  0.0034  0.0042 |  0.0762  0.0833 | -0.9984 -0.9873 |  0.9945  0.9880
optical_flow |  0.0001 -0.0001 |  0.0250  0.0248 | -0.9954 -1.0582 |  1.2199  1.1615
v_err    | -0.0106 |  0.0582 | -0.4535 |  0.1116
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.09    0.02    0.01 |    1.12    0.69    1.81 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02   -0.04 |    0.70    1.83 |   -1.43   -3.13 |    1.55    3.12
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.53
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.96 |    0.99    0.99
cs_angles |  0.0028  0.0004 |  0.0782  0.0816 | -0.9980 -0.9597 |  0.9932  0.9896
optical_flow | -0.0001  0.0000 |  0.0244  0.0241 | -1.1618 -1.1548 |  1.1108  1.1168
v_err    | -0.0108 |  0.0579 | -0.4525 |  0.1012
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.05    0.02   -0.22 |    1.11    0.65    1.78 |   -3.14   -1.57   -3.14 |    3.14    1.51    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03   -0.22 |    0.65    1.78 |   -1.46   -3.14 |    1.40    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.05    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.51
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.96 |    0.98    0.99
cs_angles |  0.0024  0.0040 |  0.0774  0.0801 | -0.9876 -0.9624 |  0.9779  0.9902
optical_flow | -0.0000 -0.0000 |  0.0244  0.0236 | -1.1666 -1.1492 |  1.0809  1.1987
v_err    | -0.0104 |  0.0575 | -0.4525 |  0.1059
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.01    0.00    0.00 |    0.66    0.66    0.67 |   -3.46   -3.30   -3.46 |    3.38    3.29    3.40
norm_thrust |    0.87 |    0.75 |    0.00 |    3.46
fuel     |    1.50 |    0.20 |    1.07 |    2.38
rewards  |  -12.33 |    5.64 |  -46.49 |   -3.62
fuel_rewards |   -4.31 |    0.56 |   -6.83 |   -3.07
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.95 |   12.59 |    0.01 |  315.07
norm_af  |    1.73 |    0.92 |    0.04 |    3.35
norm_wf  |    0.02 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.01   -0.04    0.06 |    1.20    0.66    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02    0.03 |    0.66

ADV1:  0.0014652559896057825 0.008794730077575806 0.05998399425629408 -0.061152518054237825
ADV2:  0.006724406972690693 0.8737023614121944 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6516   0.8018   4.5082  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0011   0.0043   6.4661   2.1407   2.4885
Update Cnt = 2210    ET =   1064.3   Stats:  Mean, Std, Min, Max
r_f      |    7.07   -5.79   -0.55 |  176.84  171.17  201.34 | -368.09 -376.51 -374.45 |  395.58  371.47  379.87
v_f      |   -0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.11   -0.09   -0.10 |    0.09    0.10    0.09
r_i      |   30.34  -31.08   13.18 |  662.66  673.81  760.88 |-1263.37-1281.68-1264.42 | 1288.94 1243.51 1319.39
v_i      |   -0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.09    0.09    0.09
norm_rf  |    0.19 |    0.07 |    0.02 |    0.47
norm_vf  |    0.08 |    0.01 |    0.04 |    0.12
gs_f     |    1.25 |    1.86 | 

Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  -0.001758631828062532 0.00851932800041464 0.039151149273704 -0.061042456834337205
ADV2:  0.045491163721053086 0.8297512828135999 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6207   1.1303   5.9012  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0012   0.0046   6.4661   2.1407   2.4885
***** Episode 68829, Mean R = -12.5  Std R = 3.6  Min R = -22.1
PolicyLoss: -0.0343
Policy_Beta: 0.114
Policy_Entropy: 0.167
Policy_KL: 0.000824
Policy_SD: 0.525
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.5e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.962
VF_0_Loss : 0.000333


ADV1:  0.0007164430574310213 0.009967865222510244 0.03507733881049224 -0.094713839325887
ADV2:  0.01632678299095094 0.8731896900088023 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9880   1.0202   4.0491  27.0893  20.3031  12.6669
ValFun  Gr

***** Episode 69077, Mean R = -12.5  Std R = 3.8  Min R = -23.2
PolicyLoss: -0.0162
Policy_Beta: 0.114
Policy_Entropy: 0.165
Policy_KL: 0.00113
Policy_SD: 0.539
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 2.51e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.000256


ADV1:  0.0012196145842534242 0.007269687554055808 0.0397988301102285 -0.06503334080225226
ADV2:  0.008500298621605434 0.8409100233316364 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.7351   0.3222   1.7511  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0032   6.4661   2.1407   2.4885
***** Episode 69108, Mean R = -12.3  Std R = 3.9  Min R = -27.3
PolicyLoss: -0.0255
Policy_Beta: 0.114
Policy_Entropy: 0.165
Policy_KL: 0.000805
Policy_SD: 0.539
Policy_lr_mult: 0.132
Steps: 1.15e+04
TotalSteps: 2.51e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.00023


ADV1:  -0.0001474875127998899 0.006118685092564004

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1481   0.4674   2.0977  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0010   0.0033   6.4661   2.1407   2.4885
***** Episode 69356, Mean R = -11.9  Std R = 3.2  Min R = -21.9
PolicyLoss: -0.0249
Policy_Beta: 0.114
Policy_Entropy: 0.164
Policy_KL: 0.000874
Policy_SD: 0.534
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.52e+07
VF_0_ExplainedVarNew: 0.972
VF_0_ExplainedVarOld: 0.968
VF_0_Loss : 0.000283


ADV1:  -0.001213607594049523 0.007808244112052613 0.03874879011470217 -0.07119728303520811
ADV2:  0.03826355173688652 0.8403305459994993 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2645   1.2450   6.7945  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0011   0.0040   6.4661   2.1407   2.4885
***** Episode 69387, Mean R = -14.1  Std R = 5.3  Min R = -31.2
PolicyLoss: -0.0307
Policy_Beta: 0.114
Policy_Entropy: 0.166
Policy_KL: 0.0009

Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  -0.0009014113784231105 0.010286356535036137 0.0356624857926126 -0.055700064703115296
ADV2:  0.02694982660051283 0.8814334660073 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0279   1.0230   5.0833  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0007   0.0025   6.4661   2.1407   2.4885
***** Episode 69635, Mean R = -13.7  Std R = 5.2  Min R = -24.3
PolicyLoss: -0.0239
Policy_Beta: 0.114
Policy_Entropy: 0.166
Policy_KL: 0.00117
Policy_SD: 0.544
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 2.53e+07
VF_0_ExplainedVarNew: 0.956
VF_0_ExplainedVarOld: 0.952
VF_0_Loss : 0.000177


ADV1:  -0.001350493771826985 0.008216505080114978 0.0459658183140183 -0.07125841367304943
ADV2:  0.039885946376496985 0.8242943589208129 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3640   0.6114   2.7546  27.0893  20.3031  12.6669
ValFun  G

***** Episode 69883, Mean R = -11.7  Std R = 3.9  Min R = -20.1
PolicyLoss: 0.0191
Policy_Beta: 0.114
Policy_Entropy: 0.165
Policy_KL: 0.000948
Policy_SD: 0.526
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.54e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 6.04e-05


ADV1:  0.0006471316559929229 0.0052424842619678575 0.065278935091174 -0.04472517298203571
ADV2:  -0.009777336109313717 0.8952147990446095 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8502   1.0477   5.8934  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0016   6.4661   2.1407   2.4885
***** Episode 69914, Mean R = -11.5  Std R = 2.4  Min R = -16.1
PolicyLoss: 0.000397
Policy_Beta: 0.114
Policy_Entropy: 0.167
Policy_KL: 0.00105
Policy_SD: 0.515
Policy_lr_mult: 0.132
Steps: 1.19e+04
TotalSteps: 2.54e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 3.46e-05


ADV1:  -0.00013145188757601465 0.006596121819555

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0493   0.8883   4.9233  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0023   6.4661   2.1407   2.4885
***** Episode 70162, Mean R = -14.3  Std R = 5.9  Min R = -28.7
PolicyLoss: -0.00206
Policy_Beta: 0.114
Policy_Entropy: 0.163
Policy_KL: 0.0013
Policy_SD: 0.557
Policy_lr_mult: 0.132
Steps: 1.15e+04
TotalSteps: 2.55e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 9.15e-05


ADV1:  -0.00046426626846615904 0.005721252163297279 0.04169089422965938 -0.08864593365913154
ADV2:  0.019518068550391364 0.8720021034933753 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0041   0.4650   2.6554  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0015   6.4661   2.1407   2.4885
***** Episode 70193, Mean R = -11.6  Std R = 4.3  Min R = -24.2
PolicyLoss: -0.0171
Policy_Beta: 0.114
Policy_Entropy: 0.167
Policy_KL: 0.00

ADV1:  -0.0003452623229936378 0.006068648491524255 0.04417572364408387 -0.04492687899475223
ADV2:  0.0038902585707043117 0.8925462916897534 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4030   1.3153   7.2628  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0013   6.4661   2.1407   2.4885
***** Episode 70441, Mean R = -12.0  Std R = 5.1  Min R = -28.0
PolicyLoss: -0.00233
Policy_Beta: 0.114
Policy_Entropy: 0.166
Policy_KL: 0.00123
Policy_SD: 0.54
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 2.56e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 4.58e-05


ADV1:  -0.0003612311411085382 0.005935953327353974 0.04979153592469421 -0.08977057013546452
ADV2:  0.012476328012692467 0.8541479761331863 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.0236   1.5465   7.6547  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0011   6.4661   2.1407  

cs_angles |  0.0013  0.0008 |  0.0750  0.0805 | -0.9754 -0.9835 |  0.9632  0.9994
optical_flow |  0.0000  0.0000 |  0.0235  0.0235 | -1.1084 -1.0432 |  1.1910  1.0182
v_err    | -0.0102 |  0.0577 | -0.4533 |  0.1082
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -17.49 |    3.94 |  -33.38 |  -10.92
steps    |     377 |      21 |     332 |     419
***** Episode 70720, Mean R = -12.8  Std R = 5.3  Min R = -29.3
PolicyLoss: -0.0161
Policy_Beta: 0.114
Policy_Entropy: 0.167
Policy_KL: 0.000791
Policy_SD: 0.523
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 2.57e+07
VF_0_ExplainedVarNew: 0.95
VF_0_ExplainedVarOld: 0.947
VF_0_Loss : 0.000225


ADV1:  -0.0010848740534382553 0.0057777255211589095 0.039207618508981634 -0.0519873632529933
ADV2:  0.02099611989771279 0.907322609648393 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5613   0.5742   2.9101  27.0893  20.3031  12.6669
ValFun  Gradients:

attitude |   -0.06    0.03    0.01 |    1.20    0.66    1.86 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04   -0.05 |    0.66    1.85 |   -1.52   -3.13 |    1.48    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.04    0.02    0.03
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.51
seeker_angles |   -0.00    0.01 |    0.08    0.08 |   -0.99   -0.98 |    0.98    0.97
cs_angles | -0.0010  0.0055 |  0.0764  0.0829 | -0.9942 -0.9844 |  0.9826  0.9679
optical_flow | -0.0000 -0.0000 |  0.0236  0.0231 | -1.0843 -1.0984 |  0.9104  1.0244
v_err    | -0.0099 |  0.0575 | -0.4527 |  0.1037
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.00   -0.01    0.02 |    1.16    0.66    1.81 |   -3.14   -1.54   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00    0.05 |    0.66    1.81 |   -1.49   -3.14 |    1.45    3.13
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.03    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.64
seeker_angles |   -0.00   -0.00 |    0.08    0.08 |   -0.98   -0.98 |    0.99    0.99
cs_angles | -0.0014 -0.0004 |  0.0766  0.0811 | -0.9768 -0.9795 |  0.9877  0.9903
optical_flow | -0.0000 -0.0001 |  0.0234  0.0234 | -1.2473 -1.0463 |  0.9930  1.2062
v_err    | -0.0101 |  0.0580 | -0.4530 |  0.1145
landing_rewards |    9.42 |    2.34 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.07    0.02   -0.09 |    1.11    0.65    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.09 |    0.65    1.80 |   -1.46   -3.12 |    1.42    3.12
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.46
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -1.00 |    0.99    0.96
cs_angles |  0.0019  0.0031 |  0.0730  0.0822 | -0.9856 -0.9971 |  0.9939  0.9603
optical_flow |  0.0000 -0.0001 |  0.0247  0.0238 | -1.0036 -1.2693 |  1.1979  1.1047
v_err    | -0.0101 |  0.0573 | -0.4535 |  0.1174
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.01    0.05    0.04 |    1.17    0.63    1.85 |   -3.14   -1.54   -3.14 |    3.14    1.54    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.05    0.09 |    0.63    1.85 |   -1.42   -3.13 |    1.49    3.13
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.24 |    0.00 |    1.53
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -0.94 |    0.98    0.99
cs_angles |  0.0018  0.0014 |  0.0735  0.0778 | -0.9879 -0.9390 |  0.9838  0.9940
optical_flow | -0.0001 -0.0001 |  0.0234  0.0231 | -1.0236 -0.8513 |  1.1718  1.0082
v_err    | -0.0105 |  0.0579 | -0.4527 |  0.1028
landing_rewards |    9.81 |    1.38 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.04   -0.04    0.04 |    1.22    0.64    1.88 |   -3.14   -1.54   -3.14 |    3.14    1.53    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.05    0.10 |    0.64    1.89 |   -1.49   -3.12 |    1.33    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.05    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.62
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.97 |    0.98    1.00
cs_angles |  0.0012  0.0012 |  0.0796  0.0806 | -0.9931 -0.9722 |  0.9753  0.9997
optical_flow |  0.0001 -0.0000 |  0.0246  0.0242 | -1.1661 -1.0452 |  1.0730  1.0389
v_err    | -0.0105 |  0.0573 | -0.4520 |  0.1032
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.01   -0.02    0.15 |    1.17    0.64    1.89 |   -3.14   -1.52   -3.14 |    3.14    1.52    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01    0.23 |    0.65    1.89 |   -1.47   -3.13 |    1.50    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.86
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    0.99    0.99
cs_angles |  0.0012  0.0006 |  0.0755  0.0787 | -0.9962 -0.9913 |  0.9897  0.9931
optical_flow |  0.0001 -0.0001 |  0.0238  0.0235 | -1.0943 -1.3285 |  0.9159  1.1513
v_err    | -0.0102 |  0.0575 | -0.4529 |  0.1047
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.07   -0.05   -0.13 |    1.26    0.68    1.92 |   -3.14   -1.57   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.06   -0.07 |    0.69    1.93 |   -1.53   -3.13 |    1.54    3.11
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.24 |    0.00 |    1.55
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -1.00   -0.98 |    1.00    0.99
cs_angles |  0.0016  0.0032 |  0.0747  0.0781 | -0.9956 -0.9824 |  0.9993  0.9871
optical_flow | -0.0000  0.0001 |  0.0248  0.0235 | -1.2400 -0.9029 |  1.2651  0.9837
v_err    | -0.0102 |  0.0576 | -0.4525 |  0.1001
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.06    0.03   -0.07 |    1.15    0.63    1.89 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04   -0.09 |    0.63    1.89 |   -1.45   -3.12 |    1.51    3.14
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.60
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    0.97    0.99
cs_angles |  0.0017  0.0023 |  0.0751  0.0840 | -0.9940 -0.9964 |  0.9687  0.9940
optical_flow |  0.0000 -0.0000 |  0.0247  0.0229 | -1.1673 -1.1901 |  1.0425  1.0897
v_err    | -0.0103 |  0.0576 | -0.4529 |  0.1038
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.03    0.04    0.22 |    1.09    0.67    1.76 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.05    0.24 |    0.67    1.76 |   -1.46   -3.13 |    1.40    3.12
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.54
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -0.99 |    0.99    0.97
cs_angles |  0.0018  0.0027 |  0.0742  0.0837 | -0.9890 -0.9947 |  0.9943  0.9686
optical_flow | -0.0000  0.0000 |  0.0249  0.0242 | -1.2345 -1.0082 |  1.1504  1.3577
v_err    | -0.0104 |  0.0577 | -0.4518 |  0.1120
landing_rewards |    9.52 |    2.15 |    0.00 |   10.00
landing_margin |   -0

glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.98 |   12.92 |    0.01 |  708.25
norm_af  |    1.77 |    0.95 |    0.11 |    3.38
norm_wf  |    0.02 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.06   -0.00    0.20 |    1.22    0.62    1.91 |   -3.14   -1.57   -3.14 |    3.14    1.51    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00    0.17 |    0.61    1.90 |   -1.43   -3.14 |    1.47    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.03    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_

Update Cnt = 2390    ET =   1013.2   Stats:  Mean, Std, Min, Max
r_f      |  -20.94   -9.55  -11.97 |  180.38  177.06  204.08 | -390.01 -387.07 -392.78 |  391.55  381.77  391.54
v_f      |    0.01    0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.08   -0.10 |    0.10    0.09    0.11
r_i      |  -71.23  -13.54  -50.93 |  666.54  666.74  777.46 |-1342.05-1335.12-1314.66 | 1316.50 1307.65 1309.37
v_i      |    0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.10    0.10    0.09
norm_rf  |    0.19 |    0.07 |    0.03 |    0.46
norm_vf  |    0.08 |    0.01 |    0.04 |    0.11
gs_f     |    1.50 |    4.28 |    0.01 |   70.00
thrust   |   -0.00    0.00   -0.00 |    0.68    0.68    0.68 |   -3.46   -3.40   -3.38 |    3.46    3.40    3.36
norm_thrust |    0.90 |    0.76 |    0.00 |    3.46
fuel     |    1.56 |    0.21 |    1.11 |    2.16
rewards  |  -12.33 |    5.11 |  -28.33 |   -4.57
fuel_rewards |   -4.47 |    0.59 |   -6.17 |   -3.20
glideslope_rewards |

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1387   0.5721   2.6986  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0036   0.0021   0.0079   6.4661   2.1407   2.4885
***** Episode 74409, Mean R = -11.5  Std R = 5.2  Min R = -24.5
PolicyLoss: -0.0278
Policy_Beta: 0.114
Policy_Entropy: 0.166
Policy_KL: 0.000847
Policy_SD: 0.535
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 2.71e+07
VF_0_ExplainedVarNew: 0.957
VF_0_ExplainedVarOld: 0.952
VF_0_Loss : 0.000201


ADV1:  0.0020150678431824763 0.006979442565891118 0.06606278998875359 -0.05295789993374554
ADV2:  -0.007063219053258165 0.8656837571343471 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3750   0.5285   2.2217  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0016   0.0057   6.4661   2.1407   2.4885
Update Cnt = 2400    ET =    989.5   Stats:  Mean, Std, Min, Max
r_f      |   -3.95   21.74    7.13 |  182.24  158.92  201.69 | -375.18 -362

ADV1:  -0.00011586674057417656 0.007101025856626999 0.06384254748788265 -0.05433027644952138
ADV2:  0.021276685081693652 0.7939126274381462 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.4170   1.8752   8.0664  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0005   6.4661   2.1407   2.4885
***** Episode 74688, Mean R = -10.8  Std R = 4.4  Min R = -24.8
PolicyLoss: -0.0239
Policy_Beta: 0.114
Policy_Entropy: 0.171
Policy_KL: 0.00175
Policy_SD: 0.514
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 2.72e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 0.000196


ADV1:  -0.00045721303002611456 0.00899476261707805 0.024812922477533673 -0.07222875943246404
ADV2:  0.025257076520073498 0.8728315374854407 2.700827165452481 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2839   0.6386   3.5937  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0015   6.

***** Episode 74936, Mean R = -11.8  Std R = 3.4  Min R = -19.1
PolicyLoss: -0.0149
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.00128
Policy_SD: 0.523
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 2.73e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 3.54e-05


ADV1:  -0.0014394120305021166 0.007735505338743308 0.04174523078975961 -0.0531230314440156
ADV2:  0.0377803635051728 0.8477268707740466 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3079   0.5706   2.7173  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0037   6.4661   2.1407   2.4885
***** Episode 74967, Mean R = -11.2  Std R = 4.4  Min R = -22.7
PolicyLoss: -0.0295
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.00113
Policy_SD: 0.511
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.73e+07
VF_0_ExplainedVarNew: 0.968
VF_0_ExplainedVarOld: 0.966
VF_0_Loss : 7.51e-05


ADV1:  -0.000915015084598919 0.009875359627718206 0.0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5277   0.8503   4.7137  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0020   6.4661   2.1407   2.4885
***** Episode 75215, Mean R = -12.7  Std R = 4.0  Min R = -20.6
PolicyLoss: -0.0297
Policy_Beta: 0.114
Policy_Entropy: 0.167
Policy_KL: 0.0012
Policy_SD: 0.53
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.74e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 6.03e-05


ADV1:  0.0005520990479246988 0.006558930918086189 0.04339621632321805 -0.0775429208373613
ADV2:  0.020748625974960414 0.8126746087416732 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1185   0.6602   3.5487  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0005   0.0019   6.4661   2.1407   2.4885
***** Episode 75246, Mean R = -11.4  Std R = 4.3  Min R = -22.0
PolicyLoss: -0.0301
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.00082
Pol

ADV1:  0.0007595897864790604 0.008417354181463638 0.035586755936887704 -0.05386389377241529
ADV2:  0.014132897411958735 0.8772906952664374 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0260   1.0347   5.3246  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0006   0.0022   6.4661   2.1407   2.4885
***** Episode 75494, Mean R = -13.0  Std R = 4.8  Min R = -24.2
PolicyLoss: -0.025
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0.00134
Policy_SD: 0.536
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.75e+07
VF_0_ExplainedVarNew: 0.973
VF_0_ExplainedVarOld: 0.97
VF_0_Loss : 0.000327


ADV1:  -0.0034677637608159133 0.008596404024892037 0.0737951642210628 -0.07151274083680535
ADV2:  0.050761322617212445 0.8132399983374404 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3016   1.2006   6.7654  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0041   0.0024   0.0089   6.4661   2.1407   2.4

***** Episode 75742, Mean R = -13.2  Std R = 5.3  Min R = -27.2
PolicyLoss: -0.0272
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.000875
Policy_SD: 0.541
Policy_lr_mult: 0.132
Steps: 1.15e+04
TotalSteps: 2.76e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 8.83e-05


ADV1:  -0.0005483787706338491 0.005097482472362681 0.048909615670928996 -0.050436123860469084
ADV2:  0.005209214793865188 0.9143885558716428 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1937   0.9533   4.8563  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0004   0.0016   6.4661   2.1407   2.4885
***** Episode 75773, Mean R = -11.0  Std R = 4.9  Min R = -25.9
PolicyLoss: 0.000238
Policy_Beta: 0.114
Policy_Entropy: 0.172
Policy_KL: 0.0012
Policy_SD: 0.513
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 2.76e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 4.64e-05


ADV1:  0.00047375272145541085 0.00737931575995

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.7033   0.4272   2.1385  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0007   0.0025   6.4661   2.1407   2.4885
***** Episode 76021, Mean R = -12.2  Std R = 4.7  Min R = -25.1
PolicyLoss: -0.0215
Policy_Beta: 0.114
Policy_Entropy: 0.172
Policy_KL: 0.000963
Policy_SD: 0.521
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 2.77e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 5.27e-05


ADV1:  -0.0006774699725504768 0.008053893968135464 0.04959739369604005 -0.10928500348135228
ADV2:  0.03833324213442454 0.7864598810476525 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.0579   1.1408   5.7311  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0005   0.0022   6.4661   2.1407   2.4885
***** Episode 76052, Mean R = -13.4  Std R = 6.0  Min R = -31.2
PolicyLoss: -0.0377
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.001

cs_angles |  0.0016  0.0022 |  0.0781  0.0792 | -0.9864 -0.9970 |  0.9973  0.9741
optical_flow | -0.0000  0.0000 |  0.0241  0.0230 | -1.1605 -0.9537 |  1.2127  0.9873
v_err    | -0.0099 |  0.0579 | -0.4524 |  0.1072
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.05 |    0.03
tracking_rewards |  -17.47 |    4.23 |  -35.40 |  -10.16
steps    |     377 |      20 |     333 |     415
***** Episode 76300, Mean R = -14.6  Std R = 5.9  Min R = -27.8
PolicyLoss: -0.0274
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.000982
Policy_SD: 0.536
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.78e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 7.99e-05


ADV1:  -0.0016377338552760925 0.0068463774016131514 0.03785350369996088 -0.05119119953975972
ADV2:  0.04018930100232916 0.8305792013360321 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8825   0.5275   2.7258  27.0893  20.3031  12.6669
ValFun  Gradient

w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00   -0.05 |    0.65    1.84 |   -1.52   -3.14 |    1.34    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.49
seeker_angles |    0.00    0.01 |    0.08    0.08 |   -1.00   -0.98 |    0.98    1.00
cs_angles |  0.0019  0.0054 |  0.0784  0.0800 | -0.9999 -0.9789 |  0.9825  0.9961
optical_flow |  0.0000  0.0000 |  0.0230  0.0229 | -1.0175 -1.1011 |  0.9893  1.0848
v_err    | -0.0100 |  0.0578 | -0.4521 |  0.1062
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -17.63 |    4.04 |  -33.59 |  -10.52
steps    |     376 |  

thrust   |    0.00   -0.00   -0.01 |    0.67    0.67    0.66 |   -3.44   -3.42   -3.36 |    3.40    3.40    3.45
norm_thrust |    0.87 |    0.75 |    0.00 |    3.46
fuel     |    1.47 |    0.19 |    0.93 |    2.25
rewards  |  -12.04 |    4.90 |  -28.06 |   -3.75
fuel_rewards |   -4.22 |    0.54 |   -6.43 |   -2.66
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.92 |   12.86 |    0.01 |  205.73
norm_af  |    1.79 |    0.91 |    0.06 |    3.26
norm_wf  |    0.02 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.04   -0.03    0.20 |    1.28    0.67    1.89 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02    0.21 |    0.66

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7071   1.0779   4.9974  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0006   0.0027   6.4661   2.1407   2.4885
Update Cnt = 2490    ET =   1025.1   Stats:  Mean, Std, Min, Max
r_f      |   17.60   -5.93    1.24 |  188.38  171.31  193.48 | -386.19 -382.18 -380.08 |  393.47  355.62  388.18
v_f      |   -0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.09    0.11
r_i      |   34.59  -10.67  -12.83 |  688.54  653.53  764.34 |-1287.17-1259.56-1284.00 | 1278.44 1356.43 1257.14
v_i      |   -0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.08    0.09    0.09
norm_rf  |    0.19 |    0.07 |    0.01 |    0.44
norm_vf  |    0.08 |    0.01 |    0.05 |    0.13
gs_f     |    1.29 |    1.85 |    0.01 |   13.72
thrust   |    0.00   -0.00    0.00 |    0.68    0.68    0.68 |   -3.41   -3.43   -3.45 |    3.38    3.45    3.44
norm_thrust |    

ADV1:  0.000510546502783271 0.005100366547219388 0.0662169599422815 -0.05550887896249623
ADV2:  0.0070208378769110544 0.8774125593545109 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5771   0.9051   4.6235  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0004   0.0014   6.4661   2.1407   2.4885
***** Episode 77509, Mean R = -12.4  Std R = 5.8  Min R = -34.4
PolicyLoss: -0.0166
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.00064
Policy_SD: 0.525
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 2.83e+07
VF_0_ExplainedVarNew: 0.992
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 1.96e-05


ADV1:  -0.0026524472458064165 0.006408913888115319 0.03865932619322332 -0.04696775868019176
ADV2:  0.05071543152218566 0.8585271819390572 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2338   1.4655   7.1743  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0035   0.0021   0.0071   6.4661   2.1407   2.48

***** Episode 77757, Mean R = -10.4  Std R = 4.2  Min R = -23.2
PolicyLoss: -0.00625
Policy_Beta: 0.114
Policy_Entropy: 0.172
Policy_KL: 0.00129
Policy_SD: 0.514
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 2.84e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 3.74e-05


ADV1:  -0.0001608518156196683 0.006418944420862287 0.03177642711983544 -0.0703351922435666
ADV2:  0.02239144806011853 0.8754026128047655 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.7562   1.4107   8.7046  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0005   6.4661   2.1407   2.4885
***** Episode 77788, Mean R = -13.1  Std R = 4.2  Min R = -20.2
PolicyLoss: -0.0249
Policy_Beta: 0.114
Policy_Entropy: 0.171
Policy_KL: 0.000931
Policy_SD: 0.523
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.84e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 5.78e-05


ADV1:  0.0011166615479138505 0.00750292726031150

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4142   0.6920   3.2787  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0008   0.0030   6.4661   2.1407   2.4885
***** Episode 78036, Mean R = -11.5  Std R = 3.9  Min R = -21.6
PolicyLoss: -0.0335
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.000644
Policy_SD: 0.524
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.85e+07
VF_0_ExplainedVarNew: 0.964
VF_0_ExplainedVarOld: 0.961
VF_0_Loss : 8.39e-05


ADV1:  0.00088192281670359 0.0066248632169606135 0.027947449584802032 -0.0459891945488566
ADV2:  0.01636105516559582 0.8348247866175317 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5580   1.3651   7.2102  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0023   6.4661   2.1407   2.4885
***** Episode 78067, Mean R = -11.4  Std R = 3.2  Min R = -19.7
PolicyLoss: -0.0308
Policy_Beta: 0.114
Policy_Entropy: 0.171
Policy_KL: 0.00114

ADV1:  0.0007053197925845437 0.008046081674385058 0.047515618805757054 -0.06611662740469226
ADV2:  0.020491502186683292 0.8280453688344098 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3649   0.8138   4.1639  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0019   6.4661   2.1407   2.4885
***** Episode 78315, Mean R = -12.3  Std R = 5.0  Min R = -24.8
PolicyLoss: -0.032
Policy_Beta: 0.114
Policy_Entropy: 0.172
Policy_KL: 0.000879
Policy_SD: 0.533
Policy_lr_mult: 0.132
Steps: 1.15e+04
TotalSteps: 2.86e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.97
VF_0_Loss : 5.79e-05


ADV1:  0.0024029448700083286 0.005260906171115568 0.039066067493214895 -0.037863731709413845
ADV2:  -0.03480694624734422 0.9200239101698479 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9968   1.3615   7.3003  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0030   0.0019   0.0066   6.4661   2.1407   

***** Episode 78563, Mean R = -11.1  Std R = 4.0  Min R = -20.2
PolicyLoss: -0.00986
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.00118
Policy_SD: 0.533
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.87e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 2.57e-05


ADV1:  -0.0003148949967895413 0.008093203448502492 0.032117528600328626 -0.06795446944829221
ADV2:  0.03135218128246077 0.823286832737881 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3745   0.6242   3.2581  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0012   6.4661   2.1407   2.4885
***** Episode 78594, Mean R = -12.2  Std R = 4.5  Min R = -24.1
PolicyLoss: -0.0334
Policy_Beta: 0.114
Policy_Entropy: 0.171
Policy_KL: 0.000925
Policy_SD: 0.525
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 2.87e+07
VF_0_ExplainedVarNew: 0.972
VF_0_ExplainedVarOld: 0.968
VF_0_Loss : 5.94e-05


Dynamics: Max Disturbance (m/s^2):  [0.00179836 

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4682   1.0691   5.7322  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0008   0.0027   6.4661   2.1407   2.4885
***** Episode 78842, Mean R = -13.0  Std R = 5.2  Min R = -26.8
PolicyLoss: -0.0289
Policy_Beta: 0.114
Policy_Entropy: 0.172
Policy_KL: 0.000825
Policy_SD: 0.528
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 2.88e+07
VF_0_ExplainedVarNew: 0.97
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 6.92e-05


ADV1:  0.004034398622958157 0.005878032746266108 0.04188340435711568 -0.038847967333349775
ADV2:  -0.04916867801090032 0.9456235626104501 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1813   1.3815   7.0378  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0046   0.0029   0.0104   6.4661   2.1407   2.4885
***** Episode 78873, Mean R = -12.3  Std R = 5.0  Min R = -24.6
PolicyLoss: -0.00804
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0.001

ADV1:  -0.00016845898128224051 0.00532024071298277 0.033310067811396574 -0.051585542986450794
ADV2:  0.008367472960391201 0.8976460576358077 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1572   0.8570   4.7098  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0008   6.4661   2.1407   2.4885
***** Episode 79121, Mean R = -13.2  Std R = 5.6  Min R = -26.6
PolicyLoss: -0.00975
Policy_Beta: 0.114
Policy_Entropy: 0.172
Policy_KL: 0.000835
Policy_SD: 0.54
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 2.89e+07
VF_0_ExplainedVarNew: 0.992
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 2.24e-05


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  -0.0016533811930869188 0.00886014486904825 0.05477423599590875 -0.05775079403211644
ADV2:  0.04319547387788389 0.8254667440726198 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5313   0.6084   3.7591  27.0893  20.3031  12.6669
Va

seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    0.99    1.00
cs_angles |  0.0025  0.0036 |  0.0766  0.0834 | -0.9963 -0.9936 |  0.9853  0.9995
optical_flow | -0.0000  0.0000 |  0.0243  0.0239 | -1.1797 -1.1485 |  0.9481  1.1402
v_err    | -0.0107 |  0.0576 | -0.4527 |  0.1072
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.05 |    0.02
tracking_rewards |  -17.51 |    4.41 |  -39.56 |   -9.96
steps    |     377 |      20 |     331 |     418
***** Episode 79400, Mean R = -12.8  Std R = 5.9  Min R = -29.3
PolicyLoss: -0.0276
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.00135
Policy_SD: 0.533
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 2.9e+07
VF_0_ExplainedVarNew: 0.963
VF_0_ExplainedVarOld: 0.957
VF_0_Loss : 9.32e-05


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  0.002543240481057744 0.0048981629444556285 0.03956511120414902 -0.04420905628612337


norm_wf  |    0.02 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.08    0.01   -0.09 |    1.21    0.66    1.85 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02   -0.11 |    0.66    1.84 |   -1.55   -3.14 |    1.42    3.12
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.54
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -1.00   -0.96 |    0.97    0.96
cs_angles |  0.0007  0.0038 |  0.0739  0.0786 | -0.9962 -0.9639 |  0.9733  0.9643
optical

attitude |   -0.05   -0.05   -0.04 |    1.13    0.65    1.88 |   -3.14   -1.54   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.06   -0.07 |    0.65    1.89 |   -1.48   -3.13 |    1.48    3.13
w_f      |    0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.72
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.96   -0.99 |    1.00    0.99
cs_angles |  0.0004  0.0022 |  0.0773  0.0775 | -0.9615 -0.9926 |  0.9950  0.9937
optical_flow |  0.0000  0.0000 |  0.0257  0.0234 | -1.2709 -1.2631 |  1.3477  1.0064
v_err    | -0.0105 |  0.0578 | -0.4528 |  0.1102
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.04   -0.01    0.07 |    1.26    0.66    1.92 |   -3.14   -1.54   -3.14 |    3.14    1.53    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01    0.08 |    0.66    1.90 |   -1.47   -3.14 |    1.44    3.14
w_f      |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.07 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.24 |    0.00 |    1.99
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.96   -0.97 |    1.00    1.00
cs_angles |  0.0019  0.0030 |  0.0698  0.0793 | -0.9577 -0.9688 |  0.9987  0.9963
optical_flow |  0.0000  0.0001 |  0.0230  0.0228 | -1.1765 -1.2229 |  0.9585  1.0340
v_err    | -0.0108 |  0.0578 | -0.4518 |  0.1181
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.04   -0.01    0.10 |    1.16    0.67    1.78 |   -3.14   -1.53   -3.14 |    3.14    1.51    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00    0.15 |    0.66    1.77 |   -1.49   -3.13 |    1.38    3.12
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.43
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.97 |    0.99    0.99
cs_angles |  0.0007  0.0043 |  0.0774  0.0803 | -0.9890 -0.9745 |  0.9906  0.9868
optical_flow | -0.0000  0.0000 |  0.0250  0.0241 | -1.2370 -1.0444 |  1.2081  1.1198
v_err    | -0.0106 |  0.0575 | -0.4528 |  0.1033
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.07    0.10 |    0.64    1.84 |   -1.41   -3.14 |    1.42    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.52
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -1.00 |    1.00    0.98
cs_angles |  0.0025  0.0042 |  0.0735  0.0821 | -0.9931 -0.9983 |  0.9984  0.9822
optical_flow |  0.0001 -0.0000 |  0.0242  0.0247 | -0.9094 -1.0697 |  1.1489  1.1277
v_err    | -0.0106 |  0.0583 | -0.4532 |  0.1166
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.07 |    0.02
tracking_rewards |  -17.27 |    3.84 |  -40.24 |  -10.48
steps    |     377 |  

w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00    0.27 |    0.71    1.84 |   -1.48   -3.12 |    1.51    3.14
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.04    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.50
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    0.98    1.00
cs_angles | -0.0000  0.0042 |  0.0757  0.0794 | -0.9992 -0.9925 |  0.9814  0.9982
optical_flow |  0.0000 -0.0001 |  0.0227  0.0239 | -1.1766 -1.0815 |  0.9116  1.0704
v_err    | -0.0104 |  0.0581 | -0.4534 |  0.1190
landing_rewards |    9.81 |    1.38 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.05 |    0.02
tracking_rewards |  -17.53 |    4.03 |  -32.78 |  -10.28
steps    |     378 |  

attitude |   -0.07    0.04    0.10 |    1.22    0.67    1.90 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04    0.09 |    0.67    1.89 |   -1.42   -3.14 |    1.46    3.14
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.04    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.26 |    0.00 |    1.69
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.95   -1.00 |    1.00    0.99
cs_angles |  0.0031  0.0033 |  0.0747  0.0842 | -0.9463 -0.9987 |  0.9974  0.9922
optical_flow |  0.0000  0.0000 |  0.0223  0.0236 | -1.2551 -1.1009 |  1.1264  1.0573
v_err    | -0.0104 |  0.0580 | -0.4515 |  0.1069
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.12    0.03    0.07 |    1.12    0.62    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.03    0.03 |    0.63    1.82 |   -1.43   -3.14 |    1.52    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.04   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.46
seeker_angles |   -0.00    0.00 |    0.08    0.07 |   -0.99   -1.00 |    0.98    0.99
cs_angles | -0.0007  0.0026 |  0.0795  0.0739 | -0.9885 -0.9985 |  0.9779  0.9895
optical_flow | -0.0001 -0.0000 |  0.0241  0.0235 | -1.0927 -0.8565 |  1.2364  0.9632
v_err    | -0.0101 |  0.0578 | -0.4530 |  0.1194
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.12   -0.01   -0.29 |    1.07    0.64    1.76 |   -3.14   -1.56   -3.14 |    3.14    1.53    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01   -0.30 |    0.64    1.77 |   -1.38   -3.10 |    1.49    3.09
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.54
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.98   -0.99 |    0.97    0.98
cs_angles |  0.0026  0.0023 |  0.0748  0.0809 | -0.9771 -0.9941 |  0.9679  0.9766
optical_flow |  0.0000 -0.0001 |  0.0222  0.0234 | -1.2358 -0.9622 |  1.0031  1.3268
v_err    | -0.0102 |  0.0579 | -0.4503 |  0.1037
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00    0.00    0.00 |    0.67    0.68    0.66 |   -3.35   -3.46   -3.45 |    3.35    3.36    3.46
norm_thrust |    0.89 |    0.76 |    0.00 |    3.46
fuel     |    1.53 |    0.20 |    1.05 |    2.23
rewards  |  -12.23 |    5.26 |  -33.07 |   -3.85
fuel_rewards |   -4.39 |    0.56 |   -6.38 |   -3.01
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.08 |   13.35 |    0.00 |  301.38
norm_af  |    1.81 |    0.89 |    0.05 |    3.34
norm_wf  |    0.02 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.02    0.04    0.13 |    1.17    0.66    1.88 |   -3.14   -1.54   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04    0.16 |    0.66

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1359   0.7986   4.3608  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0014   6.4661   2.1407   2.4885
Update Cnt = 2670    ET =   1150.1   Stats:  Mean, Std, Min, Max
r_f      |   -1.93    0.09   -1.70 |  189.69  170.37  200.34 | -399.20 -390.87 -384.85 |  389.24  369.60  392.86
v_f      |    0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.10   -0.10 |    0.10    0.10    0.10
r_i      |   -5.28    6.97   42.88 |  711.62  662.38  743.28 |-1357.87-1309.89-1352.46 | 1312.04 1318.24 1365.27
v_i      |    0.00   -0.00   -0.00 |    0.05    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.10    0.09    0.09
norm_rf  |    0.19 |    0.07 |    0.04 |    0.41
norm_vf  |    0.08 |    0.01 |    0.03 |    0.12
gs_f     |    1.56 |    3.45 |    0.00 |   30.55
thrust   |   -0.00   -0.00   -0.01 |    0.66    0.68    0.66 |   -3.45   -3.43   -3.39 |    3.46    3.34    3.44
norm_thrust |    

ADV1:  0.0007331320336401372 0.0067881276316358 0.04119922732017289 -0.06396976262972562
ADV2:  0.012396849857988572 0.8390761629547515 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7513   0.8944   3.9897  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0019   6.4661   2.1407   2.4885
***** Episode 83089, Mean R = -12.5  Std R = 4.8  Min R = -26.7
PolicyLoss: -0.0255
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.00102
Policy_SD: 0.537
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 3.04e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 5.78e-05


ADV1:  -0.002570857184623861 0.008416834973569192 0.047562235526944996 -0.06061529760407754
ADV2:  0.04152677558531773 0.848686387738347 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1098   0.5208   2.5601  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0019   0.0066   6.4661   2.1407   2.4885

***** Episode 83337, Mean R = -11.0  Std R = 4.2  Min R = -20.6
PolicyLoss: -0.0334
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.00125
Policy_SD: 0.537
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.05e+07
VF_0_ExplainedVarNew: 0.971
VF_0_ExplainedVarOld: 0.968
VF_0_Loss : 6.53e-05


ADV1:  0.00018464667392611915 0.00822039461815778 0.03989700583796513 -0.059913171469570314
ADV2:  0.024757664761233648 0.8486773333916457 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.9903   1.5427   7.9395  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0012   6.4661   2.1407   2.4885
***** Episode 83368, Mean R = -12.8  Std R = 7.2  Min R = -45.5
PolicyLoss: -0.0306
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.00138
Policy_SD: 0.553
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.05e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.972
VF_0_Loss : 6.74e-05


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7869   1.7231   8.9069  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0033   0.0021   0.0072   6.4661   2.1407   2.4885
***** Episode 83616, Mean R = -12.0  Std R = 6.3  Min R = -30.7
PolicyLoss: -0.0301
Policy_Beta: 0.114
Policy_Entropy: 0.168
Policy_KL: 0.00114
Policy_SD: 0.545
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.06e+07
VF_0_ExplainedVarNew: 0.971
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 7.71e-05


ADV1:  0.0022538098069571897 0.006830196575930147 0.03382471430903966 -0.07321630743180862
ADV2:  0.004965708843719984 0.8250790178885283 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3331   0.5476   2.7117  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0014   0.0058   6.4661   2.1407   2.4885
***** Episode 83647, Mean R = -12.1  Std R = 5.8  Min R = -28.4
PolicyLoss: -0.0329
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.00088

ADV1:  0.0013653715178718916 0.00614979585659664 0.034024144681831014 -0.06074603615141372
ADV2:  0.007522899514877126 0.8066046956811681 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3231   0.6042   2.7076  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0011   0.0043   6.4661   2.1407   2.4885
***** Episode 83895, Mean R = -11.4  Std R = 6.8  Min R = -41.8
PolicyLoss: -0.0322
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.00118
Policy_SD: 0.542
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.07e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 2.81e-05


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  -0.001547954060152872 0.008534497959204928 0.03281963224139417 -0.06201509639145893
ADV2:  0.03847372563346053 0.8549006705739306 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2002   0.9540   4.2439  27.0893  20.3031  12.6669
ValFun 

***** Episode 84143, Mean R = -10.8  Std R = 4.2  Min R = -20.3
PolicyLoss: -0.0291
Policy_Beta: 0.114
Policy_Entropy: 0.172
Policy_KL: 0.000857
Policy_SD: 0.525
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 3.08e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 4.62e-05


ADV1:  -0.000811849534594153 0.007781597336357348 0.06351453258685102 -0.04532947993049215
ADV2:  0.03339632255860167 0.8399352049602421 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3522   1.1168   5.8645  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0005   0.0022   6.4661   2.1407   2.4885
***** Episode 84174, Mean R = -11.5  Std R = 3.9  Min R = -19.7
PolicyLoss: -0.0303
Policy_Beta: 0.114
Policy_Entropy: 0.171
Policy_KL: 0.00118
Policy_SD: 0.527
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.08e+07
VF_0_ExplainedVarNew: 0.972
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 5.71e-05


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.2593   1.8760   9.6292  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0013   0.0046   6.4661   2.1407   2.4885
***** Episode 84422, Mean R = -12.1  Std R = 5.4  Min R = -26.7
PolicyLoss: -0.0246
Policy_Beta: 0.114
Policy_Entropy: 0.172
Policy_KL: 0.00129
Policy_SD: 0.527
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 3.09e+07
VF_0_ExplainedVarNew: 0.972
VF_0_ExplainedVarOld: 0.966
VF_0_Loss : 7.67e-05


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  0.0016395868843022412 0.006595670510917444 0.04153577831310426 -0.046815303615647265
ADV2:  0.00518075746166549 0.8632760828830831 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4836   1.3010   5.2358  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0011   0.0042   6.4661   2.1407   2.4885
***** Episode 84453, Mean R = -12.6  Std R = 4.0 

ADV1:  -0.00013241212198813294 0.007959563398388861 0.042230036330374254 -0.04382059137026469
ADV2:  0.02134955567740828 0.8707268708270816 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9483   0.8005   3.4874  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0004   0.0015   6.4661   2.1407   2.4885
***** Episode 84701, Mean R = -11.2  Std R = 4.9  Min R = -27.9
PolicyLoss: -0.0244
Policy_Beta: 0.114
Policy_Entropy: 0.173
Policy_KL: 0.00112
Policy_SD: 0.524
Policy_lr_mult: 0.132
Steps: 1.15e+04
TotalSteps: 3.1e+07
VF_0_ExplainedVarNew: 0.97
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 6.55e-05


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  0.000543354728667265 0.01024950361772982 0.06782426951002185 -0.07463439465002672
ADV2:  0.020809754724351946 0.8516888327490907 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8933   0.8233   4.3936  27.0893  20.3031  12.6669
ValFun 

seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    1.00    1.00
cs_angles |  0.0037  0.0041 |  0.0758  0.0819 | -0.9866 -0.9965 |  0.9994  0.9972
optical_flow |  0.0000  0.0000 |  0.0241  0.0231 | -1.2726 -0.9569 |  1.0421  1.0599
v_err    | -0.0106 |  0.0579 | -0.4523 |  0.1000
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.07 |    0.02
tracking_rewards |  -17.29 |    4.18 |  -41.73 |  -11.01
steps    |     378 |      20 |     335 |     420
***** Episode 84980, Mean R = -12.5  Std R = 5.3  Min R = -26.2
PolicyLoss: -0.0196
Policy_Beta: 0.114
Policy_Entropy: 0.172
Policy_KL: 0.00109
Policy_SD: 0.53
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.11e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 8.32e-05


ADV1:  0.0010306294562429771 0.006738371386347812 0.06062668026706136 -0.0453761713917388
ADV2:  0.014408126902026551 0.8358854350895853 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max

attitude |    0.01    0.02    0.03 |    1.25    0.64    1.90 |   -3.14   -1.55   -3.14 |    3.14    1.55    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.01 |    0.64    1.89 |   -1.48   -3.14 |    1.51    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.71
seeker_angles |    0.00    0.01 |    0.08    0.08 |   -0.99   -0.99 |    0.99    0.99
cs_angles |  0.0050  0.0057 |  0.0751  0.0810 | -0.9920 -0.9916 |  0.9912  0.9918
optical_flow |  0.0000 -0.0001 |  0.0235  0.0244 | -1.0921 -1.1621 |  0.9410  1.0709
v_err    | -0.0107 |  0.0583 | -0.4520 |  0.1091
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.05   -0.01   -0.09 |    1.22    0.68    1.84 |   -3.14   -1.52   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01   -0.12 |    0.69    1.83 |   -1.52   -3.13 |    1.51    3.11
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.04    0.03    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.25 |    0.00 |    1.51
seeker_angles |    0.00    0.01 |    0.07    0.08 |   -0.98   -0.99 |    0.98    0.99
cs_angles |  0.0021  0.0058 |  0.0745  0.0775 | -0.9768 -0.9897 |  0.9842  0.9903
optical_flow | -0.0001  0.0000 |  0.0215  0.0232 | -1.1218 -1.2740 |  1.0444  1.0721
v_err    | -0.0106 |  0.0584 | -0.4537 |  0.1065
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

rewards  |  -12.04 |    5.56 |  -35.72 |   -3.42
fuel_rewards |   -4.38 |    0.60 |   -6.33 |   -3.08
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.94 |   12.74 |    0.01 |  204.23
norm_af  |    1.72 |    0.93 |    0.02 |    3.31
norm_wf  |    0.02 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.06    0.08   -0.09 |    1.18    0.66    1.83 |   -3.14   -1.57   -3.14 |    3.14    1.53    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.07   -0.11 |    0.66    1.84 |   -1.46   -3.14 |    1.39    3.14
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_pena

Update Cnt = 2780    ET =   1037.3   Stats:  Mean, Std, Min, Max
r_f      |   -1.61   -5.46   13.53 |  180.24  162.23  213.10 | -386.73 -381.96 -384.76 |  392.76  394.69  380.37
v_f      |   -0.00   -0.00   -0.00 |    0.05    0.04    0.05 |   -0.11   -0.09   -0.11 |    0.09    0.09    0.10
r_i      |   -0.71   12.17   48.45 |  705.07  623.87  776.11 |-1381.06-1216.02-1338.75 | 1271.08 1368.37 1293.57
v_i      |   -0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.09    0.10
norm_rf  |    0.18 |    0.07 |    0.01 |    0.39
norm_vf  |    0.08 |    0.01 |    0.04 |    0.12
gs_f     |    1.32 |    1.72 |    0.01 |   14.81
thrust   |   -0.00   -0.00   -0.00 |    0.67    0.68    0.68 |   -3.44   -3.45   -3.44 |    3.46    3.42    3.46
norm_thrust |    0.89 |    0.76 |    0.00 |    3.46
fuel     |    1.53 |    0.18 |    1.11 |    2.16
rewards  |  -12.15 |    4.96 |  -33.75 |   -3.61
fuel_rewards |   -4.39 |    0.53 |   -6.18 |   -3.17
glideslope_rewards |

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7234   0.6480   3.2694  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0015   0.0051   6.4661   2.1407   2.4885
***** Episode 86499, Mean R = -10.7  Std R = 4.1  Min R = -23.2
PolicyLoss: -0.0163
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.00105
Policy_SD: 0.531
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.17e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 2.42e-05


ADV1:  -0.0035108161171035148 0.009745717132677642 0.042303252145732495 -0.07705163252083658
ADV2:  0.04936072115398834 0.8427550636238154 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4120   0.8485   4.5424  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0035   0.0023   0.0089   6.4661   2.1407   2.4885
Update Cnt = 2790    ET =   1079.4   Stats:  Mean, Std, Min, Max
r_f      |    4.20   -2.21   -1.11 |  186.69  176.28  198.27 | -395.37 -387.0

ADV1:  -0.0005874413797334657 0.008103544301907694 0.03609303269550235 -0.06210950645129293
ADV2:  0.030159798643048834 0.8466492595688863 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1166   1.0942   4.6601  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0022   6.4661   2.1407   2.4885
***** Episode 86778, Mean R = -12.9  Std R = 5.1  Min R = -25.4
PolicyLoss: -0.029
Policy_Beta: 0.114
Policy_Entropy: 0.171
Policy_KL: 0.0012
Policy_SD: 0.536
Policy_lr_mult: 0.132
Steps: 1.19e+04
TotalSteps: 3.18e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.97
VF_0_Loss : 6.14e-05


ADV1:  0.0009982663642082656 0.006837050711459397 0.047429595340652164 -0.0544763321388495
ADV2:  0.007711199078146465 0.8379474687175814 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6114   0.5249   2.6017  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0025   6.4661   2.1407   2.48

***** Episode 87026, Mean R = -11.4  Std R = 5.5  Min R = -27.5
PolicyLoss: -0.0341
Policy_Beta: 0.114
Policy_Entropy: 0.173
Policy_KL: 0.00094
Policy_SD: 0.534
Policy_lr_mult: 0.132
Steps: 1.15e+04
TotalSteps: 3.19e+07
VF_0_ExplainedVarNew: 0.973
VF_0_ExplainedVarOld: 0.968
VF_0_Loss : 7.61e-05


ADV1:  0.00037919356729883323 0.00827625811586906 0.03842393021980495 -0.06232772426849909
ADV2:  0.02192234812474014 0.8533341423292305 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2881   0.5368   2.6902  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0010   6.4661   2.1407   2.4885
***** Episode 87057, Mean R = -13.1  Std R = 5.2  Min R = -22.9
PolicyLoss: -0.0291
Policy_Beta: 0.114
Policy_Entropy: 0.172
Policy_KL: 0.00123
Policy_SD: 0.541
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.19e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.971
VF_0_Loss : 7.36e-05


ADV1:  0.00041275695495132333 0.007669573089111498

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.8909   1.9522  10.5284  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0008   0.0033   6.4661   2.1407   2.4885
***** Episode 87305, Mean R = -11.2  Std R = 4.5  Min R = -24.6
PolicyLoss: 0.00794
Policy_Beta: 0.114
Policy_Entropy: 0.173
Policy_KL: 0.000899
Policy_SD: 0.54
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.2e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 3.71e-05


ADV1:  -0.00031333427733166525 0.007794006102144936 0.048447051774451355 -0.08263704622337448
ADV2:  0.03372035209174046 0.7949632711595862 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7582   0.7768   4.6698  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0003   0.0014   6.4661   2.1407   2.4885
***** Episode 87336, Mean R = -13.0  Std R = 6.1  Min R = -31.7
PolicyLoss: -0.0349
Policy_Beta: 0.114
Policy_Entropy: 0.172
Policy_KL: 0.0007

ADV1:  0.00031708196723967836 0.005211328241794951 0.039556227664982235 -0.03460443561160159
ADV2:  -0.005745058178281537 0.9088385586444786 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4387   1.0601   5.6376  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0016   6.4661   2.1407   2.4885
***** Episode 87584, Mean R = -11.8  Std R = 4.4  Min R = -20.8
PolicyLoss: -0.00273
Policy_Beta: 0.114
Policy_Entropy: 0.171
Policy_KL: 0.00147
Policy_SD: 0.544
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.21e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 2.23e-05


ADV1:  -0.00038251928524637627 0.00725166200989139 0.03552595047937243 -0.058822424391342096
ADV2:  0.027486732728567883 0.8458117608389963 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2022   1.1268   5.4092  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0011   6.4661   2.1407

***** Episode 87832, Mean R = -11.5  Std R = 4.5  Min R = -26.1
PolicyLoss: -0.0283
Policy_Beta: 0.114
Policy_Entropy: 0.172
Policy_KL: 0.000925
Policy_SD: 0.536
Policy_lr_mult: 0.132
Steps: 1.15e+04
TotalSteps: 3.22e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 0.000152


ADV1:  -0.0015004747630294234 0.006322541688570326 0.05958753423001323 -0.08924939214698108
ADV2:  0.02146954313042985 0.8340261122918143 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9986   0.9757   4.4762  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0039   6.4661   2.1407   2.4885
***** Episode 87863, Mean R = -13.7  Std R = 5.8  Min R = -27.6
PolicyLoss: -0.00793
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.000906
Policy_SD: 0.559
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 3.22e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.000109


Dynamics: Max Disturbance (m/s^2):  [0.0017983

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8599   1.1120   5.9798  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0009   0.0033   6.4661   2.1407   2.4885
***** Episode 88111, Mean R = -12.9  Std R = 5.5  Min R = -28.3
PolicyLoss: -0.0228
Policy_Beta: 0.114
Policy_Entropy: 0.173
Policy_KL: 0.000927
Policy_SD: 0.531
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.23e+07
VF_0_ExplainedVarNew: 0.968
VF_0_ExplainedVarOld: 0.964
VF_0_Loss : 0.000103


ADV1:  -0.0005517785447024328 0.008142030830202233 0.04230276861497334 -0.060118852075903506
ADV2:  0.030722235474065676 0.840681141940169 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6934   0.9301   4.7028  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0019   6.4661   2.1407   2.4885
***** Episode 88142, Mean R = -11.8  Std R = 5.3  Min R = -25.0
PolicyLoss: -0.0301
Policy_Beta: 0.114
Policy_Entropy: 0.172
Policy_KL: 0.00

v_err    | -0.0104 |  0.0581 | -0.4528 |  0.1027
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.03
tracking_rewards |  -16.66 |    4.09 |  -39.98 |  -10.29
steps    |     378 |      20 |     332 |     416
***** Episode 88390, Mean R = -12.1  Std R = 5.9  Min R = -27.8
PolicyLoss: -0.0316
Policy_Beta: 0.114
Policy_Entropy: 0.171
Policy_KL: 0.00109
Policy_SD: 0.534
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.24e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 4.98e-05


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  0.00021990813593316424 0.007960475562810975 0.04658400052821407 -0.053710386641825314
ADV2:  0.019372368978165706 0.8729413658468307 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5205   1.7861   9.8680  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0021   6.4661   2.1

attitude |   -0.08    0.09    0.03 |    1.22    0.67    1.86 |   -3.14   -1.55   -3.14 |    3.14    1.55    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.09   -0.04 |    0.67    1.85 |   -1.36   -3.14 |    1.47    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.55
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.95 |    1.00    0.97
cs_angles |  0.0011  0.0031 |  0.0773  0.0774 | -0.9898 -0.9507 |  0.9966  0.9693
optical_flow | -0.0001 -0.0001 |  0.0240  0.0228 | -1.0964 -0.9945 |  0.9881  1.0829
v_err    | -0.0105 |  0.0578 | -0.4514 |  0.1015
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00   -0.00   -0.00 |    0.68    0.68    0.68 |   -3.43   -3.41   -3.42 |    3.45    3.45    3.44
norm_thrust |    0.89 |    0.76 |    0.00 |    3.46
fuel     |    1.53 |    0.19 |    1.08 |    2.11
rewards  |  -11.95 |    5.29 |  -34.15 |   -3.34
fuel_rewards |   -4.38 |    0.56 |   -6.05 |   -3.09
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.79 |   12.75 |    0.01 |  212.63
norm_af  |    1.76 |    0.86 |    0.14 |    3.30
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.09    0.00   -0.07 |    1.12    0.65    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.06 |    0.64

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2957   0.6010   2.7355  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0014   6.4661   2.1407   2.4885
Update Cnt = 2880    ET =   1065.5   Stats:  Mean, Std, Min, Max
r_f      |   11.55  -11.73  -29.11 |  179.08  172.20  204.65 | -381.75 -391.70 -393.32 |  385.46  366.64  380.48
v_f      |   -0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.10   -0.11 |    0.10    0.09    0.10
r_i      |   37.46  -11.63  -79.24 |  688.73  659.30  767.15 |-1323.36-1350.06-1296.33 | 1369.61 1306.61 1251.19
v_i      |   -0.00    0.00    0.01 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.09    0.09    0.10
norm_rf  |    0.17 |    0.07 |    0.04 |    0.46
norm_vf  |    0.08 |    0.01 |    0.04 |    0.12
gs_f     |    1.28 |    1.66 |    0.00 |   11.58
thrust   |   -0.00   -0.00    0.00 |    0.66    0.68    0.66 |   -3.38   -3.46   -3.44 |    3.35    3.42    3.43
norm_thrust |    

ADV1:  -0.0012430523808302349 0.007020830594516494 0.03856522167612597 -0.051270776922014816
ADV2:  0.03631672368622978 0.8405648950304994 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.6215   0.3950   2.2486  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0008   0.0032   6.4661   2.1407   2.4885
***** Episode 89599, Mean R = -11.1  Std R = 5.0  Min R = -23.7
PolicyLoss: -0.0266
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.000875
Policy_SD: 0.546
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.29e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 5.15e-05


ADV1:  0.0015892487046523783 0.006541182284889533 0.030813486479824556 -0.06894410746808965
ADV2:  0.006542363233864628 0.8556798713400109 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9204   0.7261   3.3842  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0011   0.0041   6.4661   2.1407   

***** Episode 89847, Mean R = -12.5  Std R = 4.6  Min R = -25.1
PolicyLoss: -0.037
Policy_Beta: 0.114
Policy_Entropy: 0.171
Policy_KL: 0.000799
Policy_SD: 0.551
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.3e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.969
VF_0_Loss : 5.73e-05


ADV1:  0.002793336480984178 0.006991248900195099 0.0418155704020321 -0.048961335761753544
ADV2:  -0.0012782105062113995 0.8497429590662144 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3441   0.8266   3.9968  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0017   0.0072   6.4661   2.1407   2.4885
***** Episode 89878, Mean R = -12.0  Std R = 5.0  Min R = -22.3
PolicyLoss: -0.0302
Policy_Beta: 0.114
Policy_Entropy: 0.172
Policy_KL: 0.000898
Policy_SD: 0.535
Policy_lr_mult: 0.132
Steps: 1.2e+04
TotalSteps: 3.3e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 4.18e-05


ADV1:  -0.0015214381026626839 0.006536491871988126

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.2868   1.4867   7.1424  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0007   0.0025   6.4661   2.1407   2.4885
***** Episode 90126, Mean R = -11.0  Std R = 4.1  Min R = -17.8
PolicyLoss: -0.00666
Policy_Beta: 0.114
Policy_Entropy: 0.172
Policy_KL: 0.00167
Policy_SD: 0.533
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 3.31e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 2.63e-05


ADV1:  -0.0002772430808881606 0.006828607929133752 0.042939398869853596 -0.07717478689304685
ADV2:  0.03125300361168237 0.7995422544580483 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0810   0.5460   2.6564  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0009   6.4661   2.1407   2.4885
***** Episode 90157, Mean R = -11.6  Std R = 4.7  Min R = -26.1
PolicyLoss: -0.0325
Policy_Beta: 0.114
Policy_Entropy: 0.169
Policy_KL: 0.00

ADV1:  0.002261679589733723 0.006480210487787033 0.054906602197715426 -0.06902536242110335
ADV2:  0.0006237176209525065 0.8213173592968274 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0126   0.3024   1.6802  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0015   0.0057   6.4661   2.1407   2.4885
***** Episode 90405, Mean R = -12.1  Std R = 5.2  Min R = -24.4
PolicyLoss: -0.0283
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.000936
Policy_SD: 0.55
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.32e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 3.97e-05


ADV1:  -6.428725964794892e-05 0.00497524702251797 0.044966074587489746 -0.04202656115493364
ADV2:  -0.006383552979883215 0.8864948780220714 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4916   0.7632   3.8243  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0024   6.4661   2.1407   

***** Episode 90653, Mean R = -12.4  Std R = 5.5  Min R = -35.1
PolicyLoss: -0.0276
Policy_Beta: 0.114
Policy_Entropy: 0.17
Policy_KL: 0.00145
Policy_SD: 0.548
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.33e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.968
VF_0_Loss : 7.96e-05


ADV1:  0.002070708150612747 0.005138063916315061 0.03991013280886177 -0.0346468417416152
ADV2:  -0.02302095851474416 0.9205830250114043 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9933   1.0813   5.9287  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0013   0.0053   6.4661   2.1407   2.4885
***** Episode 90684, Mean R = -10.6  Std R = 4.1  Min R = -24.0
PolicyLoss: -0.0082
Policy_Beta: 0.114
Policy_Entropy: 0.173
Policy_KL: 0.00079
Policy_SD: 0.527
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.33e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 3.54e-05


ADV1:  -0.0008501968401224651 0.007778825016923933 0.

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1445   0.5857   3.4047  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0017   0.0062   6.4661   2.1407   2.4885
***** Episode 90932, Mean R = -11.4  Std R = 4.8  Min R = -22.4
PolicyLoss: -0.0226
Policy_Beta: 0.114
Policy_Entropy: 0.174
Policy_KL: 0.000659
Policy_SD: 0.524
Policy_lr_mult: 0.132
Steps: 1.19e+04
TotalSteps: 3.34e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.969
VF_0_Loss : 6e-05


ADV1:  0.0016634704955320197 0.008363361635122997 0.03578124412278588 -0.05779837680942451
ADV2:  0.013409456414454218 0.8582727227813786 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6012   0.6597   3.8231  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0010   0.0043   6.4661   2.1407   2.4885
***** Episode 90963, Mean R = -12.2  Std R = 3.9  Min R = -21.4
PolicyLoss: -0.0294
Policy_Beta: 0.114
Policy_Entropy: 0.173
Policy_KL: 0.0011
P

ADV1:  0.0013193425482000086 0.00544391589243759 0.038823712146674516 -0.05781464318847518
ADV2:  -0.019489320658675473 0.8929119243823533 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5202   0.7180   4.1357  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0034   6.4661   2.1407   2.4885
***** Episode 91211, Mean R = -11.1  Std R = 4.7  Min R = -20.9
PolicyLoss: -0.00293
Policy_Beta: 0.114
Policy_Entropy: 0.173
Policy_KL: 0.000968
Policy_SD: 0.542
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 3.35e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.000153


ADV1:  -0.001039952629205216 0.006838494694577543 0.03244060440590785 -0.07499085230626826
ADV2:  0.04076162003219286 0.7872053636161308 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3498   0.6417   3.0314  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0007   0.0026   6.4661   2.1407   

seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -1.00 |    0.99    1.00
cs_angles |  0.0045  0.0018 |  0.0778  0.0798 | -0.9962 -0.9969 |  0.9948  0.9958
optical_flow |  0.0001  0.0000 |  0.0238  0.0228 | -0.9954 -1.0447 |  1.1902  1.1037
v_err    | -0.0100 |  0.0576 | -0.4516 |  0.1098
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.07 |    0.03
tracking_rewards |  -16.95 |    4.39 |  -38.97 |   -9.51
steps    |     377 |      20 |     331 |     415
***** Episode 91490, Mean R = -10.4  Std R = 3.7  Min R = -25.1
PolicyLoss: -0.00142
Policy_Beta: 0.114
Policy_Entropy: 0.171
Policy_KL: 0.00141
Policy_SD: 0.542
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.36e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 4.24e-05


ADV1:  0.0008571721087468894 0.005521156559534077 0.029849668211221647 -0.049291939974565546
ADV2:  -0.0022022341819417346 0.9025997708386221 3.0 -3.0
Policy  Gradients: u/sd/Max/C 

attitude |    0.11    0.02    0.09 |    1.21    0.63    1.85 |   -3.14   -1.47   -3.14 |    3.14    1.55    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.15 |    0.63    1.84 |   -1.31   -3.14 |    1.44    3.14
w_f      |   -0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.65
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -1.00 |    0.99    0.96
cs_angles |  0.0030  0.0017 |  0.0725  0.0775 | -0.9926 -0.9999 |  0.9865  0.9627
optical_flow | -0.0001  0.0001 |  0.0243  0.0217 | -1.1771 -0.9644 |  1.0854  0.8631
v_err    | -0.0100 |  0.0575 | -0.4527 |  0.0994
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

w        |   -0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02   -0.04 |    0.62    1.88 |   -1.52   -3.13 |    1.31    3.13
w_f      |   -0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.26 |    0.00 |    1.50
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    1.00    0.96
cs_angles |  0.0009  0.0026 |  0.0758  0.0809 | -0.9946 -0.9928 |  0.9951  0.9596
optical_flow |  0.0000  0.0001 |  0.0246  0.0236 | -1.4155 -1.2379 |  1.0912  1.0813
v_err    | -0.0099 |  0.0577 | -0.4516 |  0.1032
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.05 |    0.02
tracking_rewards |  -16.79 |    4.19 |  -34.13 |   -9.87
steps    |     379 |  

attitude |    0.03   -0.02   -0.14 |    1.18    0.64    1.87 |   -3.14   -1.55   -3.14 |    3.14    1.55    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02   -0.10 |    0.65    1.87 |   -1.50   -3.12 |    1.45    3.14
w_f      |   -0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.26 |    0.00 |    1.61
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    1.00    0.99
cs_angles |  0.0033  0.0029 |  0.0774  0.0819 | -0.9881 -0.9935 |  0.9992  0.9924
optical_flow |  0.0000 -0.0000 |  0.0234  0.0227 | -1.1068 -1.3799 |  1.2576  0.9800
v_err    | -0.0102 |  0.0579 | -0.4517 |  0.1046
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00    0.00   -0.00 |    0.67    0.67    0.67 |   -3.45   -3.42   -3.37 |    3.36    3.42    3.45
norm_thrust |    0.88 |    0.76 |    0.00 |    3.46
fuel     |    1.51 |    0.18 |    1.14 |    2.16
rewards  |  -11.24 |    4.80 |  -30.13 |   -3.92
fuel_rewards |   -4.33 |    0.52 |   -6.19 |   -3.26
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.00 |   12.32 |    0.01 |  133.61
norm_af  |    1.83 |    0.94 |    0.14 |    3.29
norm_wf  |    0.02 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.05    0.02    0.23 |    1.26    0.64    1.95 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01    0.31 |    0.64

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0234   0.9387   3.8636  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0007   0.0024   6.4661   2.1407   2.4885
Update Cnt = 3000    ET =   1063.5   Stats:  Mean, Std, Min, Max
r_f      |  -11.26   17.93    3.90 |  178.67  172.64  200.41 | -389.10 -352.21 -379.58 |  390.88  391.53  396.51
v_f      |    0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.10 |    0.10    0.10    0.12
r_i      |  -69.09   23.38   25.90 |  685.77  658.61  751.49 |-1284.48-1327.02-1292.25 | 1329.24 1303.64 1379.58
v_i      |    0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.10    0.10
norm_rf  |    0.18 |    0.07 |    0.04 |    0.40
norm_vf  |    0.08 |    0.01 |    0.04 |    0.12
gs_f     |    1.57 |    4.61 |    0.01 |   70.88
thrust   |   -0.01    0.00    0.00 |    0.67    0.69    0.66 |   -3.38   -3.43   -3.39 |    3.46    3.34    3.37
norm_thrust |    

ADV1:  -4.762225594804374e-05 0.00558966274126366 0.08572508482125707 -0.037030209205864584
ADV2:  -0.008537152375431064 0.8483240195325294 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5329   0.6944   3.9153  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0007   0.0026   6.4661   2.1407   2.4885
***** Episode 93319, Mean R = -10.7  Std R = 4.2  Min R = -22.6
PolicyLoss: 0.00717
Policy_Beta: 0.114
Policy_Entropy: 0.174
Policy_KL: 0.000979
Policy_SD: 0.528
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 3.43e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 2.79e-05


ADV1:  -0.0036893686870970318 0.009567244465369542 0.02957721705084939 -0.07138514666220466
ADV2:  0.05482428315261564 0.8685211922842587 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1350   1.1585   5.8715  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0042   0.0025   0.0095   6.4661   2.1407   

***** Episode 93567, Mean R = -11.4  Std R = 4.2  Min R = -24.7
PolicyLoss: -0.0392
Policy_Beta: 0.114
Policy_Entropy: 0.173
Policy_KL: 0.00125
Policy_SD: 0.522
Policy_lr_mult: 0.132
Steps: 1.19e+04
TotalSteps: 3.44e+07
VF_0_ExplainedVarNew: 0.973
VF_0_ExplainedVarOld: 0.97
VF_0_Loss : 5.89e-05


ADV1:  0.0007358942677697776 0.006514590085995488 0.03458044967248258 -0.05690300019946909
ADV2:  0.021308199180576026 0.7989270944243028 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0506   0.4045   2.2045  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0006   0.0026   6.4661   2.1407   2.4885
***** Episode 93598, Mean R = -10.3  Std R = 3.9  Min R = -21.3
PolicyLoss: -0.0331
Policy_Beta: 0.114
Policy_Entropy: 0.176
Policy_KL: 0.00103
Policy_SD: 0.509
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.44e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 5.48e-05


ADV1:  0.00126387451086875 0.006852707306961399 0.

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9872   0.8763   4.2114  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0008   0.0032   6.4661   2.1407   2.4885
***** Episode 93846, Mean R = -10.6  Std R = 3.2  Min R = -16.7
PolicyLoss: -0.0212
Policy_Beta: 0.114
Policy_Entropy: 0.177
Policy_KL: 0.00102
Policy_SD: 0.505
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.45e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 8.01e-05


ADV1:  0.0008837099234907465 0.005888654356628953 0.02625408122936889 -0.04105261380500448
ADV2:  0.008748222465632569 0.8695201812802617 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2366   1.3080   6.5764  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0024   6.4661   2.1407   2.4885
***** Episode 93877, Mean R = -11.3  Std R = 4.8  Min R = -27.0
PolicyLoss: -0.0245
Policy_Beta: 0.114
Policy_Entropy: 0.177
Policy_KL: 0.0013

ADV1:  0.0024541674185861377 0.005502115453058544 0.07871939785298704 -0.04161194161936754
ADV2:  -0.030819634178454926 0.8670570936397752 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7676   0.8278   4.2943  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0017   0.0065   6.4661   2.1407   2.4885
***** Episode 94125, Mean R = -11.2  Std R = 4.7  Min R = -24.7
PolicyLoss: -0.0104
Policy_Beta: 0.114
Policy_Entropy: 0.175
Policy_KL: 0.0012
Policy_SD: 0.529
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 3.46e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.000141


ADV1:  -0.004459133362444151 0.009636462437811882 0.04793104731813963 -0.06322868505437691
ADV2:  0.053024397518577286 0.8816897431896883 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8229   1.1733   5.7442  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0048   0.0030   0.0115   6.4661   2.1407   2.

***** Episode 94373, Mean R = -12.1  Std R = 5.5  Min R = -27.1
PolicyLoss: -0.0254
Policy_Beta: 0.114
Policy_Entropy: 0.178
Policy_KL: 0.00127
Policy_SD: 0.523
Policy_lr_mult: 0.132
Steps: 1.14e+04
TotalSteps: 3.47e+07
VF_0_ExplainedVarNew: 0.968
VF_0_ExplainedVarOld: 0.963
VF_0_Loss : 0.00024


ADV1:  0.0009343120463121983 0.006680608239412396 0.03609443821113992 -0.06073382663817162
ADV2:  0.014452119089691537 0.8533541403636233 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0660   1.0843   5.3085  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0024   6.4661   2.1407   2.4885
***** Episode 94404, Mean R = -11.4  Std R = 4.3  Min R = -27.1
PolicyLoss: -0.0277
Policy_Beta: 0.114
Policy_Entropy: 0.176
Policy_KL: 0.00138
Policy_SD: 0.517
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 3.47e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 0.000176


ADV1:  -0.0025467440446099287 0.007936310220919401

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0298   0.9031   4.8466  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0003   0.0012   6.4661   2.1407   2.4885
***** Episode 94652, Mean R = -11.8  Std R = 4.6  Min R = -22.5
PolicyLoss: -0.0261
Policy_Beta: 0.114
Policy_Entropy: 0.179
Policy_KL: 0.0011
Policy_SD: 0.518
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.48e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.000153


ADV1:  -0.0011331210612955675 0.007960505907641814 0.03562949789202752 -0.05309080528485238
ADV2:  0.033181725308720565 0.8604228366902333 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0660   0.5561   2.6697  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0009   0.0030   6.4661   2.1407   2.4885
***** Episode 94683, Mean R = -13.2  Std R = 4.6  Min R = -26.0
PolicyLoss: -0.0291
Policy_Beta: 0.114
Policy_Entropy: 0.177
Policy_KL: 0.0009

ADV1:  0.0017831075179924353 0.008009681216893421 0.039509128481939326 -0.04809231272265842
ADV2:  0.0062191980989721755 0.872165858631394 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3210   1.4012   6.7447  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0013   0.0046   6.4661   2.1407   2.4885
***** Episode 94931, Mean R = -11.1  Std R = 3.9  Min R = -21.4
PolicyLoss: -0.0253
Policy_Beta: 0.114
Policy_Entropy: 0.179
Policy_KL: 0.00107
Policy_SD: 0.512
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.49e+07
VF_0_ExplainedVarNew: 0.97
VF_0_ExplainedVarOld: 0.966
VF_0_Loss : 0.000274


ADV1:  -0.001060180419849267 0.007036660627205135 0.041736931233113395 -0.05230557314257134
ADV2:  0.01869169048667409 0.8784300950264029 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3057   0.6457   2.9673  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0008   0.0028   6.4661   2.1407   2.

cs_angles |  0.0029  0.0064 |  0.0780  0.0798 | -0.9956 -0.9970 |  0.9764  0.9614
optical_flow | -0.0001 -0.0001 |  0.0220  0.0234 | -1.1839 -1.2905 |  1.0221  0.8915
v_err    | -0.0103 |  0.0580 | -0.4522 |  0.1035
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -17.33 |    4.47 |  -39.26 |  -10.00
steps    |     377 |      21 |     333 |     417
***** Episode 95210, Mean R = -10.7  Std R = 4.5  Min R = -28.0
PolicyLoss: -0.0126
Policy_Beta: 0.114
Policy_Entropy: 0.178
Policy_KL: 0.00177
Policy_SD: 0.518
Policy_lr_mult: 0.132
Steps: 1.19e+04
TotalSteps: 3.5e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.000175


ADV1:  -0.0004783594610033205 0.004983200857405176 0.03938036079544799 -0.038156948949163993
ADV2:  0.003715898758190406 0.9168713302702338 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0425   1.1377   6.2583  27.0893  20.3031  12.6669
ValFun  Gradients

attitude |    0.01   -0.03   -0.10 |    1.07    0.64    1.78 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04   -0.11 |    0.64    1.77 |   -1.51   -3.14 |    1.35    3.12
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.04    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.73
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.97   -0.98 |    1.00    0.98
cs_angles |  0.0005  0.0037 |  0.0759  0.0792 | -0.9697 -0.9787 |  0.9979  0.9794
optical_flow |  0.0000  0.0000 |  0.0224  0.0238 | -1.3428 -1.0500 |  0.8820  1.0100
v_err    | -0.0103 |  0.0578 | -0.4518 |  0.1040
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00   -0.01   -0.00 |    0.67    0.68    0.67 |   -3.39   -3.45   -3.42 |    3.31    3.45    3.46
norm_thrust |    0.88 |    0.76 |    0.00 |    3.46
fuel     |    1.50 |    0.19 |    1.05 |    2.00
rewards  |  -11.69 |    4.95 |  -28.11 |   -2.55
fuel_rewards |   -4.29 |    0.53 |   -5.73 |   -3.01
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.89 |   12.62 |    0.00 |  150.80
norm_af  |    1.75 |    0.90 |    0.07 |    3.28
norm_wf  |    0.02 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.05    0.04    0.15 |    1.13    0.65    1.85 |   -3.14   -1.48   -3.14 |    3.14    1.56    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04    0.21 |    0.65

ADV1:  -0.00017841319029192289 0.006566175010174333 0.04325039447930129 -0.06747597587626408
ADV2:  0.02590195524975919 0.824078587757367 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7767   0.9600   5.0705  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0009   6.4661   2.1407   2.4885
Update Cnt = 3100    ET =    996.7   Stats:  Mean, Std, Min, Max
r_f      |   22.99   16.57    6.95 |  176.87  167.46  207.38 | -390.45 -383.68 -386.21 |  398.55  389.76  389.67
v_f      |   -0.01   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.10   -0.09 |    0.09    0.10    0.11
r_i      |   58.41   64.25   30.73 |  669.17  646.16  782.50 |-1323.62-1219.26-1334.55 | 1367.29 1272.09 1272.90
v_i      |   -0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.10    0.08    0.09
norm_rf  |    0.17 |    0.07 |    0.02 |    0.46
norm_vf  |    0.08 |    0.01 |    0.05 |    0.12
gs_f     |    1.57 |    3.48 |  

***** Episode 96388, Mean R = -10.7  Std R = 5.2  Min R = -25.6
PolicyLoss: -0.0202
Policy_Beta: 0.114
Policy_Entropy: 0.177
Policy_KL: 0.00111
Policy_SD: 0.513
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.54e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 6.83e-05


ADV1:  5.161725003293902e-05 0.006129416089013699 0.04457164739002606 -0.0412220840981824
ADV2:  0.003751821423863448 0.9035033528350511 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1852   1.2014   5.9044  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0005   6.4661   2.1407   2.4885
***** Episode 96419, Mean R = -10.6  Std R = 5.8  Min R = -28.2
PolicyLoss: -0.00842
Policy_Beta: 0.114
Policy_Entropy: 0.176
Policy_KL: 0.00133
Policy_SD: 0.52
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.54e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 6.33e-05


ADV1:  0.001409148810632626 0.005056358195256923 0.

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5906   0.8286   3.9338  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0017   0.0074   6.4661   2.1407   2.4885
***** Episode 96667, Mean R = -11.6  Std R = 5.2  Min R = -28.9
PolicyLoss: -0.00187
Policy_Beta: 0.114
Policy_Entropy: 0.175
Policy_KL: 0.000888
Policy_SD: 0.54
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.55e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 3.36e-05


ADV1:  0.0003827507269196502 0.006796971895478782 0.0742305776564895 -0.05694623510247626
ADV2:  0.01968667683097801 0.8263226852589795 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4165   1.0894   5.6088  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0005   0.0019   6.4661   2.1407   2.4885
***** Episode 96698, Mean R = -12.0  Std R = 4.5  Min R = -26.6
PolicyLoss: -0.0273
Policy_Beta: 0.114
Policy_Entropy: 0.174
Policy_KL: 0.00083


ADV1:  -0.0010042186605138334 0.007975242299847892 0.03700678699399601 -0.06471580400081646
ADV2:  0.035929790626880086 0.8263802296216844 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9262   0.8945   4.3707  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0007   0.0026   6.4661   2.1407   2.4885
***** Episode 96946, Mean R = -12.3  Std R = 5.9  Min R = -27.0
PolicyLoss: -0.0308
Policy_Beta: 0.114
Policy_Entropy: 0.174
Policy_KL: 0.00106
Policy_SD: 0.541
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.56e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.971
VF_0_Loss : 5.86e-05


ADV1:  0.0015119742180862083 0.006574483938349096 0.030736473416317297 -0.04908881399819359
ADV2:  0.006362348606369894 0.8474366170490034 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3455   1.2696   6.9597  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0011   0.0043   6.4661   2.1407   

***** Episode 97194, Mean R = -10.8  Std R = 4.7  Min R = -22.9
PolicyLoss: -0.0419
Policy_Beta: 0.114
Policy_Entropy: 0.175
Policy_KL: 0.000922
Policy_SD: 0.522
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.57e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.972
VF_0_Loss : 5.02e-05


ADV1:  0.0004371963238970562 0.006566306545093576 0.04445566651976196 -0.051598732749115084
ADV2:  0.007665511437871408 0.8748057196749146 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6504   0.8325   3.4499  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0011   6.4661   2.1407   2.4885
***** Episode 97225, Mean R = -11.8  Std R = 4.6  Min R = -21.4
PolicyLoss: -0.0155
Policy_Beta: 0.114
Policy_Entropy: 0.176
Policy_KL: 0.000868
Policy_SD: 0.525
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.57e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 3.73e-05


ADV1:  -0.0007281699175260527 0.00781645121253

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2986   0.4737   2.2575  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0018   6.4661   2.1407   2.4885
***** Episode 97473, Mean R = -10.2  Std R = 4.0  Min R = -18.9
PolicyLoss: -0.011
Policy_Beta: 0.114
Policy_Entropy: 0.176
Policy_KL: 0.00117
Policy_SD: 0.528
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 3.58e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 1.83e-05


ADV1:  -0.0021548456561834134 0.007189287258501676 0.05518050735787772 -0.07313870559996632
ADV2:  0.05482558231570184 0.7871645544338491 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4433   1.1090   5.3699  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0014   0.0055   6.4661   2.1407   2.4885
***** Episode 97504, Mean R = -10.9  Std R = 4.9  Min R = -25.3
PolicyLoss: -0.0391
Policy_Beta: 0.114
Policy_Entropy: 0.176
Policy_KL: 0.00124

ADV1:  0.0028173727828547366 0.00632146436624202 0.03606849328793729 -0.04335264872470317
ADV2:  -0.01469860968420437 0.8841113503994722 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7323   0.6729   3.5337  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0036   0.0021   0.0073   6.4661   2.1407   2.4885
***** Episode 97752, Mean R = -10.9  Std R = 4.8  Min R = -25.9
PolicyLoss: -0.0214
Policy_Beta: 0.114
Policy_Entropy: 0.178
Policy_KL: 0.00137
Policy_SD: 0.516
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.59e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 8.18e-05


ADV1:  -0.0026902244591229378 0.0066801703501427655 0.03216057409842813 -0.055594802716779856
ADV2:  0.05201625221880173 0.8244915630776097 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6668   1.2084   6.6429  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0036   0.0021   0.0074   6.4661   2.1407   2.

***** Episode 98000, Mean R = -10.7  Std R = 3.8  Min R = -20.2
PolicyLoss: -0.0339
Policy_Beta: 0.114
Policy_Entropy: 0.178
Policy_KL: 0.00128
Policy_SD: 0.505
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.6e+07
VF_0_ExplainedVarNew: 0.972
VF_0_ExplainedVarOld: 0.968
VF_0_Loss : 4.91e-05


ADV1:  0.0009134229993120519 0.00473361575413931 0.03923416701401561 -0.060958356416442094
ADV2:  -0.013058644380421473 0.8780884154066897 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9990   0.8998   4.2133  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0024   6.4661   2.1407   2.4885
***** Episode 98031, Mean R = -10.1  Std R = 3.6  Min R = -22.6
PolicyLoss: -0.00498
Policy_Beta: 0.114
Policy_Entropy: 0.177
Policy_KL: 0.000934
Policy_SD: 0.521
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.6e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 2.16e-05


ADV1:  0.00021619613668661256 0.00521451587733426

cs_angles |  0.0040  0.0026 |  0.0734  0.0804 | -0.9979 -0.9986 |  0.9839  0.9853
optical_flow |  0.0000 -0.0000 |  0.0231  0.0222 | -1.1798 -0.9878 |  0.9677  1.1149
v_err    | -0.0103 |  0.0577 | -0.4530 |  0.1080
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.05 |    0.02
tracking_rewards |  -16.71 |    4.22 |  -44.17 |   -9.94
steps    |     376 |      20 |     339 |     417
***** Episode 98310, Mean R = -11.3  Std R = 3.5  Min R = -20.0
PolicyLoss: -0.0337
Policy_Beta: 0.114
Policy_Entropy: 0.176
Policy_KL: 0.000931
Policy_SD: 0.522
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.61e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 7.98e-05


ADV1:  0.0001770396744248435 0.004936744864120225 0.052137974428569045 -0.05488495161864482
ADV2:  -0.003983382127188839 0.8670494956013363 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1484   1.1478   6.2014  27.0893  20.3031  12.6669
ValFun  Gradien

w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00    0.17 |    0.61    1.88 |   -1.46   -3.14 |    1.43    3.14
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.24 |    0.00 |    1.48
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -1.00   -1.00 |    1.00    0.92
cs_angles |  0.0021  0.0039 |  0.0712  0.0780 | -0.9993 -0.9978 |  0.9985  0.9217
optical_flow | -0.0001 -0.0001 |  0.0220  0.0221 | -1.1715 -0.9726 |  1.0415  0.9781
v_err    | -0.0105 |  0.0575 | -0.4530 |  0.0971
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -16.45 |    3.76 |  -33.50 |   -9.52
steps    |     378 |  

w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.06    0.03 |    0.66    1.85 |   -1.41   -3.14 |    1.51    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.61
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    0.99    0.94
cs_angles |  0.0018  0.0043 |  0.0765  0.0769 | -0.9985 -0.9882 |  0.9937  0.9428
optical_flow |  0.0001  0.0000 |  0.0227  0.0222 | -0.9399 -0.8935 |  0.9829  1.0390
v_err    | -0.0100 |  0.0573 | -0.4519 |  0.1068
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -16.55 |    3.88 |  -35.71 |  -10.08
steps    |     376 |  

attitude |    0.08   -0.04    0.01 |    1.20    0.66    1.88 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.05    0.03 |    0.65    1.88 |   -1.47   -3.13 |    1.50    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.05 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.62
seeker_angles |    0.00    0.01 |    0.07    0.08 |   -0.96   -1.00 |    0.99    0.99
cs_angles |  0.0028  0.0058 |  0.0749  0.0795 | -0.9649 -0.9995 |  0.9911  0.9887
optical_flow | -0.0000  0.0000 |  0.0215  0.0219 | -0.9139 -1.0050 |  1.0051  0.9330
v_err    | -0.0098 |  0.0577 | -0.4520 |  0.1002
landing_rewards |    9.81 |    1.38 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.02   -0.02    0.07 |    1.19    0.67    1.87 |   -3.14   -1.54   -3.14 |    3.14    1.56    3.14
w        |   -0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02   -0.00 |    0.66    1.88 |   -1.44   -3.14 |    1.50    3.10
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.52
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.97   -0.99 |    0.98    1.00
cs_angles |  0.0015  0.0019 |  0.0727  0.0797 | -0.9720 -0.9932 |  0.9794  0.9991
optical_flow | -0.0000 -0.0001 |  0.0239  0.0218 | -1.2464 -1.2242 |  1.1831  0.9501
v_err    | -0.0097 |  0.0573 | -0.4534 |  0.1044
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00   -0.08 |    0.68    1.83 |   -1.46   -3.14 |    1.55    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.73
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.97 |    0.97    0.94
cs_angles |  0.0012  0.0048 |  0.0755  0.0802 | -0.9995 -0.9733 |  0.9721  0.9388
optical_flow |  0.0001 -0.0000 |  0.0222  0.0216 | -1.1372 -1.0453 |  0.7794  1.0362
v_err    | -0.0103 |  0.0581 | -0.4526 |  0.1055
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -16.96 |    4.25 |  -45.30 |   -9.19
steps    |     376 |  

attitude |    0.02    0.02   -0.32 |    1.17    0.69    1.82 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02   -0.31 |    0.69    1.82 |   -1.47   -3.11 |    1.43    3.13
w_f      |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.03    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.46
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.98   -0.99 |    1.00    0.99
cs_angles |  0.0034  0.0034 |  0.0745  0.0801 | -0.9781 -0.9924 |  0.9967  0.9927
optical_flow |  0.0000 -0.0001 |  0.0229  0.0225 | -1.0476 -1.1646 |  1.0913  1.2801
v_err    | -0.0101 |  0.0578 | -0.4525 |  0.1098
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.05    0.03   -0.01 |    1.12    0.64    1.86 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02   -0.03 |    0.65    1.86 |   -1.41   -3.14 |    1.53    3.11
w_f      |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.67
seeker_angles |    0.01    0.00 |    0.08    0.08 |   -0.99   -0.99 |    1.00    1.00
cs_angles |  0.0052  0.0042 |  0.0752  0.0808 | -0.9940 -0.9879 |  0.9952  0.9951
optical_flow |  0.0000 -0.0000 |  0.0223  0.0229 | -1.0262 -1.0139 |  1.0385  1.0838
v_err    | -0.0102 |  0.0577 | -0.4522 |  0.1005
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.02    0.01    0.01 |    1.17    0.67    1.89 |   -3.14   -1.54   -3.14 |    3.14    1.54    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.00 |    0.67    1.89 |   -1.48   -3.13 |    1.46    3.13
w_f      |   -0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.24 |    0.00 |    1.60
seeker_angles |    0.00    0.01 |    0.07    0.08 |   -1.00   -0.99 |    1.00    0.98
cs_angles |  0.0030  0.0053 |  0.0714  0.0759 | -0.9996 -0.9867 |  0.9969  0.9759
optical_flow | -0.0000 -0.0001 |  0.0228  0.0224 | -1.1908 -1.0283 |  1.3323  1.0459
v_err    | -0.0103 |  0.0576 | -0.4519 |  0.0995
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.04    0.01    0.08 |    1.27    0.67    1.87 |   -3.14   -1.57   -3.14 |    3.14    1.50    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01    0.05 |    0.67    1.88 |   -1.43   -3.14 |    1.50    3.14
w_f      |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.02 |    0.03    0.02    0.03
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.24 |    0.00 |    1.47
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.91   -0.99 |    0.96    0.98
cs_angles |  0.0019  0.0005 |  0.0740  0.0756 | -0.9143 -0.9942 |  0.9629  0.9803
optical_flow |  0.0000 -0.0000 |  0.0224  0.0226 | -0.9193 -1.1626 |  1.0848  0.8380
v_err    | -0.0106 |  0.0577 | -0.4821 |  0.1045
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.04    0.01    0.03 |    1.17    0.66    1.83 |   -3.14   -1.56   -3.14 |    3.14    1.48    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.08 |    0.66    1.85 |   -1.41   -3.14 |    1.43    3.12
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.52
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -0.99 |    0.95    0.97
cs_angles |  0.0022  0.0026 |  0.0779  0.0771 | -0.9844 -0.9913 |  0.9547  0.9663
optical_flow |  0.0001 -0.0001 |  0.0237  0.0226 | -1.2349 -1.2034 |  1.0883  0.9368
v_err    | -0.0103 |  0.0578 | -0.4529 |  0.1078
landing_rewards |    9.29 |    2.57 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.08    0.02    0.13 |    1.19    0.67    1.88 |   -3.14   -1.57   -3.14 |    3.14    1.54    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.13 |    0.67    1.88 |   -1.46   -3.14 |    1.45    3.14
w_f      |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.52
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    0.98    1.00
cs_angles |  0.0034  0.0030 |  0.0767  0.0792 | -0.9854 -0.9951 |  0.9843  0.9979
optical_flow |  0.0000 -0.0000 |  0.0225  0.0223 | -1.0244 -1.2543 |  0.9647  1.2334
v_err    | -0.0105 |  0.0584 | -0.4524 |  0.1095
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00    0.00    0.00 |    0.66    0.67    0.66 |   -3.45   -3.30   -3.41 |    3.46    3.42    3.41
norm_thrust |    0.87 |    0.75 |    0.00 |    3.46
fuel     |    1.48 |    0.18 |    1.07 |    2.32
rewards  |  -11.12 |    5.10 |  -35.79 |   -3.26
fuel_rewards |   -4.25 |    0.51 |   -6.67 |   -3.08
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.85 |   12.71 |    0.01 |  661.97
norm_af  |    1.79 |    0.90 |    0.11 |    3.20
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.09   -0.02   -0.03 |    1.22    0.66    1.89 |   -3.14   -1.56   -3.14 |    3.14    1.54    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04   -0.09 |    0.65

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4882   0.7647   4.0812  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0010   0.0035   6.4661   2.1407   2.4885
Update Cnt = 3300    ET =    972.2   Stats:  Mean, Std, Min, Max
r_f      |   13.85   -3.29  -13.12 |  191.09  166.99  201.15 | -381.91 -389.83 -395.60 |  376.34  381.28  372.26
v_f      |   -0.00    0.00    0.00 |    0.05    0.04    0.05 |   -0.09   -0.09   -0.12 |    0.09    0.10    0.11
r_i      |   39.98   -3.79  -34.82 |  689.31  655.80  763.83 |-1241.21-1283.06-1263.65 | 1306.14 1259.41 1284.71
v_i      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.10    0.09    0.09
norm_rf  |    0.17 |    0.07 |    0.03 |    0.43
norm_vf  |    0.08 |    0.01 |    0.05 |    0.12
gs_f     |    1.21 |    1.98 |    0.01 |   27.84
thrust   |    0.00    0.00    0.00 |    0.67    0.67    0.67 |   -3.43   -3.43   -3.41 |    3.21    3.44    3.45
norm_thrust |    

ADV1:  -0.0019522684804184848 0.006037419421622166 0.0444525257694679 -0.0443772888635553
ADV2:  0.02827127536356211 0.8843564004695696 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6792   1.1788   6.4377  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0012   0.0049   6.4661   2.1407   2.4885
***** Episode 102619, Mean R = -12.2  Std R = 4.9  Min R = -27.4
PolicyLoss: -0.0113
Policy_Beta: 0.114
Policy_Entropy: 0.176
Policy_KL: 0.000964
Policy_SD: 0.536
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.78e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 3.76e-05


ADV1:  -0.00020511228424293387 0.004840994739361525 0.0367175366370448 -0.03471979331774336
ADV2:  0.00413944840792616 0.9014645832807207 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8420   0.8970   3.7161  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0010   6.4661   2.1407   2.

***** Episode 102867, Mean R = -12.1  Std R = 6.5  Min R = -27.0
PolicyLoss: -0.0334
Policy_Beta: 0.114
Policy_Entropy: 0.174
Policy_KL: 0.00121
Policy_SD: 0.532
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 3.79e+07
VF_0_ExplainedVarNew: 0.968
VF_0_ExplainedVarOld: 0.965
VF_0_Loss : 9.8e-05


ADV1:  0.001339574923571688 0.008703220341928405 0.035635800749225954 -0.05823899655843839
ADV2:  0.01556339462066249 0.8565744299429673 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.6004   0.2020   1.1466  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0010   0.0034   6.4661   2.1407   2.4885
***** Episode 102898, Mean R = -11.6  Std R = 5.0  Min R = -23.7
PolicyLoss: -0.0298
Policy_Beta: 0.114
Policy_Entropy: 0.175
Policy_KL: 0.000978
Policy_SD: 0.528
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.79e+07
VF_0_ExplainedVarNew: 0.968
VF_0_ExplainedVarOld: 0.964
VF_0_Loss : 7.45e-05


ADV1:  -3.683156445530331e-05 0.0061475392143307

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8645   1.0270   4.6407  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0013   0.0048   6.4661   2.1407   2.4885
***** Episode 103146, Mean R = -14.1  Std R = 5.7  Min R = -25.8
PolicyLoss: -0.0272
Policy_Beta: 0.114
Policy_Entropy: 0.177
Policy_KL: 0.000963
Policy_SD: 0.546
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 3.8e+07
VF_0_ExplainedVarNew: 0.969
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 0.000148


ADV1:  0.0005543193639148079 0.007192927838681055 0.031018052860108253 -0.07424898312656575
ADV2:  0.016954923366686258 0.8608683500099813 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4606   0.6923   3.4559  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0015   6.4661   2.1407   2.4885
***** Episode 103177, Mean R = -12.6  Std R = 5.8  Min R = -30.7
PolicyLoss: -0.0255
Policy_Beta: 0.114
Policy_Entropy: 0.177
Policy_KL: 0.0

ADV1:  0.00016183942180643442 0.006454563300991361 0.05628914019930581 -0.07297849784672367
ADV2:  0.026487150940907166 0.7948218706109896 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9712   1.0866   5.9070  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0011   6.4661   2.1407   2.4885
***** Episode 103425, Mean R = -11.5  Std R = 5.4  Min R = -24.2
PolicyLoss: -0.0332
Policy_Beta: 0.114
Policy_Entropy: 0.176
Policy_KL: 0.00104
Policy_SD: 0.539
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 3.81e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.000531


ADV1:  -0.00023864633059179533 0.006906219451478962 0.03995159030292439 -0.051112988644971345
ADV2:  0.028179504359517087 0.8284860895485356 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6244   1.2667   5.6817  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0007   6.4661   2.1407

***** Episode 103673, Mean R = -11.7  Std R = 3.8  Min R = -19.5
PolicyLoss: -0.00804
Policy_Beta: 0.114
Policy_Entropy: 0.175
Policy_KL: 0.000857
Policy_SD: 0.541
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.82e+07
VF_0_ExplainedVarNew: 0.992
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 6.62e-05


ADV1:  -0.0011289022140284677 0.0074368114087535134 0.039699799508145506 -0.05876782088648391
ADV2:  0.03895728991103944 0.827783456672352 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3144   0.6586   3.5286  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0008   0.0029   6.4661   2.1407   2.4885
***** Episode 103704, Mean R = -11.8  Std R = 5.5  Min R = -24.2
PolicyLoss: -0.0334
Policy_Beta: 0.114
Policy_Entropy: 0.178
Policy_KL: 0.00111
Policy_SD: 0.53
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.82e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 7.58e-05


ADV1:  0.001581811094370886 0.005151881293449

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.6943   2.1162   9.3115  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0014   6.4661   2.1407   2.4885
***** Episode 103952, Mean R = -11.0  Std R = 5.3  Min R = -26.9
PolicyLoss: -0.028
Policy_Beta: 0.114
Policy_Entropy: 0.177
Policy_KL: 0.00163
Policy_SD: 0.529
Policy_lr_mult: 0.132
Steps: 1.15e+04
TotalSteps: 3.83e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 5.95e-05


ADV1:  -0.0011395827356957852 0.009238211327487774 0.03670751504034048 -0.04714764423589695
ADV2:  0.02528683307875849 0.9022388449488067 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.7366   1.9986   8.8904  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0008   0.0029   6.4661   2.1407   2.4885
***** Episode 103983, Mean R = -12.5  Std R = 4.5  Min R = -22.0
PolicyLoss: -0.0203
Policy_Beta: 0.114
Policy_Entropy: 0.178
Policy_KL: 0.001

ADV1:  -0.000696061016295196 0.007827188591656943 0.04785579528414502 -0.056690800102326536
ADV2:  0.03726061629982602 0.8183805021471523 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2238   0.4378   2.3522  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0019   6.4661   2.1407   2.4885
***** Episode 104231, Mean R = -13.0  Std R = 9.0  Min R = -50.3
PolicyLoss: -0.0355
Policy_Beta: 0.114
Policy_Entropy: 0.178
Policy_KL: 0.0011
Policy_SD: 0.546
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 3.84e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 5.46e-05


ADV1:  -0.0013920444250450253 0.009400560077016236 0.03360184140133354 -0.09095144981342529
ADV2:  0.03778817523429988 0.8407810360213293 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7136   1.3302   5.7922  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0010   0.0035   6.4661   2.1407   2.

theta_cv |    0.23 |    0.25 |    0.00 |    1.79
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -1.00   -0.99 |    1.00    0.99
cs_angles |  0.0023  0.0018 |  0.0742  0.0810 | -0.9973 -0.9926 |  0.9979  0.9891
optical_flow |  0.0001 -0.0000 |  0.0217  0.0244 | -0.9954 -1.0655 |  1.0389  1.2478
v_err    | -0.0101 |  0.0580 | -0.4526 |  0.1066
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -16.65 |    4.50 |  -54.37 |   -9.51
steps    |     376 |      20 |     337 |     414
***** Episode 104510, Mean R = -11.2  Std R = 3.4  Min R = -19.8
PolicyLoss: -0.0144
Policy_Beta: 0.114
Policy_Entropy: 0.178
Policy_KL: 0.000922
Policy_SD: 0.533
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.85e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 2.52e-05


ADV1:  -0.003576268578834928 0.008027935641224504 0.030297220483633758 -0.06174054464477646
ADV2:  0.06325398108004653 0.8302818968

attitude |   -0.07    0.01    0.17 |    1.19    0.67    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01    0.18 |    0.68    1.86 |   -1.42   -3.12 |    1.50    3.12
w_f      |   -0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.57
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -0.95 |    0.99    0.99
cs_angles |  0.0029  0.0027 |  0.0740  0.0761 | -0.9891 -0.9485 |  0.9867  0.9853
optical_flow | -0.0001  0.0000 |  0.0225  0.0242 | -1.2731 -1.1157 |  1.2113  1.2407
v_err    | -0.0099 |  0.0576 | -0.4517 |  0.1009
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.06    0.01 |    0.64    1.87 |   -1.51   -3.14 |    1.44    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.51
seeker_angles |    0.00   -0.00 |    0.07    0.08 |   -1.00   -0.97 |    0.98    0.99
cs_angles |  0.0030 -0.0002 |  0.0733  0.0755 | -0.9988 -0.9652 |  0.9833  0.9922
optical_flow | -0.0001 -0.0000 |  0.0209  0.0229 | -0.9942 -0.9905 |  1.2018  1.3020
v_err    | -0.0101 |  0.0572 | -0.4530 |  0.0924
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.05 |    0.01
tracking_rewards |  -16.19 |    4.12 |  -33.29 |   -8.45
steps    |     379 |  

attitude |   -0.05    0.00    0.07 |    1.25    0.68    1.88 |   -3.14   -1.56   -3.14 |    3.14    1.50    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02    0.05 |    0.69    1.89 |   -1.47   -3.11 |    1.47    3.11
w_f      |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.39
seeker_angles |    0.00   -0.00 |    0.07    0.08 |   -0.99   -0.98 |    0.99    1.00
cs_angles |  0.0034 -0.0003 |  0.0749  0.0792 | -0.9946 -0.9810 |  0.9930  0.9981
optical_flow |  0.0000 -0.0000 |  0.0225  0.0226 | -1.0771 -1.1454 |  1.0264  0.7978
v_err    | -0.0105 |  0.0577 | -0.4530 |  0.0936
landing_rewards |    9.87 |    1.13 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.06   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.00    0.00 |    0.65    1.86 |   -1.53   -3.14 |    1.46    3.12
w_f      |   -0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.03    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.05 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.62
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.98   -0.96 |    0.98    1.00
cs_angles |  0.0007  0.0027 |  0.0750  0.0786 | -0.9794 -0.9602 |  0.9806  0.9984
optical_flow |  0.0000 -0.0000 |  0.0221  0.0218 | -1.1596 -1.0693 |  1.2082  1.1158
v_err    | -0.0099 |  0.0575 | -0.4516 |  0.1025
landing_rewards |    9.84 |    1.26 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -16.63 |    4.20 |  -37.35 |   -9.53
steps    |     378 |  

attitude |    0.01   -0.03   -0.11 |    1.21    0.69    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03   -0.11 |    0.69    1.82 |   -1.53   -3.14 |    1.42    3.12
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.26 |    0.00 |    1.56
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -1.00 |    0.94    1.00
cs_angles |  0.0028  0.0030 |  0.0734  0.0797 | -0.9918 -0.9977 |  0.9410  0.9985
optical_flow |  0.0000 -0.0000 |  0.0208  0.0221 | -0.8992 -0.9806 |  0.9943  1.0351
v_err    | -0.0099 |  0.0576 | -0.4529 |  0.1145
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.08   -0.04    0.10 |    1.21    0.67    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.53    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.04    0.16 |    0.68    1.84 |   -1.55   -3.12 |    1.34    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.04   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.56
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.96   -0.97 |    1.00    1.00
cs_angles |  0.0048  0.0008 |  0.0764  0.0751 | -0.9587 -0.9668 |  1.0000  0.9957
optical_flow | -0.0001 -0.0000 |  0.0227  0.0242 | -1.1608 -1.2952 |  1.3004  1.1046
v_err    | -0.0100 |  0.0575 | -0.4517 |  0.1037
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.10   -0.03   -0.02 |    1.28    0.68    1.88 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02   -0.03 |    0.67    1.89 |   -1.46   -3.13 |    1.48    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.04 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.65
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.98   -0.99 |    1.00    0.98
cs_angles |  0.0029  0.0019 |  0.0738  0.0773 | -0.9823 -0.9875 |  0.9994  0.9798
optical_flow | -0.0001 -0.0000 |  0.0214  0.0223 | -1.1785 -1.0021 |  1.1115  1.1501
v_err    | -0.0101 |  0.0578 | -0.4529 |  0.1063
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00    0.01   -0.00 |    0.67    0.68    0.66 |   -3.46   -3.45   -3.44 |    3.40    3.46    3.35
norm_thrust |    0.88 |    0.75 |    0.00 |    3.46
fuel     |    1.51 |    0.17 |    1.00 |    1.95
rewards  |  -11.48 |    4.55 |  -29.61 |   -3.27
fuel_rewards |   -4.32 |    0.48 |   -5.58 |   -2.88
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.98 |   13.10 |    0.00 |  216.10
norm_af  |    1.76 |    0.91 |    0.08 |    3.34
norm_wf  |    0.02 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.02   -0.08    0.00 |    1.18    0.64    1.85 |   -3.14   -1.52   -3.14 |    3.14    1.53    3.14
w        |   -0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.08   -0.02 |    0.65

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6946   0.7606   4.3353  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0010   0.0034   6.4661   2.1407   2.4885
Update Cnt = 3460    ET =   1110.4   Stats:  Mean, Std, Min, Max
r_f      |  -15.23  -18.58    6.96 |  186.28  176.51  198.70 | -388.99 -704.35 -378.75 |  394.27  357.72  393.15
v_f      |    0.01    0.00   -0.00 |    0.05    0.06    0.05 |   -0.09   -0.09   -0.26 |    0.36    0.66    0.10
r_i      |  -90.95  -17.28   61.42 |  655.49  679.44  769.10 |-1370.85-1376.24-1353.58 | 1348.46 1352.60 1323.46
v_i      |    0.01    0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.10   -0.09 |    0.10    0.09    0.10
norm_rf  |    1.66 |   26.12 |    0.03 |  460.79
norm_vf  |    0.08 |    0.04 |    0.04 |    0.80
gs_f     |    1.55 |    3.73 |    0.01 |   42.58
thrust   |    0.00    0.00   -0.00 |    0.67    0.67    0.68 |   -3.31   -3.44   -3.39 |    3.42    3.33    3.45
norm_thrust |    

ADV1:  -0.0012862599952428093 0.007140031228497737 0.032893935537848806 -0.07436751849806189
ADV2:  0.034826012984970164 0.8478043443227935 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2988   0.4128   2.0105  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0034   6.4661   2.1407   2.4885
***** Episode 107579, Mean R = -12.0  Std R = 5.9  Min R = -28.3
PolicyLoss: -0.026
Policy_Beta: 0.114
Policy_Entropy: 0.178
Policy_KL: 0.00103
Policy_SD: 0.537
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 3.96e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 8.63e-05


ADV1:  -0.0008705999102831475 0.007674375084688186 0.044815904721700495 -0.05372457791916131
ADV2:  0.03279345999284244 0.8435168699226766 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5311   0.6830   2.8339  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0022   6.4661   2.1407  

***** Episode 107827, Mean R = -11.0  Std R = 4.3  Min R = -23.3
PolicyLoss: -0.00883
Policy_Beta: 0.114
Policy_Entropy: 0.18
Policy_KL: 0.000956
Policy_SD: 0.531
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.97e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 9.69e-05


ADV1:  0.0014806973481139374 0.005215461576755941 0.04928517117855913 -0.055784425525771564
ADV2:  -0.015754167767014424 0.8690875836388889 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0156   1.6034   8.0861  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0012   0.0046   6.4661   2.1407   2.4885
***** Episode 107858, Mean R = -10.1  Std R = 3.6  Min R = -18.4
PolicyLoss: -0.00985
Policy_Beta: 0.114
Policy_Entropy: 0.178
Policy_KL: 0.000892
Policy_SD: 0.531
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 3.97e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 8.16e-05


ADV1:  -0.0006408016620104316 0.005030977792

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0461   0.6368   3.5482  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0014   6.4661   2.1407   2.4885
***** Episode 108106, Mean R = -10.9  Std R = 6.0  Min R = -34.5
PolicyLoss: -0.0357
Policy_Beta: 0.114
Policy_Entropy: 0.177
Policy_KL: 0.00095
Policy_SD: 0.532
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 3.98e+07
VF_0_ExplainedVarNew: 0.969
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 0.000122


ADV1:  1.0860897821997758e-05 0.00645114854524187 0.08163974508178201 -0.049790622764208425
ADV2:  0.019415822512898837 0.797144775772431 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2477   1.2820   6.7695  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0004   6.4661   2.1407   2.4885
***** Episode 108137, Mean R = -10.8  Std R = 5.0  Min R = -23.8
PolicyLoss: -0.0239
Policy_Beta: 0.114
Policy_Entropy: 0.177
Policy_KL: 0.00

ADV1:  -2.9650298514198904e-05 0.00508084873569056 0.03213294912933118 -0.04744123549182705
ADV2:  0.008405859418314975 0.8926416103168776 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1704   0.8562   4.5166  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0012   6.4661   2.1407   2.4885
***** Episode 108385, Mean R = -11.0  Std R = 5.2  Min R = -24.1
PolicyLoss: -0.0124
Policy_Beta: 0.114
Policy_Entropy: 0.176
Policy_KL: 0.00118
Policy_SD: 0.547
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 3.99e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 4.1e-05


ADV1:  -0.0018164099486608124 0.0051442308720409955 0.04734994751366989 -0.04532211817277454
ADV2:  0.028642318311910893 0.8883787810322062 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3445   0.5442   2.6640  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0013   0.0047   6.4661   2.1407  

***** Episode 108633, Mean R = -11.6  Std R = 5.3  Min R = -24.6
PolicyLoss: -0.0104
Policy_Beta: 0.114
Policy_Entropy: 0.177
Policy_KL: 0.00124
Policy_SD: 0.545
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 4e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 3.78e-05


ADV1:  -0.0018523153979963806 0.0071553211215223044 0.0612309838737371 -0.061157632756853375
ADV2:  0.006227756920574544 0.8631938057748479 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7392   1.6094   8.9583  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0011   0.0049   6.4661   2.1407   2.4885
***** Episode 108664, Mean R = -10.7  Std R = 4.5  Min R = -24.6
PolicyLoss: 0.0108
Policy_Beta: 0.114
Policy_Entropy: 0.179
Policy_KL: 0.000906
Policy_SD: 0.528
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 4e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 6.67e-05


ADV1:  -0.00019509415316002762 0.006911132486062181

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6837   0.9748   5.2158  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0012   0.0044   6.4661   2.1407   2.4885
***** Episode 108912, Mean R = -11.7  Std R = 5.0  Min R = -23.3
PolicyLoss: -0.0283
Policy_Beta: 0.114
Policy_Entropy: 0.178
Policy_KL: 0.00134
Policy_SD: 0.53
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 4.01e+07
VF_0_ExplainedVarNew: 0.967
VF_0_ExplainedVarOld: 0.965
VF_0_Loss : 7.47e-05


ADV1:  0.002326939504541815 0.007372717925505469 0.03884733134936613 -0.057748199785010654
ADV2:  0.0019053960528367866 0.8612623779243928 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7526   0.9068   4.6775  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0016   0.0059   6.4661   2.1407   2.4885
***** Episode 108943, Mean R = -11.1  Std R = 4.7  Min R = -25.1
PolicyLoss: -0.0253
Policy_Beta: 0.114
Policy_Entropy: 0.178
Policy_KL: 0.00

ADV1:  0.00042341721472462327 0.006470194183271849 0.041570862012929866 -0.052255640520116574
ADV2:  0.018873077631593786 0.8123374162595095 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8075   0.8769   3.8253  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0013   6.4661   2.1407   2.4885
***** Episode 109191, Mean R = -10.5  Std R = 5.4  Min R = -25.5
PolicyLoss: -0.0282
Policy_Beta: 0.114
Policy_Entropy: 0.176
Policy_KL: 0.000871
Policy_SD: 0.541
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 4.02e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 5.72e-05


ADV1:  2.090422794557649e-05 0.005280002303142754 0.03464647650605207 -0.05669355468998527
ADV2:  0.015581600817984159 0.8626866087759754 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0950   1.4459   7.5266  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0007   6.4661   2.1407 

cs_angles |  0.0037  0.0033 |  0.0766  0.0805 | -0.9899 -0.9987 |  0.9904  0.9945
optical_flow |  0.0000  0.0000 |  0.0227  0.0226 | -1.1993 -1.0732 |  1.1102  1.1519
v_err    | -0.0103 |  0.0576 | -0.4523 |  0.0948
landing_rewards |    9.81 |    1.38 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.05 |    0.01
tracking_rewards |  -16.56 |    4.22 |  -33.26 |   -9.61
steps    |     377 |      20 |     333 |     418
***** Episode 109470, Mean R = -10.9  Std R = 4.9  Min R = -22.1
PolicyLoss: -0.00588
Policy_Beta: 0.114
Policy_Entropy: 0.178
Policy_KL: 0.00115
Policy_SD: 0.531
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 4.04e+07
VF_0_ExplainedVarNew: 0.992
VF_0_ExplainedVarOld: 0.99
VF_0_Loss : 4.81e-05


ADV1:  -0.00108986501740202 0.00665015640174159 0.04320303420930044 -0.055586662332399915
ADV2:  0.03464784146898582 0.8120026197380739 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8455   0.9914   5.1683  27.0893  20.3031  12.6669
ValFun  Gradients: 

attitude |    0.06   -0.05   -0.10 |    1.17    0.65    1.83 |   -3.14   -1.56   -3.14 |    3.14    1.54    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.05   -0.13 |    0.65    1.84 |   -1.51   -3.12 |    1.50    3.13
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.24 |    0.00 |    1.52
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -0.98 |    0.94    0.96
cs_angles |  0.0029  0.0039 |  0.0701  0.0776 | -0.9913 -0.9835 |  0.9361  0.9569
optical_flow | -0.0000 -0.0001 |  0.0214  0.0224 | -1.0246 -1.1957 |  1.1177  1.1124
v_err    | -0.0101 |  0.0576 | -0.4526 |  0.1106
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.03   -0.01    0.09 |    1.15    0.68    1.82 |   -3.14   -1.55   -3.14 |    3.14    1.55    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00    0.09 |    0.67    1.82 |   -1.44   -3.13 |    1.38    3.14
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.26 |    0.00 |    1.74
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    0.99    0.99
cs_angles |  0.0021  0.0028 |  0.0768  0.0793 | -0.9943 -0.9989 |  0.9894  0.9905
optical_flow | -0.0001 -0.0000 |  0.0218  0.0234 | -1.3409 -1.2976 |  1.0742  1.0388
v_err    | -0.0102 |  0.0572 | -0.4532 |  0.0951
landing_rewards |    9.87 |    1.13 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.01   -0.02   -0.21 |    1.18    0.70    1.81 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02   -0.24 |    0.69    1.81 |   -1.47   -3.12 |    1.50    3.13
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.52
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    1.00    0.96
cs_angles |  0.0026  0.0043 |  0.0773  0.0767 | -0.9887 -0.9914 |  0.9960  0.9577
optical_flow | -0.0000 -0.0002 |  0.0225  0.0246 | -1.1523 -1.3683 |  1.1744  1.1560
v_err    | -0.0099 |  0.0576 | -0.4529 |  0.0946
landing_rewards |    9.87 |    1.13 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.05    0.06 |    0.66    1.80 |   -1.54   -3.14 |    1.35    3.13
w_f      |   -0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.00 |    0.00 |   -0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.26 |    0.00 |    1.61
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.91   -0.95 |    0.98    0.99
cs_angles |  0.0042  0.0016 |  0.0738  0.0816 | -0.9128 -0.9546 |  0.9830  0.9885
optical_flow |  0.0001  0.0000 |  0.0209  0.0215 | -1.0039 -1.2782 |  1.1787  0.9871
v_err    | -0.0099 |  0.0577 | -0.4517 |  0.0972
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.05 |    0.02
tracking_rewards |  -16.62 |    4.11 |  -31.39 |  -10.04
steps    |     377 |  

attitude |    0.09   -0.02   -0.12 |    1.15    0.63    1.80 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02    0.00 |    0.64    1.82 |   -1.50   -3.14 |    1.56    3.13
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.04    0.02
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.49
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    0.99    0.98
cs_angles | -0.0002  0.0024 |  0.0755  0.0777 | -0.9886 -0.9991 |  0.9850  0.9838
optical_flow |  0.0001 -0.0000 |  0.0211  0.0219 | -1.1619 -0.9664 |  1.0346  1.0349
v_err    | -0.0099 |  0.0579 | -0.4530 |  0.1039
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.03   -0.01    0.09 |    1.10    0.65    1.74 |   -3.14   -1.50   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.00    0.06 |    0.66    1.74 |   -1.38   -3.14 |    1.44    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.04    0.03    0.02
w_rewards |    0.00 |    0.00 |    0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.53
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -1.00 |    0.99    0.98
cs_angles |  0.0038  0.0039 |  0.0748  0.0801 | -0.9931 -0.9952 |  0.9892  0.9807
optical_flow | -0.0000 -0.0002 |  0.0227  0.0232 | -1.0119 -1.1155 |  1.0446  1.0141
v_err    | -0.0098 |  0.0582 | -0.4522 |  0.1037
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00   -0.00    0.00 |    0.68    0.68    0.68 |   -3.45   -3.39   -3.45 |    3.44    3.17    3.45
norm_thrust |    0.90 |    0.76 |    0.00 |    3.46
fuel     |    1.54 |    0.19 |    1.06 |    2.24
rewards  |  -10.97 |    4.65 |  -32.19 |   -2.71
fuel_rewards |   -4.42 |    0.55 |   -6.42 |   -3.05
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.95 |   12.76 |    0.00 |  388.94
norm_af  |    1.72 |    0.91 |    0.07 |    3.38
norm_wf  |    0.01 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.06   -0.03    0.04 |    1.11    0.64    1.83 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.02   -0.02 |    0.65

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5344   0.9905   5.3615  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0011   0.0041   6.4661   2.1407   2.4885
Update Cnt = 3610    ET =   1077.5   Stats:  Mean, Std, Min, Max
r_f      |   -7.05   16.59    5.93 |  186.90  169.97  198.29 | -394.95 -373.47 -381.55 |  391.38  390.55  388.74
v_f      |   -0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.11   -0.09   -0.12 |    0.11    0.09    0.10
r_i      |   26.25   35.77   17.00 |  678.69  671.90  754.52 |-1298.20-1325.91-1314.16 | 1277.78 1271.34 1353.33
v_i      |   -0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.08    0.10    0.10
norm_rf  |    0.16 |    0.06 |    0.02 |    0.38
norm_vf  |    0.08 |    0.01 |    0.04 |    0.13
gs_f     |    1.50 |    2.79 |    0.02 |   31.31
thrust   |    0.00   -0.01    0.01 |    0.68    0.68    0.67 |   -3.41   -3.43   -3.46 |    3.42    3.43    3.40
norm_thrust |    

ADV1:  -0.00046486824715944087 0.008372735254092092 0.05911293455538491 -0.06890983272612464
ADV2:  0.032983372741929896 0.8075742966710467 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0792   0.9786   5.3375  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0023   6.4661   2.1407   2.4885
***** Episode 112229, Mean R = -12.2  Std R = 5.3  Min R = -25.3
PolicyLoss: -0.0333
Policy_Beta: 0.114
Policy_Entropy: 0.179
Policy_KL: 0.00115
Policy_SD: 0.544
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 4.14e+07
VF_0_ExplainedVarNew: 0.973
VF_0_ExplainedVarOld: 0.97
VF_0_Loss : 6.69e-05


ADV1:  0.002801962184269635 0.0046875118598883785 0.031095539691159177 -0.031082725994899085
ADV2:  -0.03069963407771468 0.9268584422035686 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5013   1.1360   6.0081  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0032   0.0019   0.0072   6.4661   2.1407 

***** Episode 112477, Mean R = -13.2  Std R = 5.1  Min R = -31.5
PolicyLoss: -0.0249
Policy_Beta: 0.114
Policy_Entropy: 0.179
Policy_KL: 0.00117
Policy_SD: 0.544
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 4.15e+07
VF_0_ExplainedVarNew: 0.969
VF_0_ExplainedVarOld: 0.966
VF_0_Loss : 7.37e-05


ADV1:  0.0033555929755138447 0.006250615785872139 0.04923390411966849 -0.04100033061692038
ADV2:  -0.017126061012453446 0.8436649571246305 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.0841   1.4765   6.5508  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0023   0.0086   6.4661   2.1407   2.4885
***** Episode 112508, Mean R = -11.6  Std R = 4.8  Min R = -24.0
PolicyLoss: -0.0249
Policy_Beta: 0.114
Policy_Entropy: 0.178
Policy_KL: 0.00114
Policy_SD: 0.546
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 4.15e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 3.39e-05


ADV1:  -0.0011169797766524677 0.00677116228007

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2129   1.0491   5.7612  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0006   6.4661   2.1407   2.4885
***** Episode 112756, Mean R = -11.1  Std R = 3.5  Min R = -19.7
PolicyLoss: -0.0352
Policy_Beta: 0.114
Policy_Entropy: 0.179
Policy_KL: 0.0011
Policy_SD: 0.532
Policy_lr_mult: 0.132
Steps: 1.19e+04
TotalSteps: 4.16e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 4.19e-05


ADV1:  -0.00032371283807448745 0.006572886659818733 0.04927148692031913 -0.057183083221203856
ADV2:  0.025775751813429285 0.835555448767137 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9458   1.0890   5.3674  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0010   6.4661   2.1407   2.4885
***** Episode 112787, Mean R = -11.3  Std R = 4.1  Min R = -23.4
PolicyLoss: -0.027
Policy_Beta: 0.114
Policy_Entropy: 0.177
Policy_KL: 0.00

ADV1:  -0.000867285034746652 0.008655955156641679 0.0583735134403493 -0.05201260431491358
ADV2:  0.032665188947280675 0.8449771082806258 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0924   0.4954   2.4106  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0006   0.0025   6.4661   2.1407   2.4885
***** Episode 113035, Mean R = -12.2  Std R = 5.4  Min R = -29.4
PolicyLoss: -0.0286
Policy_Beta: 0.114
Policy_Entropy: 0.177
Policy_KL: 0.000912
Policy_SD: 0.558
Policy_lr_mult: 0.132
Steps: 1.16e+04
TotalSteps: 4.17e+07
VF_0_ExplainedVarNew: 0.973
VF_0_ExplainedVarOld: 0.969
VF_0_Loss : 0.000149


ADV1:  -0.0016345572019067585 0.008016674811912877 0.04166095027621358 -0.05151902454084269
ADV2:  0.0352235376266401 0.874575946021591 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8480   0.7523   3.5169  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0011   0.0042   6.4661   2.1407   2.4

***** Episode 113283, Mean R = -10.7  Std R = 4.9  Min R = -21.5
PolicyLoss: -0.0103
Policy_Beta: 0.114
Policy_Entropy: 0.176
Policy_KL: 0.00102
Policy_SD: 0.539
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 4.18e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 3.23e-05


ADV1:  0.0011474169752227802 0.005397706326563823 0.04548080459142584 -0.07289810988279921
ADV2:  -0.00914030739382508 0.8911468765070925 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.8760   1.2467   5.5865  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0008   0.0030   6.4661   2.1407   2.4885
***** Episode 113314, Mean R = -11.0  Std R = 3.7  Min R = -18.1
PolicyLoss: -0.00906
Policy_Beta: 0.114
Policy_Entropy: 0.178
Policy_KL: 0.00145
Policy_SD: 0.538
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 4.18e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 2.44e-05


ADV1:  0.0004290487916655643 0.0056924936857735

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2931   0.5890   2.7248  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0011   0.0041   6.4661   2.1407   2.4885
***** Episode 113562, Mean R = -9.2  Std R = 3.5  Min R = -19.7
PolicyLoss: -0.0291
Policy_Beta: 0.114
Policy_Entropy: 0.18
Policy_KL: 0.000812
Policy_SD: 0.527
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 4.19e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 3.81e-05


ADV1:  -0.0005961810436123156 0.006508200693148712 0.042209977218776895 -0.06090404447846484
ADV2:  0.03468805180025865 0.8058676686152848 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5113   0.5361   2.9717  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0004   0.0015   6.4661   2.1407   2.4885
***** Episode 113593, Mean R = -10.9  Std R = 3.5  Min R = -21.0
PolicyLoss: -0.0328
Policy_Beta: 0.114
Policy_Entropy: 0.177
Policy_KL: 0.001

ADV1:  -0.0010601786679613637 0.005296060630740122 0.03499259173601227 -0.059970111332706855
ADV2:  0.016891468333312898 0.8884889742857527 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6537   0.8835   4.8874  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0007   0.0028   6.4661   2.1407   2.4885
***** Episode 113841, Mean R = -11.0  Std R = 4.5  Min R = -22.4
PolicyLoss: -0.00898
Policy_Beta: 0.114
Policy_Entropy: 0.18
Policy_KL: 0.0012
Policy_SD: 0.529
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 4.2e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 4.37e-05


ADV1:  0.001382960354863671 0.004555046437876207 0.029649977487278864 -0.06504408632911529
ADV2:  -0.009495819576882931 0.8209510550708885 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3277   1.0965   4.7808  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0011   0.0038   6.4661   2.1407   

seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -0.99 |    0.96    0.97
cs_angles |  0.0022  0.0020 |  0.0726  0.0764 | -0.9861 -0.9891 |  0.9614  0.9730
optical_flow |  0.0001  0.0000 |  0.0207  0.0219 | -1.1398 -1.0770 |  0.9205  0.9527
v_err    | -0.0101 |  0.0578 | -0.4514 |  0.0922
landing_rewards |    9.87 |    1.13 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.05 |    0.01
tracking_rewards |  -15.99 |    3.94 |  -29.70 |   -9.23
steps    |     379 |      21 |     340 |     420
***** Episode 114120, Mean R = -9.6  Std R = 4.3  Min R = -19.7
PolicyLoss: -0.0119
Policy_Beta: 0.114
Policy_Entropy: 0.179
Policy_KL: 0.000992
Policy_SD: 0.517
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 4.21e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 2.98e-05


Dynamics: Max Disturbance (m/s^2):  [0.00179836 0.00129994 0.00168267] 0.0027848433135488422
ADV1:  0.0006437420103141278 0.005498075948492257 0.05401122529442093 -0.050829003273821

theta_cv |    0.23 |    0.25 |    0.00 |    1.55
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.94 |    0.99    0.97
cs_angles |  0.0048  0.0007 |  0.0753  0.0791 | -0.9904 -0.9419 |  0.9905  0.9667
optical_flow | -0.0000  0.0001 |  0.0213  0.0228 | -0.9235 -1.1575 |  0.9789  0.8712
v_err    | -0.0101 |  0.0581 | -0.4533 |  0.0960
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -16.50 |    4.20 |  -32.89 |  -10.27
steps    |     376 |      20 |     336 |     415
***** Episode 114430, Mean R = -11.3  Std R = 5.3  Min R = -23.9
PolicyLoss: -0.0224
Policy_Beta: 0.114
Policy_Entropy: 0.179
Policy_KL: 0.00122
Policy_SD: 0.531
Policy_lr_mult: 0.132
Steps: 1.15e+04
TotalSteps: 4.22e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.969
VF_0_Loss : 8.15e-05


ADV1:  0.0009834567756174851 0.0070625959320122274 0.047254235456422156 -0.09629024358137389
ADV2:  0.01584230467242984 0.8237550651

w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.04    0.03 |    0.66    1.95 |   -1.53   -3.09 |    1.33    3.11
w_f      |    0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.02 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.75
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -1.00   -0.99 |    0.88    0.98
cs_angles |  0.0043  0.0029 |  0.0720  0.0761 | -0.9966 -0.9856 |  0.8800  0.9758
optical_flow | -0.0002  0.0001 |  0.0205  0.0232 | -1.0268 -1.3187 |  0.9753  1.0426
v_err    | -0.0101 |  0.0578 | -0.4521 |  0.1019
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.03
tracking_rewards |  -16.19 |    3.83 |  -38.97 |  -10.13
steps    |     378 |  

w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01    0.12 |    0.68    1.87 |   -1.54   -3.14 |    1.53    3.13
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.74
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -0.98 |    0.97    0.97
cs_angles |  0.0024  0.0040 |  0.0782  0.0777 | -0.9798 -0.9759 |  0.9670  0.9734
optical_flow | -0.0000 -0.0001 |  0.0226  0.0219 | -1.0601 -0.9771 |  1.0735  0.9561
v_err    | -0.0102 |  0.0581 | -0.4527 |  0.1085
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.05 |    0.03
tracking_rewards |  -16.76 |    5.01 |  -53.38 |   -9.16
steps    |     377 |  

attitude |    0.02   -0.03    0.14 |    1.13    0.66    1.85 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00    0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03    0.06 |    0.65    1.85 |   -1.45   -3.14 |    1.54    3.11
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.43
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -0.99 |    0.99    0.98
cs_angles |  0.0017  0.0028 |  0.0737  0.0797 | -0.9857 -0.9917 |  0.9864  0.9811
optical_flow |  0.0000  0.0000 |  0.0204  0.0224 | -1.0364 -1.1569 |  1.0288  1.1137
v_err    | -0.0100 |  0.0576 | -0.4518 |  0.1124
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.15    0.01   -0.01 |    1.24    0.69    1.91 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.00    0.02 |    0.70    1.90 |   -1.47   -3.13 |    1.46    3.14
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.03    0.03
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.75
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -0.99   -0.99 |    0.96    0.92
cs_angles |  0.0013  0.0023 |  0.0743  0.0780 | -0.9863 -0.9861 |  0.9564  0.9187
optical_flow |  0.0001 -0.0001 |  0.0203  0.0213 | -0.9472 -1.2461 |  1.2875  0.9049
v_err    | -0.0099 |  0.0575 | -0.4523 |  0.1153
landing_rewards |    9.87 |    1.13 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.01   -0.01 |    0.65    1.85 |   -1.54   -3.13 |    1.55    3.11
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.04    0.03    0.02
w_rewards |   -0.00 |    0.00 |   -0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.23 |    0.25 |    0.00 |    1.35
seeker_angles |   -0.00    0.00 |    0.07    0.08 |   -0.97   -0.95 |    0.99    0.99
cs_angles | -0.0009  0.0004 |  0.0743  0.0810 | -0.9667 -0.9459 |  0.9905  0.9878
optical_flow |  0.0001  0.0002 |  0.0219  0.0235 | -1.0945 -0.9846 |  1.0472  1.2047
v_err    | -0.0103 |  0.0575 | -0.4535 |  0.1011
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -16.56 |    4.10 |  -40.24 |   -9.93
steps    |     379 |  

attitude |    0.18    0.00   -0.04 |    1.11    0.68    1.76 |   -3.14   -1.53   -3.14 |    3.14    1.54    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.01   -0.01 |    0.68    1.77 |   -1.33   -3.11 |    1.43    3.13
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.04    0.02    0.03
w_rewards |   -0.00 |    0.00 |   -0.00 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.24 |    0.26 |    0.00 |    1.51
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.96   -1.00 |    0.98    0.97
cs_angles |  0.0016  0.0033 |  0.0776  0.0827 | -0.9621 -0.9997 |  0.9753  0.9691
optical_flow | -0.0001 -0.0001 |  0.0221  0.0231 | -1.2358 -0.9719 |  1.0531  1.1175
v_err    | -0.0105 |  0.0581 | -0.4524 |  0.1021
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00   -0.00   -0.01 |    0.67    0.69    0.67 |   -3.43   -3.36   -3.41 |    3.26    3.44    3.46
norm_thrust |    0.90 |    0.76 |    0.00 |    3.46
fuel     |    1.52 |    0.19 |    1.09 |    2.13
rewards  |  -11.61 |    5.36 |  -44.15 |   -2.85
fuel_rewards |   -4.34 |    0.55 |   -6.08 |   -3.14
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.91 |   13.05 |    0.00 |  443.18
norm_af  |    1.78 |    0.89 |    0.07 |    3.32
norm_wf  |    0.01 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.04   -0.03   -0.12 |    1.17    0.65    1.86 |   -3.14   -1.55   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |   -0.03   -0.11 |    0.66

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0735   0.8921   4.9897  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0001   0.0006   6.4661   2.1407   2.4885
Update Cnt = 3770    ET =   1026.6   Stats:  Mean, Std, Min, Max
r_f      |    6.20    8.22   11.50 |  185.44  170.29  199.50 | -395.35 -368.94 -390.92 |  368.36  361.06  383.20
v_f      |   -0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.08   -0.08   -0.10 |    0.09    0.08    0.10
r_i      |   34.42   45.40   39.91 |  673.94  682.23  756.61 |-1308.13-1259.78-1289.16 | 1326.52 1310.72 1277.54
v_i      |   -0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.09    0.10
norm_rf  |    0.16 |    0.06 |    0.04 |    0.44
norm_vf  |    0.07 |    0.01 |    0.04 |    0.11
gs_f     |    1.29 |    2.03 |    0.00 |   17.83
thrust   |    0.01   -0.00   -0.00 |    0.66    0.68    0.67 |   -3.34   -3.43   -3.45 |    3.38    3.25    3.31
norm_thrust |    

ADV1:  -0.000168499228254402 0.006500569118695245 0.04786567604458819 -0.0456675070891735
ADV2:  0.022850730014090964 0.8512178549461343 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5761   0.8470   4.3113  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0006   0.0019   6.4661   2.1407   2.4885
***** Episode 117189, Mean R = -11.5  Std R = 5.7  Min R = -30.4
PolicyLoss: -0.0253
Policy_Beta: 0.114
Policy_Entropy: 0.183
Policy_KL: 0.00112
Policy_SD: 0.515
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 4.33e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 4.11e-05


ADV1:  -0.0011660759401804551 0.006260764235824626 0.04112423953234845 -0.05704740011007055
ADV2:  0.040898538199524874 0.782045094206719 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8007   0.8019   4.0238  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0006   0.0033   6.4661   2.1407   2.

***** Episode 117437, Mean R = -11.0  Std R = 3.9  Min R = -20.7
PolicyLoss: -0.0143
Policy_Beta: 0.114
Policy_Entropy: 0.181
Policy_KL: 0.00099
Policy_SD: 0.531
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 4.34e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 3.94e-05


ADV1:  -6.685967121987935e-05 0.004991660816196426 0.0380377160786915 -0.054917370504052154
ADV2:  -0.004383486197539178 0.9073525627387887 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9997   1.2613   6.1176  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0001   0.0001   0.0003   6.4661   2.1407   2.4885
***** Episode 117468, Mean R = -10.5  Std R = 3.2  Min R = -17.2
PolicyLoss: 0.00274
Policy_Beta: 0.114
Policy_Entropy: 0.181
Policy_KL: 0.00102
Policy_SD: 0.534
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 4.34e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 3.03e-05


ADV1:  -0.002055238255327574 0.00608648109775

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9810   1.0135   5.3817  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0003   0.0013   6.4661   2.1407   2.4885
***** Episode 117716, Mean R = -12.0  Std R = 4.6  Min R = -27.7
PolicyLoss: -0.0189
Policy_Beta: 0.114
Policy_Entropy: 0.183
Policy_KL: 0.0013
Policy_SD: 0.531
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 4.35e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 3.42e-05


ADV1:  0.0001376025651635246 0.007749611188265228 0.03996421479123097 -0.04893879192242862
ADV2:  0.02859024764836913 0.8293332625527836 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8663   1.0461   5.5159  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0005   6.4661   2.1407   2.4885
***** Episode 117747, Mean R = -10.9  Std R = 5.4  Min R = -23.9
PolicyLoss: -0.0343
Policy_Beta: 0.114
Policy_Entropy: 0.181
Policy_KL: 0.0011

ADV1:  0.0036990959134996517 0.0062794486720939655 0.03044354085571152 -0.053027467164355635
ADV2:  -0.03271709316021774 0.8922848243904313 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7320   0.8595   4.8889  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0046   0.0029   0.0097   6.4661   2.1407   2.4885
***** Episode 117995, Mean R = -11.0  Std R = 4.1  Min R = -20.5
PolicyLoss: -0.0184
Policy_Beta: 0.114
Policy_Entropy: 0.181
Policy_KL: 0.00114
Policy_SD: 0.536
Policy_lr_mult: 0.132
Steps: 1.14e+04
TotalSteps: 4.36e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 4.28e-05


ADV1:  -0.004586145966716309 0.0085145573483428 0.04098608993531949 -0.0541346341307943
ADV2:  0.060712058753843334 0.8611958306567177 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.7952   2.0179   9.9821  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0048   0.0031   0.0118   6.4661   2.1407   2.

***** Episode 118243, Mean R = -10.3  Std R = 3.4  Min R = -20.9
PolicyLoss: -0.0286
Policy_Beta: 0.114
Policy_Entropy: 0.18
Policy_KL: 0.000844
Policy_SD: 0.536
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 4.37e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 4.35e-05


ADV1:  0.002352747902613116 0.005124926532121412 0.02810795440028624 -0.05180143163968215
ADV2:  -0.0254813578056156 0.9011733063067727 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.3030   1.7097   9.0465  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0039   0.0021   0.0066   6.4661   2.1407   2.4885
***** Episode 118274, Mean R = -10.2  Std R = 4.7  Min R = -24.1
PolicyLoss: -0.0152
Policy_Beta: 0.114
Policy_Entropy: 0.18
Policy_KL: 0.00158
Policy_SD: 0.535
Policy_lr_mult: 0.132
Steps: 1.15e+04
TotalSteps: 4.37e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 1.97e-05


ADV1:  -0.000706463049862506 0.006560518662725007 0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6291   0.8449   4.5034  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0035   0.0019   0.0066   6.4661   2.1407   2.4885
***** Episode 118522, Mean R = -10.7  Std R = 4.6  Min R = -25.1
PolicyLoss: -0.0357
Policy_Beta: 0.114
Policy_Entropy: 0.179
Policy_KL: 0.000972
Policy_SD: 0.53
Policy_lr_mult: 0.132
Steps: 1.18e+04
TotalSteps: 4.38e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 4.2e-05


ADV1:  0.003419917699838117 0.004749813001540363 0.04401822065924338 -0.02932687758620431
ADV2:  -0.05686303301442584 0.9118017361295742 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1395   1.2772   7.0816  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0040   0.0025   0.0089   6.4661   2.1407   2.4885
***** Episode 118553, Mean R = -9.7  Std R = 4.5  Min R = -20.1
PolicyLoss: -0.0026
Policy_Beta: 0.114
Policy_Entropy: 0.179
Policy_KL: 0.00121


ADV1:  -0.00017525630804881675 0.00678192195132542 0.04371993033907806 -0.04681358685096105
ADV2:  0.025239019671304222 0.846540097539318 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5925   1.0333   4.6697  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0012   6.4661   2.1407   2.4885
***** Episode 118801, Mean R = -11.5  Std R = 5.4  Min R = -33.6
PolicyLoss: -0.0286
Policy_Beta: 0.114
Policy_Entropy: 0.18
Policy_KL: 0.00135
Policy_SD: 0.541
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 4.39e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 3.89e-05


ADV1:  -0.0004419970776300432 0.007163557956524352 0.03024218938518869 -0.06895632430560443
ADV2:  0.03385682305961537 0.7988551439005785 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1066   0.6213   3.0356  27.0893  20.3031  12.6669
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0012   6.4661   2.1407   2.

cs_angles |  0.0027  0.0018 |  0.0743  0.0780 | -0.9363 -0.9966 |  0.9953  0.9932
optical_flow |  0.0000 -0.0000 |  0.0212  0.0224 | -0.9963 -1.0824 |  1.0407  1.2699
v_err    | -0.0102 |  0.0578 | -0.4531 |  0.0989
landing_rewards |    9.81 |    1.38 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -16.36 |    4.28 |  -38.18 |   -9.14
steps    |     378 |      20 |     332 |     417
***** Episode 119080, Mean R = -11.4  Std R = 5.6  Min R = -25.8
PolicyLoss: -0.0349
Policy_Beta: 0.114
Policy_Entropy: 0.181
Policy_KL: 0.000949
Policy_SD: 0.534
Policy_lr_mult: 0.132
Steps: 1.17e+04
TotalSteps: 4.4e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 5.42e-05


ADV1:  0.0013555158570633457 0.006651901166880877 0.050240436368284125 -0.05178062537141825
ADV2:  0.015547833215262865 0.8085296993081269 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1070   0.9528   5.0359  27.0893  20.3031  12.6669
ValFun  Gradient

attitude |   -0.04    0.01   -0.20 |    1.26    0.65    1.90 |   -3.14   -1.55   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.02   -0.15 |    0.65    1.89 |   -1.45   -3.14 |    1.43    3.13
w_f      |    0.00   -0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.04    0.02
w_rewards |   -0.00 |    0.00 |   -0.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.22 |    0.25 |    0.00 |    1.59
seeker_angles |    0.00    0.00 |    0.07    0.08 |   -1.00   -0.98 |    1.00    0.99
cs_angles |  0.0025  0.0016 |  0.0722  0.0761 | -0.9957 -0.9779 |  0.9999  0.9938
optical_flow |  0.0001 -0.0001 |  0.0213  0.0233 | -1.2420 -1.0932 |  1.1409  1.0899
v_err    | -0.0101 |  0.0577 | -0.4531 |  0.1001
landing_rewards |    9.84 |    1.26 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00   -0.01   -0.00 |    0.66    0.67    0.66 |   -3.34   -3.21   -3.45 |    3.45    3.43    3.44
norm_thrust |    0.87 |    0.75 |    0.00 |    3.46
fuel     |    1.49 |    0.18 |    1.05 |    2.17
rewards  |  -10.55 |    4.68 |  -31.19 |   -2.71
fuel_rewards |   -4.29 |    0.53 |   -6.21 |   -3.04
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.03 |   13.24 |    0.00 |  179.85
norm_af  |    1.66 |    0.86 |    0.03 |    3.28
norm_wf  |    0.01 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.03    0.06   -0.12 |    1.12    0.67    1.77 |   -3.14   -1.49   -3.14 |    3.14    1.57    3.14
w        |    0.00   -0.00   -0.00 |    0.01    0.00    0.00 |   -0.05   -0.05   -0.05 |    0.05    0.05    0.05
a_f      |    0.06   -0.13 |    0.68

In [8]:
# Checkpoint the policy after the optimization run above.
# `fname` is the base name handed to `policy.save_params`; the exact file(s)
# written and their location are decided inside that method
# (presumably the Policy class imported from policy_ppo -- TODO confirm).
fname = "optimize_WATTVW_FOV-AR=5"
policy.save_params(fname)


In [5]:
# Evaluate `agent` in `env` with test_mode=True.
# The positional 5000 is presumably the number of test episodes and
# print_every=100 the reporting interval -- TODO confirm against
# Env.test_policy_batch.
# NOTE(review): the recorded output for this cell ends in KeyboardInterrupt,
# i.e. the saved run was stopped manually before finishing.
env.test_policy_batch(agent,5000,print_every=100,test_mode=True)

worked 1


KeyboardInterrupt: 