# Test Recurrent Policy with Extreme Parameter Variation 

In [1]:
import numpy as np
import os,sys



sys.path.append('../../../RL_lib/Agents')
sys.path.append('../../../RL_lib/Policies/PPO')
sys.path.append('../../../RL_lib/Policies/Common')
sys.path.append('../../../RL_lib/Utils')
sys.path.append('../../../Env')
sys.path.append('../../../Imaging')


%load_ext autoreload
%load_ext autoreload
%autoreload 2
%matplotlib nbagg
import os
print(os.getcwd())

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
/Users/briangaudet/Study/Subjects/MachineLearning/Projects/Asteroid_CPO_seeker-master/Experiments/Extended/Optimize_HF


In [2]:
%%html
<style>
/* Let output areas grow with their content, capped at max-height. */
.output_wrapper, .output {
    height:auto !important;
    max-height:1000px;  /* your desired max-height here */
}
/* Remove the inset shadow drawn on scrolling output areas. The vendor-prefixed
   property needs its leading hyphen; without it the declaration is ignored. */
.output_scroll {
    -webkit-box-shadow:none !important;
    box-shadow:none !important;
}
</style>

# Optimize Policy

In [3]:
from env import Env
import env_utils as envu
from dynamics_model import Dynamics_model
from lander_model import Lander_model
from ic_gen import Landing_icgen
import rl_utils
import attitude_utils as attu
import optics_utils as optu
from arch_policy_vf import Arch

from policy_ppo import Policy
from softmax_pd import Softmax_pd as PD
from value_function import Value_function

import policy_nets as policy_nets
import valfunc_nets as valfunc_nets


from agent import Agent


import torch.nn as nn

from flat_constraint import Flat_constraint
from glideslope_constraint import Glideslope_constraint
from rh_constraint import RH_constraint
from no_attitude_constraint import Attitude_constraint
from w_constraint import W_constraint
from reward_attitude import Reward
from asteroid_hfr import Asteroid

from thruster_model_cubesat import Thruster_model

from sensor import Sensor
from seeker import Seeker

# Build the asteroid-landing environment, the recurrent PPO policy and value
# function, and the agent, then start training. Statement order matters: several
# constructors print to the cell output as they run (see the recorded output).

# Landing-site settings shared by the sensor, the lander model and the Env.
# landing_site=None means no explicit site is passed as landing_site_override.
landing_site_range = 0.0
landing_site = None #np.asarray([-250.,0.,0.])

# omega_range is handed to the asteroid model as a (low, high) pair;
# presumably the asteroid rotation-rate range -- TODO confirm in asteroid_hfr.
asteroid_model = Asteroid(landing_site_override=landing_site, omega_range=(1e-5,5e-4))

# One attitude parameterization object is shared by the seeker, sensor,
# lander model, initial-condition generator and attitude constraint.
ap = attu.Quaternion_attitude()

# Seeker mounting: C_cb comes from rotate_optical_axis(0, 0, pi) and r_cb is a
# zero offset. The recorded output prints C_cb as diag(1, -1, -1) up to rounding.
C_cb = optu.rotate_optical_axis(0.0, 0.0, np.pi)
r_cb = np.asarray([0,0,0])
# 90 passed through envu.deg2rad (degrees -> radians, going by the helper name).
fov=envu.deg2rad(90)
seeker = Seeker(attitude_parameterization=ap, C_cb=C_cb, r_cb=r_cb,
                radome_slope_bounds=(-0.05,0.05), range_bias=(-0.05,0.05),
                   fov=fov, debug=False)
sensor = Sensor(seeker, attitude_parameterization=ap,  use_range=True, apf_tau1=300, use_dp=False,
                      landing_site_range=landing_site_range,
                      pool_type='max', state_type=Sensor.optflow_state_range_dp1)
# Force the sensor's tracking function to track_func1, printing it before and
# after. NOTE(review): in the recorded output both prints already show
# track_func1, so this override looks like a no-op for this configuration.
print(sensor.track_func)
sensor.track_func = sensor.track_func1
print(sensor.track_func)
logger = rl_utils.Logger()
dynamics_model = Dynamics_model(h=2)
thruster_model = Thruster_model(pulsed=True, scale=1.0, offset=0.4)
lander_model = Lander_model(asteroid_model, thruster_model, attitude_parameterization=ap, sensor=sensor, 
                             landing_site_range=landing_site_range, com_range=(-0.10,0.10),
                              attitude_bias=0.05, omega_bias=0.05)

# Select which state-extraction method the agent sees by rebinding the
# generic get_state_agent hook to a specific variant.
lander_model.get_state_agent = lander_model.get_state_agent_sensor_att_w2

# Network sizing. obs_dim must match the vector produced by get_state_agent
# (the recorded output shows a first Linear layer with in_features=13).
# logit_dim = 12 * 2 = 24, matching the final policy layer (out_features=24).
obs_dim = 13
action_dim = 12
actions_per_dim = 2
logit_dim = action_dim * actions_per_dim

# Passed to the policy net, the value-function net and the Agent below, so all
# three use the same recurrent step count.
recurrent_steps = 60

# Reward configuration: limits, bias and per-term coefficients.
reward_object = Reward(landing_rlimit=2, landing_vlimit=0.1, 
                       tracking_bias=0.01, fov_coeff=-50., 
                       att_coeff=-0.20,
                       tracking_coeff=-0.5, magv_coeff=-1.0,
                       fuel_coeff=-0.10,  landing_coeff=10.0)

# Constraint objects handed to the Env.
# NOTE(review): shape_constraint is constructed but never passed to Env in this
# cell; its constructor appears to print "Flat Constraint" in the recorded
# output. Confirm whether it should be wired in or removed.
glideslope_constraint = Glideslope_constraint(gs_limit=-1.0)
shape_constraint = Flat_constraint()
attitude_constraint = Attitude_constraint(ap)
w_constraint = W_constraint(w_limit=(0.1,0.1,0.1), w_margin=(0.05,0.05,0.05))
rh_constraint = RH_constraint(rh_limit=150)

# wi gives symmetric lower/upper bounds (-wi, +wi) on each component of
# lander_wll / lander_wul in the initial-condition generator.
wi=0.05
ic_gen = Landing_icgen((800,1000), 
                           p_engine_fail=0.5,
                           engine_fail_scale=(0.5,1.0),
                           lander_wll=(-wi,-wi,-wi),
                           lander_wul=(wi,wi,wi),
                           attitude_parameterization=ap,
                           position_error=(0,np.pi/4),
                           heading_error=(0,np.pi/8),
                           attitude_error=(0,np.pi/16),
                           min_mass=450, max_mass=500,
                           mag_v=(0.05,0.1),
                           debug=False,
                           inertia_uncertainty_diag=10.0,
                           inertia_uncertainty_offdiag=1.0)

# Assemble the environment from the generator, models, reward and constraints.
env = Env(ic_gen, lander_model, dynamics_model, logger,
          landing_site_range=landing_site_range,
          debug_done=False,
          reward_object=reward_object,
          glideslope_constraint=glideslope_constraint,
          attitude_constraint=attitude_constraint,
          w_constraint=w_constraint,
          rh_constraint=rh_constraint,
          tf_limit=5000.0,print_every=10,nav_period=6)




# Display the initial-condition generator settings for the record.
env.ic_gen.show()

arch = Arch()

# Recurrent (GRU) policy producing logit_dim logits, paired with a softmax
# distribution over actions_per_dim choices for each of action_dim dimensions.
# shuffle=False is set explicitly; the recorded output also reports
# "recurrent steps > 1, disabling shuffle".
policy = Policy(policy_nets.GRU1(obs_dim, logit_dim, recurrent_steps=recurrent_steps), 
                PD(action_dim, actions_per_dim),
                shuffle=False,
                kl_targ=0.001,epochs=20, beta=0.1, servo_kl=True, max_grad_norm=30, scale_vector_obs=True,
                init_func=rl_utils.xn_init)
# Recurrent value function. batch_size=9999999 is presumably meant as
# "one batch for the whole rollout" -- TODO confirm against Value_function.
value_function = Value_function(valfunc_nets.GRU1(obs_dim, recurrent_steps=recurrent_steps), scale_obs=True,
                                shuffle=False, batch_size=9999999, max_grad_norm=30, 
                                verbose=False)

# The fourth positional argument is None; its role is not visible from this
# cell. env.rl_stats is passed as the training monitor.
agent = Agent(arch, policy, value_function, None, env, logger,
              policy_episodes=30, policy_steps=3000, gamma1=0.95, gamma2=0.995, 
              recurrent_steps=recurrent_steps, monitor=env.rl_stats)
# Long-running call: starts training. The argument is presumably the number of
# training episodes -- TODO confirm against Agent.train.
agent.train(120000)

Quaternion_attitude
Euler321 Attitude
C_cb: 
[[ 1.0000000e+00  0.0000000e+00 -0.0000000e+00]
 [ 0.0000000e+00 -1.0000000e+00  1.2246468e-16]
 [ 0.0000000e+00 -1.2246468e-16 -1.0000000e+00]]
[ 0.0000000e+00 -1.2246468e-16 -1.0000000e+00]
using max  pooling
V4: Output State type:  <function Sensor.optflow_state_range_dp1 at 0x135b15488>
<bound method Sensor.track_func1 of <sensor.Sensor object at 0x1260ac780>>
<bound method Sensor.track_func1 of <sensor.Sensor object at 0x1260ac780>>
6dof dynamics model 
thruster model: 
Inertia Tensor:  [[333.33333333   0.           0.        ]
 [  0.         333.33333333   0.        ]
 [  0.           0.         333.33333333]]
Lander Model: 
Reward_terminal equator
queue fixed
Flat Constraint
Attitude Constraint
Rotational Velocity Constraint
Position Hysterises Constraint


<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

lander env RHL
Landing_icgen:
[[-1.]
 [ 1.]]
Policy with vectorized sample
	xn_init: layer  Linear(in_features=13, out_features=130, bias=True)
	xn_init: layer  GRUCell(130, 176)
	xn_init: layer  Linear(in_features=176, out_features=240, bias=True)
	xn_init: layer  Linear(in_features=240, out_features=24, bias=True)
Policy: recurrent steps > 1, disabling shuffle
	Test Mode:          False
	Clip Param:         0.1
	Shuffle :           False
	Shuffle by Chunks:  False
	Max Grad Norm:      30
	Recurrent Steps:    60
	Rollout Limit:      1
	Advantage Func:     <advantage_utils.Adv_default object at 0x137bb9240>
	Advantage Norm:     <function Adv_normalizer.apply at 0x134c70488>
	PD:                 <softmax_pd.Softmax_pd object at 0x137baffd0>
	Loss Function:      <bound method Policy.calc_loss1 of <policy_ppo.Policy object at 0x137bb9080>>
Value Funtion
	xn_init: layer  Linear(in_features=13, out_features=130, bias=True)
	xn_init: layer  GRUCell(130, 25)
	xn_init: layer  Linear(in_feature

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0957   0.0247   0.1316   0.1735   0.1166   0.0364
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4722   0.2573   0.9992   8.0871   2.2896   2.8947
***** Episode 234, Mean R = -236.8  Std R = 76.6  Min R = -458.3
PolicyLoss: -0.015
Policy_Beta: 0.0667
Policy_Entropy: 0.000334
Policy_KL: 0.00172
Policy_SD: 0.956
Policy_lr_mult: 1
Steps: 3.76e+03
TotalSteps: 2.22e+04
VF_0_ExplainedVarNew: 0.0567
VF_0_ExplainedVarOld: 0.0394
VF_0_Loss : 0.749


ADV1:  0.1982832627301218 0.7651490961746018 1.2131314463679568 -3.645914965693663
ADV2:  -0.0422580369192737 0.8558418050571811 1.146745606147643 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1029   0.0257   0.1355   0.1735   0.1166   0.0364
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4052   0.2280   0.9313   8.0871   2.2896   2.8947
***** Episode 265, Mean R = -265.7  Std R = 108.5  Min R = -549.4
PolicyLoss: -0.0241
Policy_Beta: 0.0667
Policy_Entropy: 0.000336
Policy_

ADV1:  0.05286150920151628 0.4385158658297476 0.754511477909946 -4.096960597369948
ADV2:  0.031240070879257502 0.6938857375189396 1.5015845951186102 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0691   0.0099   0.0794   0.1735   0.1166   0.0364
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1195   0.0542   0.2446   8.0871   2.2896   2.8947
***** Episode 513, Mean R = -405.7  Std R = 184.4  Min R = -1032.0
PolicyLoss: -0.0532
Policy_Beta: 0.0667
Policy_Entropy: 0.000366
Policy_KL: 0.00114
Policy_SD: 0.955
Policy_lr_mult: 1
Steps: 9.24e+03
TotalSteps: 8.2e+04
VF_0_ExplainedVarNew: 0.222
VF_0_ExplainedVarOld: 0.185
VF_0_Loss : 0.199


*** RH VIO  CNT:  100
ADV1:  0.017712442602509516 0.33576935438382766 0.5871538800216337 -3.7359625089851605
ADV2:  0.03323102914238187 0.7163026849382153 1.620223998592397 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0707   0.0141   0.0915   0.1735   0.1166   0.0364
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0538   0

***** Episode 761, Mean R = -472.5  Std R = 206.8  Min R = -860.3
PolicyLoss: -0.0377
Policy_Beta: 0.0667
Policy_Entropy: 0.000379
Policy_KL: 0.00101
Policy_SD: 0.955
Policy_lr_mult: 1
Steps: 1.1e+04
TotalSteps: 1.69e+05
VF_0_ExplainedVarNew: 0.592
VF_0_ExplainedVarOld: 0.57
VF_0_Loss : 0.0528


ADV1:  0.008663685865924729 0.2049161484039514 0.9097309914678394 -3.506064991463764
ADV2:  0.022734925882551483 0.7707109638836905 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0833   0.0153   0.1106   0.1735   0.1166   0.0364
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0190   0.0071   0.0363   8.0871   2.2896   2.8947
***** Episode 792, Mean R = -407.8  Std R = 163.9  Min R = -987.2
PolicyLoss: -0.0329
Policy_Beta: 0.0667
Policy_Entropy: 0.000386
Policy_KL: 0.00105
Policy_SD: 0.956
Policy_lr_mult: 1
Steps: 9.57e+03
TotalSteps: 1.79e+05
VF_0_ExplainedVarNew: 0.678
VF_0_ExplainedVarOld: 0.665
VF_0_Loss : 0.0452


ADV1:  -0.03614858562287244 0.2721558921939325 0.45254208

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0994   0.0274   0.1406   0.1735   0.1166   0.0364
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0383   0.0136   0.0716   8.0871   2.2896   2.8947
***** Episode 1040, Mean R = -450.8  Std R = 199.9  Min R = -996.0
PolicyLoss: -0.00415
Policy_Beta: 0.0667
Policy_Entropy: 0.000395
Policy_KL: 0.00102
Policy_SD: 0.956
Policy_lr_mult: 1
Steps: 1.07e+04
TotalSteps: 2.69e+05
VF_0_ExplainedVarNew: 0.706
VF_0_ExplainedVarOld: 0.673
VF_0_Loss : 0.0357


ADV1:  -0.02575689718389415 0.16003439371352002 0.5382460112950894 -1.4667655245463074
ADV2:  0.04153560231775345 0.8274029658900593 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0821   0.0137   0.1085   0.1735   0.1166   0.0364
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0422   0.0189   0.0929   8.0871   2.2896   2.8947
***** Episode 1071, Mean R = -470.6  Std R = 158.8  Min R = -839.7
PolicyLoss: -0.0346
Policy_Beta: 0.0667
Policy_Entropy: 0.000411
Policy_KL: 0.

ADV1:  -0.010712716911414568 0.16402754605628456 1.612126021385193 -1.374746541338646
ADV2:  0.02050670400929557 0.8246919743091553 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1284   0.0319   0.1945   0.1945   0.1284   0.0364
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0343   0.0131   0.0563   8.0871   2.2896   2.8947
***** Episode 1319, Mean R = -471.0  Std R = 161.5  Min R = -865.5
PolicyLoss: -0.0202
Policy_Beta: 0.0667
Policy_Entropy: 0.00044
Policy_KL: 0.0012
Policy_SD: 0.953
Policy_lr_mult: 1
Steps: 1.15e+04
TotalSteps: 3.75e+05
VF_0_ExplainedVarNew: 0.767
VF_0_ExplainedVarOld: 0.754
VF_0_Loss : 0.0432


*** RH VIO  CNT:  600
ADV1:  -0.0011050142128018153 0.16039277854809822 1.4609785029439555 -1.1799387287209915
ADV2:  0.015368958308657341 0.8166622887445651 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1345   0.0230   0.1828   0.1945   0.1345   0.0364
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0188   0.0063   0.0320   8.0871 

seeker_angles |    0.03    0.05 |    0.34    0.34 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0314  0.0535 |  0.3410  0.3438 | -0.9996 -0.9995 |  1.0000  0.9999
optical_flow |  0.0002  0.0006 |  0.0025  0.0026 | -0.0211 -0.0300 |  0.0294  0.0303
v_err    | -0.3993 |  0.1898 | -1.0549 |  0.8343
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  764.07 |  299.84 |  109.35 | 1271.09
tracking_rewards | -378.48 |  139.85 | -957.56 | -149.92
steps    |     380 |     125 |     124 |     834
***** Episode 1598, Mean R = -401.6  Std R = 101.0  Min R = -660.7
PolicyLoss: -0.0299
Policy_Beta: 0.0667
Policy_Entropy: 0.000511
Policy_KL: 0.00116
Policy_SD: 0.953
Policy_lr_mult: 1
Steps: 1.16e+04
TotalSteps: 4.81e+05
VF_0_ExplainedVarNew: 0.819
VF_0_ExplainedVarOld: 0.8
VF_0_Loss : 0.0416


ADV1:  0.012219085722116963 0.1557632158713779 1.877559479077657 -1.1039533911112
ADV2:  -0.007113525860595024 0.8381637719863944 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max 

w        |   -0.00    0.00   -0.00 |    0.02    0.02    0.02 |   -0.10   -0.09   -0.09 |    0.09    0.09    0.08
a_f      |    0.07   -0.12 |    0.68    1.81 |   -1.49   -3.12 |    1.56    3.12
w_f      |   -0.00    0.00   -0.00 |    0.02    0.02    0.02 |   -0.06   -0.06   -0.05 |    0.06    0.05    0.06
w_rewards |   -0.87 |    0.81 |   -4.27 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -43.06 |   17.28 |  -50.00 |    0.00
theta_cv |    1.31 |    0.65 |    0.01 |    3.13
seeker_angles |    0.12    0.07 |    0.32    0.35 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.1222  0.0651 |  0.3208  0.3455 | -0.9999 -1.0000 |  1.0000  1.0000
optical_flow |  0.0014  0.0006 |  0.0034  0.0032 | -0.0379 -0.0721 |  0.0562  0.0368
v_err    | -0.2755 |  0.2226 | -1.1299 |  0.9837
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  564.85 |  267.82 |   37.03 | 1266.54
tracking_rewards | -268.54 |  100.01 | -817.81 | -119.59
steps    |     332 |  

w        |   -0.00    0.00   -0.00 |    0.02    0.02    0.02 |   -0.08   -0.09   -0.08 |    0.08    0.08    0.08
a_f      |    0.05    0.13 |    0.64    1.81 |   -1.40   -3.14 |    1.46    3.12
w_f      |   -0.00   -0.00   -0.00 |    0.02    0.02    0.02 |   -0.05   -0.05   -0.05 |    0.06    0.06    0.05
w_rewards |   -0.41 |    0.48 |   -3.14 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -46.61 |   12.57 |  -50.00 |    0.00
theta_cv |    1.07 |    0.57 |    0.01 |    3.12
seeker_angles |    0.08    0.02 |    0.33    0.34 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0753  0.0234 |  0.3280  0.3370 | -0.9999 -0.9996 |  0.9999  1.0000
optical_flow |  0.0012  0.0003 |  0.0046  0.0044 | -0.1005 -0.2108 |  0.0898  0.2004
v_err    | -0.1554 |  0.2511 | -1.0737 |  1.0149
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  432.38 |  222.84 |   13.52 | 1167.18
tracking_rewards | -187.70 |   59.69 | -585.15 |  -84.25
steps    |     283 |  

w        |    0.00    0.00   -0.00 |    0.02    0.02    0.02 |   -0.08   -0.07   -0.08 |    0.10    0.08    0.09
a_f      |   -0.09   -0.07 |    0.70    1.88 |   -1.45   -3.12 |    1.41    3.14
w_f      |   -0.00   -0.00   -0.00 |    0.02    0.02    0.02 |   -0.05   -0.05   -0.05 |    0.05    0.06    0.05
w_rewards |   -0.33 |    0.43 |   -2.75 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -46.77 |   12.28 |  -50.00 |    0.00
theta_cv |    0.89 |    0.50 |    0.00 |    3.13
seeker_angles |    0.06   -0.01 |    0.32    0.34 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0586 -0.0069 |  0.3209  0.3423 | -1.0000 -1.0000 |  0.9997  0.9999
optical_flow |  0.0015 -0.0002 |  0.0046  0.0048 | -0.1387 -0.0635 |  0.0805  0.0979
v_err    | -0.0886 |  0.2363 | -1.1964 |  0.8958
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  379.62 |  186.58 |   14.87 | 1267.10
tracking_rewards | -150.54 |   34.70 | -407.42 |  -89.69
steps    |     261 |  

w        |    0.00    0.00   -0.00 |    0.02    0.02    0.02 |   -0.08   -0.08   -0.09 |    0.09    0.09    0.09
a_f      |   -0.04   -0.01 |    0.69    1.87 |   -1.43   -3.14 |    1.52    3.12
w_f      |   -0.00   -0.00   -0.00 |    0.02    0.02    0.02 |   -0.04   -0.04   -0.04 |    0.04    0.04    0.05
w_rewards |   -0.43 |    0.46 |   -2.47 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -47.10 |   11.69 |  -50.00 |    0.00
theta_cv |    0.78 |    0.45 |    0.00 |    3.10
seeker_angles |    0.10   -0.02 |    0.33    0.34 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0988 -0.0197 |  0.3285  0.3378 | -0.9996 -1.0000 |  0.9998  1.0000
optical_flow |  0.0016 -0.0006 |  0.0047  0.0047 | -0.1331 -0.0490 |  0.0641  0.0598
v_err    | -0.0824 |  0.1964 | -0.7044 |  0.8201
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  357.18 |  156.05 |   27.28 |  776.55
tracking_rewards | -132.31 |   25.28 | -235.71 |  -81.01
steps    |     261 |  

w        |    0.00    0.00   -0.00 |    0.02    0.02    0.02 |   -0.09   -0.08   -0.09 |    0.10    0.09    0.08
a_f      |    0.04    0.04 |    0.66    1.82 |   -1.50   -3.13 |    1.44    3.14
w_f      |   -0.00   -0.00    0.00 |    0.02    0.02    0.02 |   -0.04   -0.04   -0.04 |    0.10    0.04    0.04
w_rewards |   -0.52 |    0.53 |   -2.66 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |  -47.42 |   11.06 |  -50.00 |    0.00
theta_cv |    0.71 |    0.41 |    0.00 |    3.10
seeker_angles |    0.07   -0.02 |    0.32    0.34 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0707 -0.0152 |  0.3168  0.3401 | -0.9993 -0.9999 |  0.9998  0.9996
optical_flow |  0.0011 -0.0004 |  0.0054  0.0059 | -0.0728 -0.0949 |  0.1073  0.1657
v_err    | -0.0793 |  0.1702 | -0.8175 |  0.7085
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  304.25 |  166.58 |    4.24 |  905.85
tracking_rewards | -123.59 |   24.15 | -240.10 |   -7.98
steps    |     273 |  

w        |    0.00    0.00   -0.00 |    0.02    0.02    0.02 |   -0.08   -0.08   -0.10 |    0.10    0.10    0.08
a_f      |    0.03    0.04 |    0.63    1.84 |   -1.42   -3.13 |    1.55    3.12
w_f      |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.04   -0.04 |    0.10    0.04    0.04
w_rewards |   -0.57 |    0.55 |   -2.61 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |  -48.23 |    9.25 |  -50.00 |    0.00
theta_cv |    0.66 |    0.38 |    0.00 |    3.12
seeker_angles |    0.06   -0.03 |    0.32    0.34 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0622 -0.0309 |  0.3222  0.3352 | -1.0000 -0.9998 |  0.9999  0.9997
optical_flow |  0.0008 -0.0005 |  0.0063  0.0066 | -0.1200 -0.1349 |  0.1117  0.3452
v_err    | -0.0654 |  0.1523 | -0.6975 |  0.6138
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  258.13 |  149.79 |    5.39 |  865.51
tracking_rewards | -114.32 |   23.63 | -208.44 |   -7.64
steps    |     279 |  

norm_thrust |    1.55 |    0.66 |    0.00 |    3.46
fuel     |    4.34 |    0.77 |    2.48 |    6.27
rewards  | -171.73 |   24.61 | -287.03 | -108.25
fuel_rewards |  -12.43 |    2.20 |  -17.93 |   -7.10
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    4.56 |   18.28 |    0.01 |  388.45
norm_af  |    1.81 |    0.90 |    0.09 |    3.31
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.02   -0.04   -0.04 |    1.24    0.64    1.92 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.02    0.02    0.02 |   -0.08   -0.07   -0.09 |    0.09    0.09    0.08
a_f      |   -0.03   -0.14 |    0.65    1.91 |   -1.45   -3.14 |    1.41    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.

ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0331   0.0129   0.0590   8.0871   2.2896   2.8947
Update Cnt = 130    ET =    793.6   Stats:  Mean, Std, Min, Max
r_f      |  -28.30  -21.64   -7.08 |  288.01  275.10  315.27 | -840.57 -707.45 -807.30 |  758.46  671.59  818.64
v_f      |    0.03   -0.02    0.01 |    0.40    0.37    0.41 |   -1.20   -1.00   -0.93 |    1.01    1.30    1.20
r_i      |  -63.58   -5.77  -14.16 |  691.51  657.10  772.77 |-1306.17-1309.72-1359.23 | 1289.31 1325.39 1320.96
v_i      |    0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.09 |    0.09    0.09    0.09
norm_rf  |  208.78 |  131.73 |   16.85 |  656.86
norm_vf  |    0.65 |    0.21 |    0.21 |    1.51
gs_f     |    0.96 |    1.04 |    0.02 |    8.34
thrust   |    0.01    0.00    0.00 |    0.97    0.98    0.97 |   -3.44   -3.36   -3.42 |    3.25    3.41    3.43
norm_thrust |    1.55 |    0.66 |    0.00 |    3.46
fuel     |    4.44 |    0.77 |    2.48 |    6.06
rewards  | -168.29 |

ADV1:  -0.0015504790938774134 0.18851770598976056 2.436511335372925 -1.1265481726328552
ADV2:  -0.030309118847618968 0.6765473786377438 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2879   0.0977   0.5461   0.8245   0.3689   0.1642
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0618   0.0171   0.0986   8.0871   2.2896   2.8947
***** Episode 4357, Mean R = -157.7  Std R = 23.7  Min R = -208.5
PolicyLoss: 0.0316
Policy_Beta: 0.0667
Policy_Entropy: 0.00216
Policy_KL: 0.00103
Policy_SD: 0.952
Policy_lr_mult: 1
Steps: 9.03e+03
TotalSteps: 1.27e+06
VF_0_ExplainedVarNew: 0.845
VF_0_ExplainedVarOld: 0.776
VF_0_Loss : 0.0581


ADV1:  0.023083719172379745 0.1464930656414144 2.095327761967977 -1.0600901858011902
ADV2:  -0.02790063125193797 0.7536933442032155 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2867   0.0984   0.5491   0.8245   0.3689   0.1642
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0456   0.0230   0.0995   8.0871   2.2896   2.8947
Updat

ADV1:  0.004504504472231429 0.13694738938325351 2.298555669784546 -1.1403451283772807
ADV2:  -0.022479626978372993 0.7054068257799787 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2366   0.0410   0.3105   0.8245   0.3689   0.1642
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0294   0.0074   0.0443   8.0871   2.2896   2.8947
***** Episode 4636, Mean R = -159.7  Std R = 22.1  Min R = -204.6
PolicyLoss: 0.0176
Policy_Beta: 0.0667
Policy_Entropy: 0.00237
Policy_KL: 0.00108
Policy_SD: 0.953
Policy_lr_mult: 1
Steps: 9.1e+03
TotalSteps: 1.35e+06
VF_0_ExplainedVarNew: 0.909
VF_0_ExplainedVarOld: 0.885
VF_0_Loss : 0.0476


ADV1:  0.014526312822813714 0.1461999551795065 2.2289275805155437 -1.0982874949773174
ADV2:  -0.03971064683947333 0.6440277437532815 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2783   0.0683   0.4025   0.8245   0.3689   0.1642
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0297   0.0134   0.0574   8.0871   2.2896   2.8947
***** E

ADV1:  -0.0019409366561049623 0.11996899838761704 2.391545352935791 -0.975826229565893
ADV2:  -0.007918930284253629 0.712982436817027 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2702   0.0581   0.3838   0.8245   0.3689   0.1642
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0332   0.0146   0.0655   8.0871   2.2896   2.8947
***** Episode 4915, Mean R = -163.8  Std R = 17.3  Min R = -202.7
PolicyLoss: 0.00651
Policy_Beta: 0.0667
Policy_Entropy: 0.00265
Policy_KL: 0.00103
Policy_SD: 0.952
Policy_lr_mult: 1
Steps: 9.78e+03
TotalSteps: 1.44e+06
VF_0_ExplainedVarNew: 0.93
VF_0_ExplainedVarOld: 0.911
VF_0_Loss : 0.0373


ADV1:  0.007389716518665262 0.13468059114626005 0.9139230165441362 -1.362697465715888
ADV2:  -0.016792294993661822 0.8022524532524207 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2644   0.0668   0.4502   0.8245   0.3689   0.1642
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0636   0.0353   0.1954   8.0871   2.2896   2.8947
*****

ADV1:  0.02734928772244287 0.19182094912660522 2.3431791337331136 -1.17444542249044
ADV2:  -0.04898422655066735 0.6448750891429701 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2813   0.1316   0.7260   0.8959   0.4379   0.1642
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0542   0.0260   0.1116   8.0871   2.2896   2.8947
***** Episode 5194, Mean R = -158.1  Std R = 25.0  Min R = -208.7
PolicyLoss: 0.0357
Policy_Beta: 0.0667
Policy_Entropy: 0.00293
Policy_KL: 0.00092
Policy_SD: 0.949
Policy_lr_mult: 1
Steps: 9.79e+03
TotalSteps: 1.52e+06
VF_0_ExplainedVarNew: 0.81
VF_0_ExplainedVarOld: 0.745
VF_0_Loss : 0.0542


ADV1:  -0.03142306011121119 0.2413633863466798 1.7959652735738219 -4.746456212102104
ADV2:  0.03993911872195773 0.569080319465266 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.1947   0.0494   0.3041   0.8959   0.4379   0.1642
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0669   0.0270   0.1278   8.0871   2.2896   2.8947
***** Episode

ADV1:  -0.01591220884553589 0.19799337203545175 2.118851606977386 -4.682869952282472
ADV2:  0.013663323592273572 0.5458290253655105 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2357   0.0887   0.4585   0.8959   0.4379   0.1642
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0398   0.0159   0.0766   8.0871   2.2896   2.8947
***** Episode 5473, Mean R = -152.2  Std R = 24.0  Min R = -188.6
PolicyLoss: -0.0113
Policy_Beta: 0.0667
Policy_Entropy: 0.00315
Policy_KL: 0.00112
Policy_SD: 0.949
Policy_lr_mult: 1
Steps: 9.6e+03
TotalSteps: 1.61e+06
VF_0_ExplainedVarNew: 0.81
VF_0_ExplainedVarOld: 0.778
VF_0_Loss : 0.052


ADV1:  -0.010847786473318709 0.15542260446539316 1.6285514815648396 -1.7923902599016848
ADV2:  0.011284896235240245 0.696026322689619 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3112   0.0726   0.4682   0.8959   0.4379   0.1642
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0386   0.0138   0.0691   8.0871   2.2896   2.8947
***** Epi

ADV1:  -0.01859735758849801 0.16604580086940177 2.232144901487337 -1.2921266873677593
ADV2:  -0.00949815722595633 0.7166588019026089 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3925   0.1486   0.7744   0.8959   0.4441   0.1642
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0372   0.0171   0.0860   8.0871   2.2896   2.8947
***** Episode 5752, Mean R = -150.9  Std R = 19.0  Min R = -185.3
PolicyLoss: 0.0174
Policy_Beta: 0.0667
Policy_Entropy: 0.00342
Policy_KL: 0.00102
Policy_SD: 0.948
Policy_lr_mult: 1
Steps: 9.74e+03
TotalSteps: 1.7e+06
VF_0_ExplainedVarNew: 0.869
VF_0_ExplainedVarOld: 0.822
VF_0_Loss : 0.0389


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.016872904667983937 0.14058605438499566 2.06361865679423 -1.4330000591278096
ADV2:  -0.02260060782567879 0.6874091857118166 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2508   0.0984   0.5639   0.8959   0.4441   0.1642
ValFun  Gradients: u

ADV1:  0.02029547091867425 0.18445900937930074 2.7744577503204346 -1.4534480889638286
ADV2:  -0.03702972933068309 0.69681427964684 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3609   0.1286   0.6913   0.8959   0.4441   0.1642
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0604   0.0369   0.1967   8.0871   2.2896   2.8947
***** Episode 6031, Mean R = -153.3  Std R = 23.9  Min R = -196.0
PolicyLoss: 0.0244
Policy_Beta: 0.0667
Policy_Entropy: 0.004
Policy_KL: 0.00118
Policy_SD: 0.948
Policy_lr_mult: 1
Steps: 9.42e+03
TotalSteps: 1.79e+06
VF_0_ExplainedVarNew: 0.843
VF_0_ExplainedVarOld: 0.776
VF_0_Loss : 0.0493


ADV1:  -0.008008538201035883 0.13272663189840817 0.8587232812245686 -1.8581718903451359
ADV2:  0.030402731231169475 0.73977951882772 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3009   0.0805   0.5799   0.8959   0.4441   0.1642
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0209   0.0081   0.0384   8.0871   2.2896   2.8947
***** Episo

ADV1:  0.00690850011617035 0.17431312477729527 2.3403603712717693 -1.4853764788309753
ADV2:  -0.023043625271918555 0.682204960455608 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3148   0.0981   0.5384   1.3958   0.5840   0.2377
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0296   0.0085   0.0440   8.0871   2.2896   2.8947
***** Episode 6310, Mean R = -155.1  Std R = 19.5  Min R = -213.7
PolicyLoss: 0.0186
Policy_Beta: 0.0667
Policy_Entropy: 0.00415
Policy_KL: 0.00101
Policy_SD: 0.948
Policy_lr_mult: 1
Steps: 9.76e+03
TotalSteps: 1.87e+06
VF_0_ExplainedVarNew: 0.841
VF_0_ExplainedVarOld: 0.804
VF_0_Loss : 0.0374


ADV1:  0.0021688492780647327 0.17522649199339693 2.469646838506063 -1.2058660411834738
ADV2:  -0.018578440483756925 0.7075207644636925 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3854   0.1493   0.8446   1.3958   0.5840   0.2377
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0475   0.0155   0.0947   8.0871   2.2896   2.8947
*****

ADV1:  -0.007787937176079493 0.17131893014346875 2.2673040008544922 -1.4064623721440657
ADV2:  -0.004895291057616989 0.7055425415229013 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2910   0.0832   0.5324   1.3958   0.5840   0.2377
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0347   0.0138   0.0574   8.0871   2.2896   2.8947
***** Episode 6589, Mean R = -145.9  Std R = 19.3  Min R = -178.2
PolicyLoss: 0.00708
Policy_Beta: 0.0667
Policy_Entropy: 0.00425
Policy_KL: 0.00102
Policy_SD: 0.945
Policy_lr_mult: 1
Steps: 9.82e+03
TotalSteps: 1.96e+06
VF_0_ExplainedVarNew: 0.853
VF_0_ExplainedVarOld: 0.802
VF_0_Loss : 0.0394


ADV1:  -0.011408694291011323 0.16498664072588687 1.291156767209371 -1.717476303310273
ADV2:  0.018056053730858182 0.7262124217497329 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3637   0.1146   0.6270   1.3958   0.5840   0.2377
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0420   0.0119   0.0668   8.0871   2.2896   2.8947
***

seeker_angles |    0.01   -0.03 |    0.30    0.31 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0100 -0.0290 |  0.3018  0.3123 | -1.0000 -1.0000 |  0.9998  1.0000
optical_flow | -0.0004  0.0004 |  0.0127  0.0131 | -0.3930 -0.3824 |  0.5279  0.5768
v_err    | -0.0266 |  0.0954 | -0.6367 |  0.9803
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  119.42 |  116.43 |    4.02 |  980.74
tracking_rewards |  -90.01 |   19.51 | -154.16 |   -8.31
steps    |     319 |      50 |      11 |     397
***** Episode 6868, Mean R = -154.1  Std R = 23.6  Min R = -219.5
PolicyLoss: 0.0303
Policy_Beta: 0.0667
Policy_Entropy: 0.00477
Policy_KL: 0.000998
Policy_SD: 0.944
Policy_lr_mult: 1
Steps: 1.03e+04
TotalSteps: 2.05e+06
VF_0_ExplainedVarNew: 0.833
VF_0_ExplainedVarOld: 0.774
VF_0_Loss : 0.0334


ADV1:  -0.0021367249041719443 0.16012154899262382 2.124815820058187 -1.4899648503034881
ADV2:  0.000113147237303747 0.6880250138257019 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.07   -0.10 |    0.09    0.10    0.08
a_f      |    0.03   -0.05 |    0.64    1.80 |   -1.44   -3.10 |    1.48    3.12
w_f      |   -0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.03    0.10    0.03
w_rewards |   -0.87 |    0.47 |   -2.46 |   -0.02
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |  -45.16 |   14.78 |  -50.00 |    0.00
theta_cv |    0.63 |    0.34 |    0.00 |    3.11
seeker_angles |    0.02   -0.02 |    0.29    0.30 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0219 -0.0210 |  0.2895  0.3049 | -0.9999 -0.9999 |  0.9999  0.9996
optical_flow | -0.0001 -0.0000 |  0.0136  0.0134 | -0.9661 -0.4928 |  0.5900  0.2443
v_err    | -0.0254 |  0.0916 | -0.5669 |  0.5535
landing_rewards |    0.00 |    0.00 |    0.00 |    0.00
landing_margin |  105.54 |  106.74 |    0.03 |  888.92
tracking_rewards |  -88.47 |   17.10 | -163.19 |  -10.93
steps    |     326 |  

thrust   |   -0.00    0.01    0.00 |    1.00    1.01    1.00 |   -3.36   -3.46   -3.46 |    3.42    3.46    3.41
norm_thrust |    1.60 |    0.69 |    0.00 |    3.46
fuel     |    4.47 |    0.60 |    0.18 |    5.59
rewards  | -145.57 |   24.34 | -222.19 |  -62.81
fuel_rewards |  -12.78 |    1.73 |  -15.99 |   -0.53
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.28 |   14.74 |    0.01 |  392.52
norm_af  |    1.73 |    0.89 |    0.08 |    3.31
norm_wf  |    0.02 |    0.01 |    0.00 |    0.10
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.09    0.01    0.10 |    1.19    0.65    1.79 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.09   -0.10 |    0.09    0.09    0.05
a_f      |    0.05    0.04 |    0.66

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.6070   0.2453   1.5077   1.5077   0.6070   0.2453
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0542   0.0222   0.1196   8.0871   2.2896   2.8947
Update Cnt = 250    ET =    938.2   Stats:  Mean, Std, Min, Max
r_f      |   -1.43    4.49   18.35 |  235.20  206.99  254.18 |-1023.93 -654.25 -967.65 |  804.55  686.40 1161.56
v_f      |    0.01    0.00   -0.01 |    0.32    0.31    0.33 |   -1.01   -0.89   -0.98 |    0.85    0.80    0.93
r_i      |    7.13   -3.43   49.19 |  666.87  651.93  779.76 |-1381.75-1350.43-1243.70 | 1328.83 1321.90 1306.90
v_i      |   -0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.09    0.09
norm_rf  |  100.11 |  129.66 |    2.28 | 1011.14
norm_vf  |    0.50 |    0.23 |    0.08 |    1.19
gs_f     |    1.02 |    1.48 |    0.03 |   12.98
thrust   |    0.00    0.01   -0.01 |    1.00    1.00    1.00 |   -3.44   -3.45   -3.42 |    3.44    3.38    3.38
norm_thrust |    1

ADV1:  -0.004653639998291154 0.21691418267388143 1.8075541526919305 -4.7101458050059035
ADV2:  0.008719406431318539 0.6909591156241834 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4861   0.1568   0.8346   1.5077   0.6070   0.2453
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0228   0.0054   0.0305   8.0871   2.2896   2.8947
***** Episode 8077, Mean R = -145.5  Std R = 30.1  Min R = -211.4
PolicyLoss: -0.0117
Policy_Beta: 0.0667
Policy_Entropy: 0.00653
Policy_KL: 0.00122
Policy_SD: 0.94
Policy_lr_mult: 1
Steps: 9.79e+03
TotalSteps: 2.45e+06
VF_0_ExplainedVarNew: 0.751
VF_0_ExplainedVarOld: 0.716
VF_0_Loss : 0.0611


ADV1:  0.008741757735056307 0.18444254913369987 2.3558251825968424 -1.2945175488789897
ADV2:  -0.032169806244634544 0.6912369380310404 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.5461   0.1995   1.0272   1.5077   0.6070   0.2453
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0267   0.0132   0.0572   8.0871   2.2896   2.8947
Upd

ADV1:  0.008980055211488373 0.1758288018025295 1.8599444007873536 -1.6594324437777224
ADV2:  -0.026905302041586497 0.7338473182379236 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3841   0.0852   0.5445   1.5077   0.6070   0.2453
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0341   0.0141   0.0733   8.0871   2.2896   2.8947
***** Episode 8356, Mean R = -144.0  Std R = 23.6  Min R = -193.7
PolicyLoss: 0.0209
Policy_Beta: 0.0667
Policy_Entropy: 0.00714
Policy_KL: 0.00106
Policy_SD: 0.939
Policy_lr_mult: 1
Steps: 1.05e+04
TotalSteps: 2.54e+06
VF_0_ExplainedVarNew: 0.829
VF_0_ExplainedVarOld: 0.771
VF_0_Loss : 0.0394


ADV1:  0.00010830868240443062 0.20912171777449493 2.2875463644663494 -4.688781183938184
ADV2:  0.0034088056742216386 0.623841813470641 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.6221   0.2871   1.4949   1.5077   0.6221   0.2871
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0195   0.0059   0.0286   8.0871   2.2896   2.8947
****

ADV1:  0.009350083748732939 0.15862876496388623 1.998438237508138 -1.5401130930582703
ADV2:  -0.02438590882373114 0.7505747820577077 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2945   0.1070   0.6662   1.5077   0.6221   0.2871
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0238   0.0091   0.0456   8.0871   2.2896   2.8947
***** Episode 8635, Mean R = -148.9  Std R = 29.0  Min R = -216.6
PolicyLoss: 0.0177
Policy_Beta: 0.0667
Policy_Entropy: 0.00735
Policy_KL: 0.000893
Policy_SD: 0.938
Policy_lr_mult: 1
Steps: 1.05e+04
TotalSteps: 2.64e+06
VF_0_ExplainedVarNew: 0.868
VF_0_ExplainedVarOld: 0.825
VF_0_Loss : 0.037


ADV1:  0.019931975570610033 0.1894922922166408 2.2889287153879803 -1.0285926676435273
ADV2:  -0.04550287619277376 0.6748275341033614 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.6090   0.2382   1.1805   1.5077   0.6221   0.2871
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0301   0.0123   0.0625   8.0871   2.2896   2.8947
***** E

ADV1:  -0.011439888595957272 0.21912873853911766 1.9742423137429261 -4.616244111262488
ADV2:  0.019680676182445647 0.6764893442334243 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3742   0.0879   0.6032   1.5077   0.6844   0.2871
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0332   0.0115   0.0571   8.0871   2.2896   2.8947
***** Episode 8914, Mean R = -143.4  Std R = 25.7  Min R = -176.1
PolicyLoss: -0.0199
Policy_Beta: 0.0667
Policy_Entropy: 0.00775
Policy_KL: 0.00117
Policy_SD: 0.938
Policy_lr_mult: 1
Steps: 1.03e+04
TotalSteps: 2.73e+06
VF_0_ExplainedVarNew: 0.738
VF_0_ExplainedVarOld: 0.682
VF_0_Loss : 0.0588


ADV1:  -0.011964048032557097 0.1818572864956595 1.531437603632609 -1.5708084365389148
ADV2:  -0.003415796253270483 0.7822965033873218 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4477   0.1248   0.7001   1.5077   0.6844   0.2871
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0325   0.0122   0.0654   8.0871   2.2896   2.8947
****

ADV1:  -0.016547606888692577 0.17600713431872017 2.006010532767977 -2.0617271030953255
ADV2:  0.006212268114763469 0.7178057740223606 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4733   0.1487   0.7329   1.5077   0.6844   0.2871
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0279   0.0117   0.0572   8.0871   2.2896   2.8947
***** Episode 9193, Mean R = -131.6  Std R = 27.7  Min R = -186.5
PolicyLoss: -0.00225
Policy_Beta: 0.0667
Policy_Entropy: 0.0074
Policy_KL: 0.00102
Policy_SD: 0.934
Policy_lr_mult: 1
Steps: 1.08e+04
TotalSteps: 2.82e+06
VF_0_ExplainedVarNew: 0.809
VF_0_ExplainedVarOld: 0.759
VF_0_Loss : 0.0444


ADV1:  0.00949987133138642 0.1826617812175901 1.8621690725865154 -1.2457716782887798
ADV2:  -0.006426231545936568 0.7601041396867669 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.5336   0.1775   1.0432   1.5077   0.6844   0.2871
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0288   0.0108   0.0559   8.0871   2.2896   2.8947
*****

ADV1:  -0.01591876512091349 0.21655743552290277 1.3194054185969175 -4.667282476731758
ADV2:  0.03406935343796725 0.6705389887797949 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.3718   0.1126   0.6331   1.5077   0.6844   0.2871
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0305   0.0125   0.0534   8.0871   2.2896   2.8947
***** Episode 9472, Mean R = -136.0  Std R = 28.7  Min R = -177.4
PolicyLoss: -0.0335
Policy_Beta: 0.0667
Policy_Entropy: 0.00836
Policy_KL: 0.000949
Policy_SD: 0.933
Policy_lr_mult: 1
Steps: 1.01e+04
TotalSteps: 2.92e+06
VF_0_ExplainedVarNew: 0.741
VF_0_ExplainedVarOld: 0.683
VF_0_Loss : 0.0652


ADV1:  0.02923753498618301 0.1930408645837975 2.081886432437453 -1.4001171174286422
ADV2:  -0.04232863195813339 0.7071853382737378 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4144   0.1222   0.6895   1.5077   0.6844   0.2871
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0524   0.0224   0.1066   8.0871   2.2896   2.8947
***** Ep

ADV1:  -0.0018853108744539783 0.14628310497336378 1.2575943379427328 -1.2584027017093504
ADV2:  0.018590151938817346 0.7531874979254862 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4468   0.2018   1.1065   1.5825   0.6844   0.2871
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0138   0.0046   0.0245   8.0871   2.2896   2.8947
***** Episode 9751, Mean R = -119.0  Std R = 39.4  Min R = -183.7
PolicyLoss: -0.0221
Policy_Beta: 0.0667
Policy_Entropy: 0.00817
Policy_KL: 0.000997
Policy_SD: 0.928
Policy_lr_mult: 1
Steps: 1.11e+04
TotalSteps: 3.02e+06
VF_0_ExplainedVarNew: 0.806
VF_0_ExplainedVarOld: 0.755
VF_0_Loss : 0.0385


ADV1:  0.0017470935580658174 0.189710106557409 2.3697392622629803 -2.0902906936383756
ADV2:  -0.00848425559220954 0.710492926217465 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.5700   0.2239   1.2981   1.5825   0.6844   0.2871
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0179   0.0050   0.0286   8.0871   2.2896   2.8947
***

ADV1:  -0.008197635833335614 0.19840741355805375 2.0017922496795655 -1.6117262405056674
ADV2:  -0.0008793192482411226 0.7446415291037576 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4917   0.1435   0.8016   1.5825   0.6844   0.3107
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0271   0.0100   0.0503   8.0871   2.2896   2.8947
***** Episode 10030, Mean R = -113.9  Std R = 34.4  Min R = -190.6
PolicyLoss: 0.000579
Policy_Beta: 0.0667
Policy_Entropy: 0.00885
Policy_KL: 0.000961
Policy_SD: 0.924
Policy_lr_mult: 1
Steps: 1.09e+04
TotalSteps: 3.11e+06
VF_0_ExplainedVarNew: 0.625
VF_0_ExplainedVarOld: 0.559
VF_0_Loss : 0.0545


ADV1:  0.0025495227196455105 0.19852152494624487 2.22577228864034 -2.0781643262749903
ADV2:  0.005212652319940576 0.7058378938709033 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.6045   0.3220   1.7231   1.7231   0.6844   0.3220
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0163   0.0057   0.0281   8.0871   2.2896   2.8947

ADV1:  -0.00808701741757568 0.1844002899067315 2.136585861774253 -2.1226289888223033
ADV2:  0.03328374076390511 0.7204252751223482 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4867   0.1366   0.9545   1.7231   0.6844   0.3220
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0217   0.0071   0.0390   8.0871   2.2896   2.8947
***** Episode 10309, Mean R = -127.0  Std R = 40.7  Min R = -188.2
PolicyLoss: -0.0358
Policy_Beta: 0.0667
Policy_Entropy: 0.0101
Policy_KL: 0.00114
Policy_SD: 0.923
Policy_lr_mult: 1
Steps: 1.06e+04
TotalSteps: 3.21e+06
VF_0_ExplainedVarNew: 0.792
VF_0_ExplainedVarOld: 0.717
VF_0_Loss : 0.05


ADV1:  -0.023248495100410705 0.1724814953019232 1.6045387967427571 -2.020071270465853
ADV2:  0.052202230057429626 0.6967508087919789 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.5502   0.1534   0.8619   1.7231   0.6844   0.3220
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0442   0.0187   0.0789   8.0871   2.2896   2.8947
***** Epis

cs_angles |  0.0017 -0.0200 |  0.2748  0.2605 | -0.9992 -0.9996 |  1.0000  0.9988
optical_flow | -0.0001  0.0001 |  0.0225  0.0219 | -0.9666 -1.2475 |  1.6575  1.1270
v_err    | -0.0153 |  0.0752 | -0.4974 |  0.5028
landing_rewards |    0.35 |    1.85 |    0.00 |   10.00
landing_margin |   31.24 |   74.90 |   -0.03 |  960.58
tracking_rewards |  -79.19 |   19.25 | -133.86 |   -7.37
steps    |     353 |      37 |      11 |     408
***** Episode 10588, Mean R = -106.4  Std R = 34.4  Min R = -191.1
PolicyLoss: -0.00322
Policy_Beta: 0.0667
Policy_Entropy: 0.0102
Policy_KL: 0.00104
Policy_SD: 0.917
Policy_lr_mult: 1
Steps: 1.12e+04
TotalSteps: 3.31e+06
VF_0_ExplainedVarNew: 0.623
VF_0_ExplainedVarOld: 0.561
VF_0_Loss : 0.0521


ADV1:  -0.003907661923291563 0.1556827873021255 1.2413842199032357 -2.2309297943115256
ADV2:  0.025218917893971602 0.6644148639092204 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4885   0.1780   1.0409   1.7318   0.8275   0.4418
ValFun  Gradients: u/s

attitude |    0.11   -0.08   -0.01 |    1.17    0.61    1.84 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.07   -0.10 |    0.09    0.09    0.05
a_f      |   -0.08    0.04 |    0.62    1.79 |   -1.39   -3.14 |    1.38    3.12
w_f      |   -0.01    0.00   -0.00 |    0.01    0.02    0.02 |   -0.04   -0.06   -0.10 |    0.02    0.06    0.04
w_rewards |   -1.07 |    0.51 |   -2.64 |   -0.09
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |  -23.39 |   24.95 |  -50.00 |    0.00
theta_cv |    0.56 |    0.31 |    0.00 |    3.04
seeker_angles |    0.02   -0.02 |    0.26    0.25 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0178 -0.0247 |  0.2627  0.2493 | -0.9999 -0.9992 |  0.9993  0.9987
optical_flow | -0.0002  0.0004 |  0.0220  0.0228 | -1.0502 -0.7570 |  0.8957  1.3065
v_err    | -0.0137 |  0.0751 | -0.5024 |  0.6914
landing_rewards |    0.35 |    1.85 |    0.00 |   10.00
landing_margin |   22

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.07   -0.10 |    0.09    0.09    0.05
a_f      |    0.05    0.04 |    0.62    1.84 |   -1.42   -3.13 |    1.47    3.13
w_f      |   -0.01    0.01   -0.00 |    0.01    0.02    0.02 |   -0.10   -0.07   -0.10 |    0.04    0.08    0.05
w_rewards |   -1.03 |    0.56 |   -5.09 |   -0.04
w_penalty |   -0.65 |    8.01 | -100.00 |    0.00
fov_penalty |  -21.29 |   24.72 |  -50.00 |    0.00
theta_cv |    0.56 |    0.31 |    0.00 |    3.06
seeker_angles |    0.02   -0.02 |    0.26    0.25 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0193 -0.0214 |  0.2570  0.2540 | -0.9998 -0.9999 |  0.9990  0.9997
optical_flow | -0.0000  0.0001 |  0.0222  0.0242 | -0.8412 -0.8036 |  0.8673  1.1768
v_err    | -0.0141 |  0.0750 | -0.5037 |  0.8817
landing_rewards |    0.32 |    1.77 |    0.00 |   10.00
landing_margin |   20.10 |   59.98 |   -0.06 |  924.69
tracking_rewards |  -77.81 |   18.50 | -150.33 |   -7.02
steps    |     360 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.09   -0.10 |    0.08    0.09    0.05
a_f      |    0.02    0.06 |    0.68    1.84 |   -1.49   -3.11 |    1.42    3.12
w_f      |   -0.01    0.01   -0.00 |    0.01    0.02    0.02 |   -0.04   -0.05   -0.04 |    0.04    0.09    0.05
w_rewards |   -0.97 |    0.51 |   -3.03 |   -0.06
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -20.00 |   24.49 |  -50.00 |    0.00
theta_cv |    0.56 |    0.31 |    0.00 |    3.02
seeker_angles |    0.02   -0.02 |    0.25    0.26 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0187 -0.0170 |  0.2519  0.2612 | -0.9991 -0.9999 |  0.9987  0.9994
optical_flow | -0.0003  0.0004 |  0.0229  0.0250 | -1.2002 -1.1560 |  0.8254  1.0439
v_err    | -0.0147 |  0.0741 | -0.6724 |  0.4962
landing_rewards |    0.55 |    2.28 |    0.00 |   10.00
landing_margin |   17.92 |   52.94 |   -0.09 |  427.60
tracking_rewards |  -77.42 |   20.96 | -148.54 |  -37.74
steps    |     360 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.06   -0.09 |    0.09    0.09    0.07
a_f      |   -0.09   -0.07 |    0.67    1.78 |   -1.44   -3.14 |    1.48    3.12
w_f      |   -0.01    0.01   -0.00 |    0.01    0.02    0.02 |   -0.04   -0.05   -0.04 |    0.03    0.06    0.05
w_rewards |   -0.97 |    0.50 |   -2.39 |   -0.01
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |  -14.84 |   22.84 |  -50.00 |    0.00
theta_cv |    0.52 |    0.30 |    0.00 |    3.11
seeker_angles |    0.02   -0.02 |    0.23    0.23 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0162 -0.0164 |  0.2303  0.2286 | -0.9995 -0.9993 |  0.9998  0.9996
optical_flow | -0.0002  0.0004 |  0.0228  0.0239 | -0.7580 -0.8727 |  0.7453  0.9829
v_err    | -0.0128 |  0.0733 | -0.6889 |  0.4886
landing_rewards |    0.81 |    2.72 |    0.00 |   10.00
landing_margin |   11.11 |   40.61 |   -0.06 |  517.68
tracking_rewards |  -72.22 |   18.98 | -130.76 |  -36.72
steps    |     365 |  

attitude |    0.02   -0.00   -0.19 |    1.18    0.63    1.88 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.07   -0.09 |    0.10    0.10    0.05
a_f      |    0.01   -0.04 |    0.63    1.88 |   -1.42   -3.12 |    1.42    3.14
w_f      |   -0.01    0.01   -0.00 |    0.01    0.02    0.02 |   -0.10   -0.07   -0.04 |    0.03    0.07    0.04
w_rewards |   -0.95 |    0.57 |   -6.12 |   -0.04
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |  -14.03 |   22.47 |  -50.00 |    0.00
theta_cv |    0.53 |    0.30 |    0.00 |    2.97
seeker_angles |    0.02   -0.02 |    0.23    0.23 |   -1.00   -1.00 |    0.99    1.00
cs_angles |  0.0167 -0.0229 |  0.2288  0.2300 | -0.9987 -0.9989 |  0.9945  0.9993
optical_flow | -0.0001  0.0003 |  0.0229  0.0246 | -1.2180 -1.0728 |  0.9505  0.9934
v_err    | -0.0116 |  0.0718 | -0.5054 |  0.7644
landing_rewards |    1.03 |    3.04 |    0.00 |   10.00
landing_margin |    8

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.08   -0.09 |    0.10    0.10    0.05
a_f      |   -0.00    0.02 |    0.67    1.82 |   -1.50   -3.14 |    1.51    3.14
w_f      |   -0.01    0.01   -0.00 |    0.01    0.02    0.01 |   -0.04   -0.06   -0.04 |    0.03    0.06    0.04
w_rewards |   -0.88 |    0.46 |   -2.17 |   -0.05
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -9.68 |   19.75 |  -50.00 |    0.00
theta_cv |    0.52 |    0.30 |    0.00 |    2.76
seeker_angles |    0.01   -0.03 |    0.21    0.22 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0107 -0.0266 |  0.2142  0.2181 | -0.9998 -0.9992 |  0.9999  0.9983
optical_flow |  0.0000  0.0005 |  0.0228  0.0257 | -0.9526 -1.4650 |  0.8843  1.2429
v_err    | -0.0108 |  0.0699 | -0.5007 |  0.7312
landing_rewards |    1.55 |    3.62 |    0.00 |   10.00
landing_margin |    8.83 |   39.60 |   -0.06 |  412.78
tracking_rewards |  -68.42 |   18.37 | -120.56 |  -33.99
steps    |     364 |  

attitude |   -0.08    0.04   -0.01 |    1.27    0.64    1.91 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.06   -0.10 |    0.09    0.10    0.05
a_f      |    0.02    0.14 |    0.68    1.92 |   -1.46   -3.12 |    1.48    3.13
w_f      |   -0.01    0.01   -0.00 |    0.01    0.02    0.01 |   -0.05   -0.06   -0.05 |    0.03    0.07    0.04
w_rewards |   -0.79 |    0.47 |   -2.28 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -7.90 |   18.24 |  -50.00 |    0.00
theta_cv |    0.50 |    0.29 |    0.00 |    2.82
seeker_angles |   -0.00   -0.01 |    0.21    0.19 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0012 -0.0087 |  0.2074  0.1942 | -0.9968 -0.9982 |  0.9977  0.9951
optical_flow |  0.0001  0.0005 |  0.0223  0.0247 | -1.0919 -1.0604 |  1.0349  0.6566
v_err    | -0.0100 |  0.0702 | -0.5297 |  0.4813
landing_rewards |    1.55 |    3.62 |    0.00 |   10.00
landing_margin |    5

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.10 |    0.09    0.09    0.05
a_f      |    0.05    0.09 |    0.66    1.87 |   -1.44   -3.11 |    1.49    3.13
w_f      |   -0.01    0.01    0.00 |    0.01    0.02    0.01 |   -0.04   -0.05   -0.04 |    0.03    0.07    0.04
w_rewards |   -0.87 |    0.43 |   -2.35 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -5.81 |   16.02 |  -50.00 |    0.00
theta_cv |    0.49 |    0.29 |    0.00 |    3.00
seeker_angles |    0.00   -0.02 |    0.19    0.19 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0014 -0.0203 |  0.1919  0.1891 | -0.9998 -0.9996 |  0.9985  0.9985
optical_flow |  0.0001  0.0004 |  0.0214  0.0246 | -1.2218 -1.0762 |  0.9983  0.8962
v_err    | -0.0093 |  0.0687 | -0.5017 |  0.2841
landing_rewards |    1.84 |    3.87 |    0.00 |   10.00
landing_margin |    2.28 |    6.95 |   -0.09 |   60.94
tracking_rewards |  -62.69 |   17.91 | -152.39 |  -30.33
steps    |     369 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.07   -0.09 |    0.08    0.09    0.05
a_f      |    0.02   -0.19 |    0.65    1.85 |   -1.44   -3.13 |    1.40    3.14
w_f      |   -0.00    0.01   -0.00 |    0.01    0.03    0.01 |   -0.04   -0.07   -0.03 |    0.03    0.07    0.04
w_rewards |   -0.84 |    0.46 |   -2.42 |   -0.03
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -3.55 |   12.84 |  -50.00 |    0.00
theta_cv |    0.48 |    0.29 |    0.00 |    2.99
seeker_angles |    0.01   -0.02 |    0.17    0.18 |   -0.99   -1.00 |    0.99    1.00
cs_angles |  0.0080 -0.0179 |  0.1742  0.1827 | -0.9934 -0.9994 |  0.9871  0.9983
optical_flow | -0.0000  0.0004 |  0.0209  0.0257 | -0.8763 -1.0260 |  0.8656  1.1685
v_err    | -0.0090 |  0.0682 | -0.5049 |  0.4318
landing_rewards |    2.74 |    4.46 |    0.00 |   10.00
landing_margin |    1.30 |    4.76 |   -0.06 |   36.53
tracking_rewards |  -60.19 |   16.52 | -119.65 |  -30.78
steps    |     370 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.06   -0.09 |    0.08    0.09    0.05
a_f      |    0.03   -0.06 |    0.64    1.84 |   -1.29   -3.10 |    1.44    3.12
w_f      |   -0.01    0.01   -0.00 |    0.01    0.03    0.01 |   -0.04   -0.05   -0.03 |    0.04    0.06    0.04
w_rewards |   -0.81 |    0.43 |   -2.31 |   -0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -1.61 |    8.83 |  -50.00 |    0.00
theta_cv |    0.46 |    0.28 |    0.00 |    2.70
seeker_angles |    0.01   -0.03 |    0.16    0.16 |   -1.00   -0.99 |    0.99    1.00
cs_angles |  0.0070 -0.0290 |  0.1611  0.1610 | -0.9955 -0.9876 |  0.9939  0.9956
optical_flow |  0.0001  0.0004 |  0.0224  0.0251 | -0.9162 -0.8261 |  1.1664  1.2866
v_err    | -0.0089 |  0.0673 | -0.4997 |  0.3097
landing_rewards |    3.00 |    4.58 |    0.00 |   10.00
landing_margin |    0.56 |    2.72 |   -0.07 |   22.90
tracking_rewards |  -55.83 |   14.85 | -130.44 |  -31.53
steps    |     371 |  

norm_wf  |    0.03 |    0.01 |    0.01 |    0.07
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.02   -0.00    0.04 |    1.14    0.60    1.82 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.06   -0.09 |    0.08    0.09    0.05
a_f      |   -0.01    0.00 |    0.65    1.85 |   -1.40   -3.14 |    1.43    3.12
w_f      |   -0.00    0.01    0.00 |    0.01    0.02    0.01 |   -0.03   -0.06   -0.04 |    0.03    0.06    0.05
w_rewards |   -0.82 |    0.41 |   -1.82 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.81 |    6.30 |  -50.00 |    0.00
theta_cv |    0.43 |    0.27 |    0.00 |    2.68
seeker_angles |    0.00   -0.03 |    0.14    0.15 |   -1.00   -1.00 |    1.00    0.99
cs_angles |  0.0008 -0.0256 |  0.1439  0.1462 | -0.9989 -0.9999 |  0.9967  0.9950
optical

norm_thrust |    1.35 |    0.69 |    0.00 |    3.46
fuel     |    3.12 |    0.27 |    2.60 |    4.07
rewards  |  -56.57 |   15.53 | -133.93 |  -26.23
fuel_rewards |   -8.93 |    0.77 |  -11.65 |   -7.44
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.93 |   13.53 |    0.01 | 1053.12
norm_af  |    1.80 |    0.90 |    0.03 |    3.26
norm_wf  |    0.03 |    0.01 |    0.00 |    0.06
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.05   -0.02    0.02 |    1.28    0.66    1.91 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.09 |    0.08    0.09    0.05
a_f      |   -0.01    0.09 |    0.66    1.89 |   -1.45   -3.13 |    1.51    3.14
w_f      |   -0.00    0.01    0.00 |    0.01    0.02    0.01 |   -0.

ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0003   0.0015   8.0871   2.2896   2.8947
Update Cnt = 470    ET =    925.8   Stats:  Mean, Std, Min, Max
r_f      |   -7.98  -11.95    7.01 |  180.85  175.26  198.06 | -377.68 -391.34 -378.50 |  395.89  390.42  392.70
v_f      |    0.00   -0.00   -0.00 |    0.07    0.07    0.08 |   -0.16   -0.22   -0.25 |    0.22    0.22    0.22
r_i      |  -30.80  -58.29   34.33 |  658.12  670.79  771.03 |-1353.92-1302.62-1304.00 | 1317.45 1302.71 1329.14
v_i      |    0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.10    0.09    0.09
norm_rf  |    0.77 |    1.08 |    0.05 |   18.28
norm_vf  |    0.12 |    0.05 |    0.03 |    0.32
gs_f     |    1.35 |    2.11 |    0.02 |   23.70
thrust   |   -0.01    0.00   -0.00 |    0.85    0.86    0.86 |   -3.43   -3.44   -3.46 |    3.44    3.46    3.45
norm_thrust |    1.32 |    0.68 |    0.00 |    3.46
fuel     |    2.97 |    0.24 |    2.43 |    3.73
rewards  |  -52.81 |

ADV1:  -0.0035129667568752844 0.020567197225656968 0.19828445745090909 -0.20186645414538446
ADV2:  0.022065645704440133 0.8793488191903778 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5359   0.9896   3.6616   7.5254   3.8919   2.3289
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0036   0.0022   0.0090   8.0871   2.2896   2.8947
***** Episode 14897, Mean R = -51.1  Std R = 11.6  Min R = -79.5
PolicyLoss: -0.0115
Policy_Beta: 0.0667
Policy_Entropy: 0.0335
Policy_KL: 0.00085
Policy_SD: 0.774
Policy_lr_mult: 1
Steps: 1.17e+04
TotalSteps: 4.89e+06
VF_0_ExplainedVarNew: 0.915
VF_0_ExplainedVarOld: 0.91
VF_0_Loss : 0.0599


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.00047053398479598004 0.021059186839660148 0.10486015404264137 -0.22255985448331525
ADV2:  0.017536709111308633 0.8817331654888276 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.6798   2.1542   7.3375   7.5254   3.8919   2.3289
ValFun 

ADV1:  0.0013820414337589514 0.01913032021683205 0.11585884450886964 -0.12843394802830005
ADV2:  -0.00432558153386968 0.931427405646053 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.2998   1.4148   5.7177   7.5254   4.2031   2.3289
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0008   0.0038   8.0871   2.2896   2.8947
***** Episode 15176, Mean R = -44.8  Std R = 12.3  Min R = -68.3
PolicyLoss: -0.00467
Policy_Beta: 0.0667
Policy_Entropy: 0.0372
Policy_KL: 0.000979
Policy_SD: 0.748
Policy_lr_mult: 1
Steps: 1.15e+04
TotalSteps: 4.99e+06
VF_0_ExplainedVarNew: 0.929
VF_0_ExplainedVarOld: 0.925
VF_0_Loss : 0.052


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.001614483337876471 0.021041023221562507 0.1234047963841745 -0.16808924144075024
ADV2:  0.0146023867346662 0.9096217320891615 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9538   0.4865   2.1587   7.5254   4.2031   2.3289
ValFun  Gradi

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.0008837485899867747 0.018438969187083494 0.1995761309310346 -0.10691497375324882
ADV2:  -0.0030924529428900736 0.922350425285608 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7665   0.7193   3.3018   8.0334   4.2031   2.3289
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0006   0.0026   8.0871   2.2896   2.8947
***** Episode 15455, Mean R = -43.4  Std R = 9.3  Min R = -69.4
PolicyLoss: -0.00486
Policy_Beta: 0.0667
Policy_Entropy: 0.0428
Policy_KL: 0.000734
Policy_SD: 0.729
Policy_lr_mult: 1
Steps: 1.17e+04
TotalSteps: 5.1e+06
VF_0_ExplainedVarNew: 0.921
VF_0_ExplainedVarOld: 0.919
VF_0_Loss : 0.0563


ADV1:  0.000852328015535431 0.019100889660429513 0.11958911677186293 -0.1578189184143405
ADV2:  0.0044764067433131745 0.9108153837283436 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8305   0.4536   1.8833   8.0334   4.2031   2.3289
ValFun  Gr

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.0014391637054316912 0.017953470106862525 0.09957569448600831 -0.13443196791298032
ADV2:  -0.002320027793851036 0.9190898083834104 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8990   0.4591   2.5554   8.5228   4.2031   2.4330
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0010   0.0037   8.0871   2.2896   2.8947
***** Episode 15734, Mean R = -41.5  Std R = 10.0  Min R = -70.1
PolicyLoss: -0.00888
Policy_Beta: 0.0667
Policy_Entropy: 0.0478
Policy_KL: 0.000894
Policy_SD: 0.702
Policy_lr_mult: 1
Steps: 1.15e+04
TotalSteps: 5.2e+06
VF_0_ExplainedVarNew: 0.927
VF_0_ExplainedVarOld: 0.925
VF_0_Loss : 0.0511


ADV1:  -0.001211872345715913 0.016314930872807352 0.10145972444170709 -0.07687935969978854
ADV2:  0.0028358591072876445 0.9402073311343966 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7818   1.9107   6.3300   8.5228   4.2031   2.4330
ValFun

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0010868830136743805 0.020581446269025763 0.10689423998196923 -0.2635847831227055
ADV2:  0.020222261167453282 0.8463851174784534 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9506   0.4342   2.2024   8.6638   4.2185   2.4330
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0009   0.0034   8.0871   2.2896   2.8947
***** Episode 16013, Mean R = -44.4  Std R = 13.2  Min R = -70.0
PolicyLoss: -0.0213
Policy_Beta: 0.0667
Policy_Entropy: 0.0513
Policy_KL: 0.000783
Policy_SD: 0.707
Policy_lr_mult: 1
Steps: 1.16e+04
TotalSteps: 5.31e+06
VF_0_ExplainedVarNew: 0.93
VF_0_ExplainedVarOld: 0.923
VF_0_Loss : 0.0392


ADV1:  -0.0005921245311908755 0.01886488408545266 0.1141106231976815 -0.09722058256176583
ADV2:  -0.004631515881885858 0.9221306219238665 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8628   0.3254   1.9146   8.6638   4.2185   2.4330
ValFun  G

***** Episode 16261, Mean R = -40.6  Std R = 9.9  Min R = -61.1
PolicyLoss: -0.00989
Policy_Beta: 0.0667
Policy_Entropy: 0.055
Policy_KL: 0.000926
Policy_SD: 0.694
Policy_lr_mult: 1
Steps: 1.16e+04
TotalSteps: 5.4e+06
VF_0_ExplainedVarNew: 0.931
VF_0_ExplainedVarOld: 0.928
VF_0_Loss : 0.0491


ADV1:  -0.00295624393398102 0.0179675984034708 0.1022751456819189 -0.10233072216741199
ADV2:  0.013774040451444251 0.9319917610109986 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.0639   1.9472   5.6425   8.6638   4.2185   2.4330
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0031   0.0017   0.0073   8.0871   2.2896   2.8947
***** Episode 16292, Mean R = -41.6  Std R = 8.7  Min R = -55.4
PolicyLoss: -0.00512
Policy_Beta: 0.0667
Policy_Entropy: 0.0559
Policy_KL: 0.00144
Policy_SD: 0.687
Policy_lr_mult: 1
Steps: 1.15e+04
TotalSteps: 5.41e+06
VF_0_ExplainedVarNew: 0.929
VF_0_ExplainedVarOld: 0.927
VF_0_Loss : 0.0401


ADV1:  -0.0008253530660250923 0.018956307621918408 0.1308602

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.7756   0.2819   1.4989  10.3262   4.3819   3.1804
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0096   0.0051   0.0216   8.0871   2.2896   2.8947
***** Episode 16540, Mean R = -45.1  Std R = 15.8  Min R = -80.7
PolicyLoss: -0.00374
Policy_Beta: 0.0667
Policy_Entropy: 0.06
Policy_KL: 0.000725
Policy_SD: 0.701
Policy_lr_mult: 1
Steps: 1.16e+04
TotalSteps: 5.5e+06
VF_0_ExplainedVarNew: 0.952
VF_0_ExplainedVarOld: 0.949
VF_0_Loss : 0.0435


ADV1:  0.003121794292655993 0.018211372746943955 0.10398371247301928 -0.10938381133492953
ADV2:  -0.01327469929486539 0.9407195517390176 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.8891   1.8197   7.5568  10.3262   4.3819   3.1804
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0041   0.0023   0.0087   8.0871   2.2896   2.8947
***** Episode 16571, Mean R = -39.3  Std R = 9.9  Min R = -59.7
PolicyLoss: -0.00512
Policy_Beta: 0.0667
Policy_Entropy: 0.0594
Policy_KL: 0.000676

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0023124663384644847 0.019125499408765106 0.1086050529175982 -0.08866450583499116
ADV2:  0.000664143280918025 0.917201378484783 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   9.0796   3.0692  13.8133  13.8133   9.0796   5.6032
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0014   0.0062   8.0871   2.2896   2.8947
***** Episode 16819, Mean R = -41.9  Std R = 15.6  Min R = -106.8
PolicyLoss: 0.00976
Policy_Beta: 0.0296
Policy_Entropy: 0.0636
Policy_KL: 0.00051
Policy_SD: 0.68
Policy_lr_mult: 1
Steps: 1.16e+04
TotalSteps: 5.61e+06
VF_0_ExplainedVarNew: 0.944
VF_0_ExplainedVarOld: 0.936
VF_0_Loss : 0.0381


ADV1:  0.0016138602008192715 0.018763949520386854 0.09054388016884729 -0.16744976135373102
ADV2:  -0.00025129798146820585 0.919081398326143 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   8.3846   2.6345  13.0473  13.8133   9.0796   5.6032
ValFun  

cs_angles | -0.0075 -0.0015 |  0.1122  0.1118 | -0.9959 -0.9984 |  0.9947  0.9987
optical_flow |  0.0001  0.0002 |  0.0264  0.0277 | -1.2794 -1.0989 |  1.1075  1.6007
v_err    | -0.0076 |  0.0608 | -0.4999 |  0.1926
landing_rewards |    5.13 |    5.00 |    0.00 |   10.00
landing_margin |    0.00 |    0.04 |   -0.08 |    0.12
tracking_rewards |  -37.23 |    9.10 |  -95.78 |  -23.33
steps    |     374 |      19 |     323 |     416
***** Episode 17098, Mean R = -35.0  Std R = 7.9  Min R = -61.8
PolicyLoss: -0.00505
Policy_Beta: 0.0667
Policy_Entropy: 0.067
Policy_KL: 0.000596
Policy_SD: 0.649
Policy_lr_mult: 1
Steps: 1.15e+04
TotalSteps: 5.71e+06
VF_0_ExplainedVarNew: 0.948
VF_0_ExplainedVarOld: 0.944
VF_0_Loss : 0.041


ADV1:  -0.00017675283409622556 0.01666021272884633 0.12465335617046203 -0.14546285181990337
ADV2:  0.0026495569053101493 0.9334848720016508 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5527   0.8051   4.4290  13.8133   9.3261   5.6032
ValFun  Gradients: u

attitude |    0.07    0.02    0.08 |    1.26    0.64    1.86 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.09 |    0.08    0.09    0.05
a_f      |    0.00    0.19 |    0.65    1.82 |   -1.47   -3.11 |    1.52    3.14
w_f      |   -0.01    0.00    0.00 |    0.01    0.02    0.01 |   -0.04   -0.05   -0.04 |    0.03    0.05    0.03
w_rewards |   -0.68 |    0.38 |   -1.75 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.37 |    0.30 |    0.00 |    3.01
seeker_angles |   -0.01    0.00 |    0.11    0.11 |   -1.00   -1.00 |    0.99    0.98
cs_angles | -0.0082  0.0038 |  0.1056  0.1110 | -0.9966 -0.9999 |  0.9859  0.9842
optical_flow |  0.0002  0.0001 |  0.0252  0.0258 | -1.0355 -0.9963 |  0.8877  1.0734
v_err    | -0.0070 |  0.0604 | -0.4820 |  0.1990
landing_rewards |    5.10 |    5.00 |    0.00 |   10.00
landing_margin |    0

attitude |    0.06   -0.04   -0.11 |    1.26    0.64    1.89 |   -3.14   -1.56   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.09 |    0.08    0.08    0.05
a_f      |   -0.06   -0.00 |    0.67    1.90 |   -1.50   -3.12 |    1.41    3.06
w_f      |   -0.01    0.00    0.00 |    0.01    0.02    0.01 |   -0.04   -0.05   -0.04 |    0.03    0.06    0.03
w_rewards |   -0.68 |    0.39 |   -2.01 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.38 |    0.30 |    0.00 |    3.07
seeker_angles |   -0.01    0.01 |    0.11    0.11 |   -1.00   -1.00 |    1.00    1.00
cs_angles | -0.0064  0.0131 |  0.1060  0.1148 | -0.9999 -0.9996 |  0.9965  0.9980
optical_flow |  0.0002 -0.0001 |  0.0252  0.0255 | -0.9061 -1.1880 |  1.0223  1.0143
v_err    | -0.0070 |  0.0599 | -0.5007 |  0.2409
landing_rewards |    5.35 |    4.99 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.08 |    0.08    0.09    0.05
a_f      |   -0.05    0.10 |    0.69    1.81 |   -1.49   -3.14 |    1.52    3.13
w_f      |   -0.01    0.00   -0.00 |    0.01    0.02    0.01 |   -0.04   -0.05   -0.04 |    0.03    0.05    0.04
w_rewards |   -0.69 |    0.40 |   -2.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.37 |    0.30 |    0.00 |    2.80
seeker_angles |   -0.01    0.01 |    0.11    0.11 |   -0.98   -0.99 |    1.00    1.00
cs_angles | -0.0092  0.0070 |  0.1106  0.1079 | -0.9774 -0.9899 |  0.9995  0.9989
optical_flow |  0.0002 -0.0001 |  0.0262  0.0257 | -1.1312 -1.1492 |  0.9831  1.2378
v_err    | -0.0080 |  0.0602 | -0.4533 |  0.1618
landing_rewards |    5.68 |    4.95 |    0.00 |   10.00
landing_margin |   -0.00 |    0.03 |   -0.07 |    0.09
tracking_rewards |  -36.15 |    8.52 |  -65.68 |  -22.96
steps    |     375 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.09 |    0.09    0.09    0.05
a_f      |   -0.02   -0.04 |    0.70    1.82 |   -1.52   -3.13 |    1.40    3.13
w_f      |   -0.01    0.00   -0.00 |    0.01    0.02    0.01 |   -0.04   -0.04   -0.05 |    0.03    0.05    0.04
w_rewards |   -0.64 |    0.42 |   -2.13 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.37 |    0.30 |    0.00 |    2.93
seeker_angles |   -0.01    0.00 |    0.11    0.11 |   -1.00   -1.00 |    0.99    1.00
cs_angles | -0.0085  0.0037 |  0.1114  0.1062 | -0.9997 -0.9980 |  0.9912  0.9964
optical_flow |  0.0001 -0.0000 |  0.0269  0.0261 | -1.0949 -1.0996 |  1.2479  1.5090
v_err    | -0.0077 |  0.0600 | -0.5003 |  0.1852
landing_rewards |    5.45 |    4.98 |    0.00 |   10.00
landing_margin |   -0.00 |    0.03 |   -0.08 |    0.10
tracking_rewards |  -35.58 |    8.11 |  -68.00 |  -19.47
steps    |     373 |  

glideslope |    3.00 |   12.93 |    0.01 |  438.59
norm_af  |    1.78 |    0.88 |    0.02 |    3.30
norm_wf  |    0.02 |    0.01 |    0.00 |    0.06
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.10    0.02    0.03 |    1.27    0.65    1.90 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.08 |    0.08    0.08    0.05
a_f      |    0.02    0.10 |    0.68    1.87 |   -1.44   -3.08 |    1.36    3.13
w_f      |   -0.01    0.00   -0.00 |    0.01    0.02    0.01 |   -0.05   -0.03   -0.04 |    0.03    0.05    0.03
w_rewards |   -0.62 |    0.42 |   -1.99 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.36 |    0.30 |    0.00 |    2.82
seeker_angles |   -0.01    0.00 |    0.10    0.11 |   -0.99   -1.00 |    1.

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.08 |    0.08    0.08    0.05
a_f      |   -0.02    0.18 |    0.65    1.91 |   -1.43   -3.14 |    1.52    3.11
w_f      |   -0.01    0.00   -0.00 |    0.01    0.02    0.01 |   -0.04   -0.04   -0.04 |    0.03    0.05    0.03
w_rewards |   -0.68 |    0.43 |   -1.97 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.36 |    0.30 |    0.00 |    2.99
seeker_angles |   -0.01    0.00 |    0.11    0.10 |   -1.00   -1.00 |    0.97    1.00
cs_angles | -0.0084  0.0003 |  0.1101  0.1028 | -0.9992 -0.9971 |  0.9700  0.9994
optical_flow |  0.0000  0.0001 |  0.0263  0.0257 | -1.2367 -1.1156 |  1.1584  1.1923
v_err    | -0.0085 |  0.0593 | -0.4609 |  0.1652
landing_rewards |    6.13 |    4.87 |    0.00 |   10.00
landing_margin |   -0.01 |    0.03 |   -0.08 |    0.10
tracking_rewards |  -34.36 |    8.03 |  -71.01 |  -21.55
steps    |     373 |  

glideslope |    2.93 |   13.03 |    0.01 |  434.10
norm_af  |    1.75 |    0.89 |    0.05 |    3.32
norm_wf  |    0.02 |    0.01 |    0.00 |    0.06
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.09    0.04    0.06 |    1.18    0.63    1.84 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.09 |    0.07    0.09    0.05
a_f      |    0.05    0.08 |    0.64    1.86 |   -1.39   -3.12 |    1.47    3.13
w_f      |   -0.01    0.00   -0.00 |    0.01    0.02    0.01 |   -0.04   -0.04   -0.04 |    0.03    0.06    0.04
w_rewards |   -0.60 |    0.42 |   -2.09 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.37 |    0.31 |    0.00 |    3.02
seeker_angles |   -0.01   -0.01 |    0.10    0.11 |   -1.00   -1.00 |    1.

attitude |   -0.04   -0.02    0.00 |    1.28    0.68    1.88 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.08 |    0.09    0.09    0.05
a_f      |   -0.03    0.03 |    0.67    1.87 |   -1.45   -3.13 |    1.39    3.10
w_f      |   -0.01    0.00   -0.00 |    0.01    0.02    0.01 |   -0.04   -0.05   -0.03 |    0.03    0.05    0.03
w_rewards |   -0.66 |    0.46 |   -2.34 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.36 |    0.30 |    0.00 |    2.92
seeker_angles |   -0.00   -0.00 |    0.11    0.10 |   -0.97   -1.00 |    1.00    1.00
cs_angles | -0.0039 -0.0047 |  0.1080  0.1021 | -0.9750 -0.9979 |  0.9971  0.9957
optical_flow |  0.0002 -0.0000 |  0.0271  0.0262 | -1.2074 -1.2370 |  1.5636  1.0247
v_err    | -0.0084 |  0.0583 | -0.4827 |  0.1644
landing_rewards |    6.61 |    4.73 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.00    0.02    0.11 |    1.18    0.64    1.84 |   -3.14   -1.55   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.09 |    0.08    0.08    0.05
a_f      |    0.02    0.10 |    0.66    1.82 |   -1.48   -3.11 |    1.47    3.11
w_f      |   -0.01    0.00   -0.00 |    0.01    0.02    0.01 |   -0.04   -0.05   -0.04 |    0.04    0.05    0.03
w_rewards |   -0.66 |    0.44 |   -1.96 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.36 |    0.30 |    0.00 |    2.78
seeker_angles |   -0.00    0.00 |    0.10    0.11 |   -0.99   -0.99 |    1.00    0.99
cs_angles | -0.0036  0.0022 |  0.1033  0.1064 | -0.9891 -0.9904 |  0.9966  0.9916
optical_flow | -0.0000 -0.0002 |  0.0260  0.0257 | -0.9430 -1.5806 |  1.0139  0.9297
v_err    | -0.0087 |  0.0591 | -0.4553 |  0.4568
landing_rewards |    6.23 |    4.85 |    0.00 |   10.00
landing_margin |    1

attitude |    0.11    0.03   -0.03 |    1.24    0.67    1.88 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.09 |    0.10    0.08    0.05
a_f      |    0.02   -0.02 |    0.70    1.88 |   -1.44   -3.13 |    1.39    3.14
w_f      |   -0.01    0.00   -0.00 |    0.02    0.02    0.01 |   -0.06   -0.05   -0.04 |    0.10    0.04    0.03
w_rewards |   -0.68 |    0.42 |   -1.85 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.36 |    0.31 |    0.00 |    2.98
seeker_angles |   -0.00    0.00 |    0.11    0.10 |   -0.98   -1.00 |    0.99    0.99
cs_angles | -0.0020  0.0001 |  0.1054  0.1030 | -0.9815 -0.9987 |  0.9935  0.9918
optical_flow |  0.0001 -0.0002 |  0.0271  0.0270 | -0.8971 -1.2165 |  1.4597  1.0325
v_err    | -0.0089 |  0.0580 | -0.4532 |  0.1598
landing_rewards |    6.58 |    4.74 |    0.00 |   10.00
landing_margin |    3

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.09 |    0.07    0.08    0.05
a_f      |   -0.05   -0.01 |    0.68    1.79 |   -1.51   -3.13 |    1.46    3.12
w_f      |   -0.00    0.00    0.00 |    0.02    0.02    0.01 |   -0.04   -0.05   -0.04 |    0.04    0.05    0.03
w_rewards |   -0.64 |    0.39 |   -2.23 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.34 |    0.31 |    0.00 |    3.04
seeker_angles |    0.00   -0.01 |    0.10    0.11 |   -1.00   -0.99 |    0.99    1.00
cs_angles |  0.0033 -0.0074 |  0.0991  0.1050 | -0.9966 -0.9937 |  0.9873  0.9976
optical_flow |  0.0000  0.0000 |  0.0261  0.0270 | -1.1169 -1.4696 |  1.2204  1.2146
v_err    | -0.0090 |  0.0583 | -0.4813 |  0.1664
landing_rewards |    6.65 |    4.72 |    0.00 |   10.00
landing_margin |    0.07 |    1.44 |   -0.09 |   25.34
tracking_rewards |  -32.11 |    8.71 | -119.58 |  -19.91
steps    |     374 |  

attitude |   -0.11   -0.03    0.10 |    1.19    0.66    1.83 |   -3.14   -1.52   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.08 |    0.08    0.09    0.05
a_f      |   -0.00    0.09 |    0.67    1.84 |   -1.45   -3.13 |    1.39    3.11
w_f      |   -0.01    0.00   -0.00 |    0.02    0.02    0.01 |   -0.05   -0.05   -0.03 |    0.03    0.05    0.03
w_rewards |   -0.65 |    0.41 |   -2.09 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.36 |    0.31 |    0.00 |    2.99
seeker_angles |    0.01   -0.02 |    0.11    0.10 |   -1.00   -1.00 |    0.97    1.00
cs_angles |  0.0139 -0.0195 |  0.1082  0.1033 | -0.9952 -0.9979 |  0.9736  0.9994
optical_flow |  0.0000 -0.0003 |  0.0261  0.0264 | -0.9655 -1.1899 |  1.2603  1.2744
v_err    | -0.0094 |  0.0588 | -0.4537 |  0.1525
landing_rewards |    6.58 |    4.74 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.08 |    0.09    0.08    0.05
a_f      |   -0.00    0.06 |    0.69    1.78 |   -1.47   -3.13 |    1.55    3.13
w_f      |   -0.01    0.00   -0.00 |    0.02    0.02    0.01 |   -0.10   -0.04   -0.06 |    0.03    0.06    0.03
w_rewards |   -0.72 |    0.50 |   -5.15 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.37 |    0.32 |    0.00 |    2.99
seeker_angles |    0.01   -0.01 |    0.11    0.11 |   -0.99   -0.98 |    1.00    1.00
cs_angles |  0.0084 -0.0136 |  0.1086  0.1088 | -0.9935 -0.9771 |  0.9973  0.9974
optical_flow | -0.0001 -0.0001 |  0.0263  0.0288 | -0.9282 -1.2584 |  1.0620  1.5049
v_err    | -0.0091 |  0.0587 | -0.4572 |  0.5610
landing_rewards |    7.19 |    4.49 |    0.00 |   10.00
landing_margin |    0.84 |   14.94 |   -0.08 |  263.53
tracking_rewards |  -33.87 |    8.11 |  -80.61 |  -21.30
steps    |     373 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.09 |    0.08    0.08    0.05
a_f      |   -0.01   -0.01 |    0.65    1.85 |   -1.54   -3.09 |    1.51    3.09
w_f      |   -0.01    0.00   -0.00 |    0.02    0.02    0.01 |   -0.05   -0.05   -0.03 |    0.03    0.05    0.03
w_rewards |   -0.76 |    0.44 |   -2.12 |   -0.05
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.36 |    0.32 |    0.00 |    2.96
seeker_angles |    0.00   -0.01 |    0.11    0.11 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0042 -0.0061 |  0.1130  0.1051 | -0.9957 -0.9963 |  0.9984  0.9966
optical_flow | -0.0001 -0.0000 |  0.0264  0.0267 | -1.0515 -0.8609 |  1.3410  1.3622
v_err    | -0.0091 |  0.0583 | -0.4612 |  0.1540
landing_rewards |    6.87 |    4.64 |    0.00 |   10.00
landing_margin |   -0.01 |    0.03 |   -0.07 |    0.07
tracking_rewards |  -33.58 |    9.12 |  -90.82 |  -20.10
steps    |     375 |  

attitude |    0.14   -0.05   -0.16 |    1.21    0.67    1.84 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.09 |    0.08    0.09    0.05
a_f      |   -0.06   -0.00 |    0.67    1.84 |   -1.46   -3.14 |    1.51    3.13
w_f      |   -0.01    0.00   -0.00 |    0.01    0.02    0.01 |   -0.05   -0.04   -0.05 |    0.03    0.05    0.03
w_rewards |   -0.72 |    0.41 |   -2.07 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.35 |    0.32 |    0.00 |    2.98
seeker_angles |    0.00   -0.00 |    0.10    0.11 |   -0.98   -1.00 |    1.00    0.99
cs_angles |  0.0046 -0.0014 |  0.1023  0.1051 | -0.9840 -0.9965 |  0.9967  0.9914
optical_flow | -0.0000 -0.0002 |  0.0267  0.0271 | -1.3274 -1.2758 |  1.2241  0.9325
v_err    | -0.0089 |  0.0579 | -0.4998 |  0.1700
landing_rewards |    7.10 |    4.54 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.09 |    0.08    0.08    0.05
a_f      |    0.09   -0.04 |    0.65    1.90 |   -1.50   -3.14 |    1.45    3.13
w_f      |   -0.00    0.00   -0.00 |    0.02    0.02    0.01 |   -0.05   -0.04   -0.05 |    0.04    0.05    0.03
w_rewards |   -0.68 |    0.40 |   -2.10 |   -0.02
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.35 |    0.32 |    0.00 |    3.03
seeker_angles |   -0.00    0.00 |    0.11    0.10 |   -0.99   -1.00 |    1.00    0.99
cs_angles | -0.0017  0.0012 |  0.1071  0.1023 | -0.9948 -0.9997 |  0.9972  0.9940
optical_flow | -0.0002 -0.0000 |  0.0267  0.0274 | -1.3495 -1.3191 |  1.1635  1.2722
v_err    | -0.0088 |  0.0579 | -0.4587 |  0.2067
landing_rewards |    6.97 |    4.60 |    0.00 |   10.00
landing_margin |   -0.01 |    0.03 |   -0.07 |    0.16
tracking_rewards |  -32.04 |    7.88 |  -76.36 |  -17.34
steps    |     374 |  

attitude |   -0.02    0.01    0.04 |    1.26    0.64    1.88 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.09 |    0.08    0.08    0.05
a_f      |    0.01    0.09 |    0.63    1.85 |   -1.51   -3.13 |    1.32    3.14
w_f      |   -0.01    0.00   -0.00 |    0.01    0.02    0.01 |   -0.04   -0.04   -0.03 |    0.03    0.04    0.03
w_rewards |   -0.63 |    0.38 |   -2.09 |   -0.02
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.35 |    0.32 |    0.00 |    2.94
seeker_angles |    0.00    0.00 |    0.10    0.11 |   -1.00   -1.00 |    0.99    1.00
cs_angles |  0.0012  0.0025 |  0.1037  0.1060 | -0.9953 -0.9984 |  0.9938  0.9976
optical_flow |  0.0001 -0.0002 |  0.0263  0.0277 | -1.1892 -1.4804 |  1.1102  0.9395
v_err    | -0.0084 |  0.0575 | -0.4580 |  0.4825
landing_rewards |    7.19 |    4.49 |    0.00 |   10.00
landing_margin |    1

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.08   -0.09 |    0.08    0.08    0.05
a_f      |    0.06    0.10 |    0.67    1.84 |   -1.53   -3.14 |    1.48    3.13
w_f      |   -0.01    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.04   -0.03 |    0.03    0.05    0.04
w_rewards |   -0.65 |    0.40 |   -3.19 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.35 |    0.32 |    0.00 |    3.07
seeker_angles |    0.00    0.01 |    0.10    0.10 |   -0.98   -1.00 |    0.99    0.99
cs_angles |  0.0049  0.0058 |  0.1032  0.1008 | -0.9767 -0.9993 |  0.9947  0.9928
optical_flow |  0.0001 -0.0001 |  0.0263  0.0276 | -0.9885 -1.2058 |  1.1903  1.1822
v_err    | -0.0085 |  0.0585 | -0.4570 |  0.4527
landing_rewards |    7.00 |    4.58 |    0.00 |   10.00
landing_margin |    1.22 |   21.67 |   -0.08 |  382.16
tracking_rewards |  -31.52 |    7.68 |  -92.70 |  -17.33
steps    |     374 |  

attitude |   -0.06    0.02   -0.04 |    1.26    0.66    1.93 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.08 |    0.08    0.09    0.05
a_f      |    0.01    0.04 |    0.68    1.90 |   -1.41   -3.13 |    1.41    3.12
w_f      |   -0.01    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.05   -0.04 |    0.03    0.04    0.03
w_rewards |   -0.66 |    0.38 |   -1.72 |   -0.01
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.32 |    0.00 |    3.01
seeker_angles |    0.00    0.00 |    0.10    0.10 |   -0.97   -1.00 |    1.00    0.99
cs_angles |  0.0040  0.0029 |  0.1018  0.0967 | -0.9730 -0.9962 |  0.9958  0.9885
optical_flow |  0.0001 -0.0002 |  0.0268  0.0277 | -1.1917 -1.1217 |  1.2390  1.1134
v_err    | -0.0084 |  0.0575 | -0.4529 |  0.1877
landing_rewards |    7.13 |    4.52 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.03   -0.03   -0.00 |    1.33    0.67    1.87 |   -3.14   -1.55   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.08 |    0.08    0.09    0.05
a_f      |   -0.03   -0.05 |    0.68    1.85 |   -1.42   -3.13 |    1.43    3.09
w_f      |   -0.01    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.04   -0.04 |    0.03    0.04    0.02
w_rewards |   -0.70 |    0.38 |   -2.12 |   -0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.35 |    0.32 |    0.00 |    3.05
seeker_angles |    0.01    0.00 |    0.10    0.10 |   -0.99   -0.99 |    1.00    0.99
cs_angles |  0.0055  0.0017 |  0.0979  0.1010 | -0.9869 -0.9949 |  0.9970  0.9942
optical_flow | -0.0002 -0.0003 |  0.0261  0.0274 | -1.0115 -1.3697 |  1.1478  0.8862
v_err    | -0.0084 |  0.0576 | -0.4579 |  0.1445
landing_rewards |    7.58 |    4.28 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.08 |    0.08    0.08    0.07
a_f      |   -0.06   -0.12 |    0.70    1.87 |   -1.51   -3.11 |    1.54    3.14
w_f      |   -0.01    0.00   -0.00 |    0.02    0.01    0.01 |   -0.10   -0.03   -0.04 |    0.03    0.04    0.07
w_rewards |   -0.72 |    0.46 |   -5.07 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.35 |    0.32 |    0.00 |    3.02
seeker_angles |    0.01    0.00 |    0.10    0.10 |   -1.00   -1.00 |    0.99    1.00
cs_angles |  0.0055  0.0008 |  0.0987  0.1029 | -0.9951 -0.9951 |  0.9906  0.9994
optical_flow |  0.0000 -0.0001 |  0.0270  0.0280 | -1.2809 -1.2300 |  1.0449  1.1187
v_err    | -0.0081 |  0.0582 | -0.4684 |  0.5073
landing_rewards |    7.42 |    4.38 |    0.00 |   10.00
landing_margin |    2.48 |   43.89 |   -0.08 |  774.08
tracking_rewards |  -30.76 |    7.23 |  -63.96 |  -18.52
steps    |     373 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.09 |    0.09    0.08    0.05
a_f      |    0.00   -0.03 |    0.66    1.78 |   -1.41   -3.13 |    1.48    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.04   -0.04 |    0.03    0.03    0.03
w_rewards |   -0.68 |    0.41 |   -2.50 |   -0.01
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.35 |    0.32 |    0.00 |    3.07
seeker_angles |    0.01   -0.00 |    0.10    0.10 |   -0.99   -1.00 |    1.00    0.99
cs_angles |  0.0058 -0.0021 |  0.1023  0.0991 | -0.9880 -0.9966 |  0.9963  0.9907
optical_flow |  0.0001  0.0000 |  0.0273  0.0283 | -1.1120 -1.1242 |  1.1345  1.1768
v_err    | -0.0080 |  0.0575 | -0.4970 |  0.1790
landing_rewards |    7.55 |    4.30 |    0.00 |   10.00
landing_margin |   -0.02 |    0.03 |   -0.07 |    0.09
tracking_rewards |  -30.61 |    6.83 |  -66.92 |  -18.92
steps    |     374 |  

attitude |    0.00   -0.01   -0.04 |    1.19    0.70    1.78 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.08 |    0.07    0.09    0.05
a_f      |    0.00   -0.07 |    0.70    1.75 |   -1.41   -3.11 |    1.47    3.14
w_f      |   -0.00   -0.00   -0.00 |    0.02    0.01    0.01 |   -0.10   -0.04   -0.04 |    0.04    0.03    0.03
w_rewards |   -0.69 |    0.38 |   -2.00 |   -0.04
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.32 |    0.00 |    3.02
seeker_angles |    0.00   -0.00 |    0.10    0.10 |   -0.99   -1.00 |    0.98    0.99
cs_angles |  0.0049 -0.0013 |  0.1004  0.0998 | -0.9916 -0.9973 |  0.9806  0.9913
optical_flow | -0.0001 -0.0002 |  0.0282  0.0285 | -1.0751 -1.0041 |  1.3318  1.3654
v_err    | -0.0082 |  0.0581 | -0.4944 |  0.1837
landing_rewards |    7.77 |    4.16 |    0.00 |   10.00
landing_margin |    3

attitude |    0.01   -0.06    0.00 |    1.31    0.63    1.92 |   -3.14   -1.54   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.09 |    0.07    0.08    0.05
a_f      |   -0.06    0.11 |    0.63    1.92 |   -1.33   -3.14 |    1.38    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.04   -0.03 |    0.03    0.04    0.02
w_rewards |   -0.67 |    0.36 |   -2.09 |   -0.03
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.32 |    0.00 |    2.92
seeker_angles |    0.00    0.00 |    0.10    0.10 |   -1.00   -1.00 |    1.00    0.97
cs_angles |  0.0041  0.0026 |  0.1004  0.1030 | -0.9964 -0.9980 |  0.9976  0.9688
optical_flow |  0.0000 -0.0001 |  0.0285  0.0268 | -1.3949 -1.2198 |  1.2065  1.1396
v_err    | -0.0084 |  0.0576 | -0.4515 |  0.1796
landing_rewards |    7.52 |    4.32 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.04    0.01    0.10 |    1.30    0.72    1.88 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.09 |    0.08    0.09    0.05
a_f      |    0.00    0.18 |    0.72    1.85 |   -1.44   -3.12 |    1.56    3.13
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.04   -0.04 |    0.04    0.04    0.03
w_rewards |   -0.72 |    0.38 |   -1.91 |   -0.01
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.35 |    0.32 |    0.00 |    3.12
seeker_angles |    0.00    0.00 |    0.10    0.11 |   -1.00   -1.00 |    1.00    0.98
cs_angles |  0.0040  0.0033 |  0.0996  0.1078 | -0.9996 -0.9955 |  0.9978  0.9820
optical_flow |  0.0001 -0.0001 |  0.0264  0.0283 | -1.0009 -1.2100 |  1.4227  1.1781
v_err    | -0.0088 |  0.0578 | -0.4516 |  0.4023
landing_rewards |    7.39 |    4.39 |    0.00 |   10.00
landing_margin |    1

attitude |    0.05    0.03    0.02 |    1.23    0.67    1.86 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.08    0.09    0.05
a_f      |    0.03    0.02 |    0.66    1.85 |   -1.43   -3.13 |    1.48    3.14
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.03    0.04    0.03
w_rewards |   -0.68 |    0.39 |   -1.79 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.31 |    0.00 |    3.13
seeker_angles |    0.00    0.00 |    0.09    0.10 |   -0.99   -1.00 |    0.99    0.99
cs_angles |  0.0027  0.0039 |  0.0942  0.0972 | -0.9947 -0.9964 |  0.9932  0.9942
optical_flow | -0.0001 -0.0000 |  0.0277  0.0274 | -1.2231 -1.2959 |  1.1181  1.5363
v_err    | -0.0090 |  0.0577 | -0.4540 |  0.1645
landing_rewards |    7.35 |    4.41 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.09 |    0.07    0.08    0.05
a_f      |   -0.01   -0.10 |    0.64    1.87 |   -1.49   -3.13 |    1.51    3.12
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.04   -0.03 |    0.04    0.04    0.03
w_rewards |   -0.75 |    0.39 |   -1.76 |   -0.03
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.31 |    0.00 |    3.04
seeker_angles |    0.00    0.01 |    0.09    0.10 |   -0.99   -1.00 |    0.97    0.99
cs_angles |  0.0038  0.0056 |  0.0921  0.0956 | -0.9891 -0.9996 |  0.9740  0.9892
optical_flow | -0.0002 -0.0002 |  0.0275  0.0271 | -1.0250 -1.1151 |  0.9920  1.1800
v_err    | -0.0089 |  0.0574 | -0.4532 |  0.1468
landing_rewards |    8.06 |    3.95 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.08 |    0.08
tracking_rewards |  -29.16 |    5.88 |  -57.66 |  -18.16
steps    |     375 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.09 |    0.08    0.09    0.05
a_f      |    0.01    0.30 |    0.61    1.77 |   -1.32   -3.13 |    1.43    3.12
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.04   -0.03 |    0.03    0.04    0.03
w_rewards |   -0.70 |    0.38 |   -2.10 |   -0.01
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.31 |    0.00 |    3.01
seeker_angles |    0.00    0.01 |    0.09    0.10 |   -0.99   -0.99 |    1.00    0.97
cs_angles |  0.0031  0.0053 |  0.0942  0.0998 | -0.9913 -0.9924 |  0.9987  0.9721
optical_flow | -0.0000 -0.0001 |  0.0290  0.0271 | -1.2518 -1.1366 |  1.2690  1.0564
v_err    | -0.0088 |  0.0576 | -0.4519 |  0.1642
landing_rewards |    7.97 |    4.02 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.07
tracking_rewards |  -29.78 |    6.45 |  -63.53 |  -18.23
steps    |     376 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.09 |    0.08    0.09    0.05
a_f      |    0.02   -0.04 |    0.68    1.80 |   -1.51   -3.13 |    1.55    3.14
w_f      |   -0.01    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.04   -0.04 |    0.03    0.03    0.02
w_rewards |   -0.72 |    0.40 |   -2.12 |   -0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.31 |    0.00 |    2.99
seeker_angles |    0.01    0.00 |    0.10    0.10 |   -0.99   -1.00 |    0.99    0.99
cs_angles |  0.0050  0.0018 |  0.0953  0.0977 | -0.9867 -0.9968 |  0.9939  0.9943
optical_flow | -0.0001 -0.0000 |  0.0283  0.0278 | -1.2137 -1.2467 |  1.5175  1.3305
v_err    | -0.0092 |  0.0573 | -0.4626 |  0.1755
landing_rewards |    7.94 |    4.05 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.09
tracking_rewards |  -29.65 |    6.65 |  -62.82 |  -17.29
steps    |     377 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.09 |    0.08    0.08    0.05
a_f      |    0.01   -0.00 |    0.70    1.75 |   -1.50   -3.11 |    1.42    3.13
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.03    0.04    0.03
w_rewards |   -0.70 |    0.38 |   -1.82 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.31 |    0.00 |    3.09
seeker_angles |    0.01    0.00 |    0.10    0.10 |   -0.99   -1.00 |    0.99    0.99
cs_angles |  0.0056  0.0043 |  0.0975  0.0972 | -0.9948 -0.9950 |  0.9863  0.9922
optical_flow | -0.0002 -0.0002 |  0.0275  0.0281 | -0.9271 -1.1938 |  1.2018  1.0177
v_err    | -0.0095 |  0.0572 | -0.4547 |  0.1507
landing_rewards |    7.84 |    4.12 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.06
tracking_rewards |  -29.89 |    6.34 |  -56.99 |  -17.53
steps    |     376 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.09 |    0.07    0.09    0.05
a_f      |   -0.03   -0.01 |    0.67    1.75 |   -1.47   -3.07 |    1.53    3.14
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.04   -0.03 |    0.03    0.03    0.03
w_rewards |   -0.69 |    0.40 |   -1.87 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.31 |    0.00 |    3.05
seeker_angles |    0.00    0.00 |    0.10    0.10 |   -0.99   -1.00 |    1.00    1.00
cs_angles |  0.0031  0.0021 |  0.0972  0.1010 | -0.9856 -0.9983 |  0.9996  0.9966
optical_flow | -0.0001 -0.0000 |  0.0290  0.0276 | -1.3310 -1.0233 |  1.3289  1.3303
v_err    | -0.0095 |  0.0574 | -0.4513 |  0.1450
landing_rewards |    7.74 |    4.18 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.08 |    0.07
tracking_rewards |  -30.01 |    7.48 |  -58.68 |  -17.28
steps    |     374 |  

attitude |   -0.04   -0.03    0.13 |    1.22    0.68    1.82 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.08 |    0.08    0.08    0.05
a_f      |   -0.02    0.07 |    0.65    1.81 |   -1.56   -3.14 |    1.50    3.08
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.04   -0.03 |    0.04    0.04    0.03
w_rewards |   -0.63 |    0.37 |   -1.95 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.31 |    0.00 |    3.11
seeker_angles |    0.00   -0.00 |    0.10    0.10 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0023 -0.0004 |  0.0981  0.0969 | -0.9971 -0.9986 |  0.9999  0.9976
optical_flow | -0.0002 -0.0002 |  0.0285  0.0270 | -1.3851 -1.1475 |  1.1527  1.1740
v_err    | -0.0089 |  0.0569 | -0.4529 |  0.1557
landing_rewards |    8.32 |    3.74 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.08 |    0.09    0.09    0.05
a_f      |   -0.03    0.06 |    0.66    1.92 |   -1.37   -3.12 |    1.53    3.13
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.04    0.03    0.03
w_rewards |   -0.69 |    0.39 |   -2.05 |   -0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.34 |    0.32 |    0.00 |    3.00
seeker_angles |   -0.00   -0.00 |    0.10    0.10 |   -0.99   -0.99 |    0.99    0.99
cs_angles | -0.0002 -0.0020 |  0.0987  0.0994 | -0.9916 -0.9865 |  0.9925  0.9855
optical_flow | -0.0002 -0.0002 |  0.0273  0.0269 | -1.7593 -1.2850 |  1.2770  1.1710
v_err    | -0.0092 |  0.0570 | -0.4522 |  0.2122
landing_rewards |    7.84 |    4.12 |    0.00 |   10.00
landing_margin |   -0.02 |    0.03 |   -0.06 |    0.09
tracking_rewards |  -30.11 |    6.94 |  -58.13 |  -17.71
steps    |     375 |  

attitude |    0.04   -0.03   -0.20 |    1.11    0.65    1.76 |   -3.14   -1.56   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.08 |    0.09    0.09    0.05
a_f      |   -0.01   -0.13 |    0.65    1.75 |   -1.54   -3.14 |    1.50    3.10
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.04   -0.03 |    0.03    0.03    0.03
w_rewards |   -0.70 |    0.39 |   -2.36 |   -0.02
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.31 |    0.00 |    2.96
seeker_angles |   -0.00    0.00 |    0.10    0.10 |   -0.98   -1.00 |    1.00    1.00
cs_angles | -0.0027  0.0011 |  0.0967  0.1012 | -0.9789 -1.0000 |  0.9951  0.9983
optical_flow | -0.0000 -0.0000 |  0.0285  0.0267 | -1.4658 -1.3012 |  1.6239  1.2284
v_err    | -0.0090 |  0.0571 | -0.4536 |  0.2249
landing_rewards |    7.84 |    4.12 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.06   -0.01   -0.15 |    1.24    0.63    1.91 |   -3.14   -1.56   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.09    0.08    0.05
a_f      |   -0.01   -0.08 |    0.63    1.91 |   -1.46   -3.12 |    1.41    3.11
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.05    0.04    0.03
w_rewards |   -0.65 |    0.36 |   -2.44 |   -0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.31 |    0.00 |    2.92
seeker_angles |   -0.00    0.00 |    0.10    0.10 |   -1.00   -0.99 |    1.00    1.00
cs_angles | -0.0021  0.0022 |  0.0961  0.0976 | -0.9997 -0.9936 |  0.9987  0.9950
optical_flow | -0.0000 -0.0001 |  0.0284  0.0280 | -1.1532 -1.2557 |  1.3110  1.3928
v_err    | -0.0087 |  0.0565 | -0.4537 |  0.1774
landing_rewards |    8.00 |    4.00 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.09    0.08    0.05
a_f      |   -0.00   -0.15 |    0.68    1.84 |   -1.51   -3.10 |    1.43    3.13
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.04   -0.04 |    0.04    0.03    0.03
w_rewards |   -0.69 |    0.37 |   -2.10 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.32 |    0.31 |    0.00 |    3.03
seeker_angles |    0.00    0.01 |    0.10    0.10 |   -1.00   -1.00 |    0.99    0.99
cs_angles |  0.0016  0.0060 |  0.0971  0.0963 | -0.9991 -0.9957 |  0.9854  0.9912
optical_flow | -0.0001 -0.0001 |  0.0268  0.0275 | -1.0672 -1.3071 |  0.9375  1.2707
v_err    | -0.0087 |  0.0570 | -0.4526 |  0.1523
landing_rewards |    7.77 |    4.16 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.06
tracking_rewards |  -29.00 |    6.79 |  -61.39 |  -17.47
steps    |     374 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.08    0.09    0.05
a_f      |   -0.01   -0.01 |    0.64    1.85 |   -1.37   -3.14 |    1.46    3.14
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.04    0.04    0.03
w_rewards |   -0.67 |    0.34 |   -1.71 |   -0.08
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.31 |    0.00 |    3.09
seeker_angles |   -0.00    0.00 |    0.09    0.10 |   -0.99   -0.99 |    1.00    0.99
cs_angles | -0.0015  0.0036 |  0.0948  0.0962 | -0.9914 -0.9946 |  0.9969  0.9949
optical_flow | -0.0001 -0.0003 |  0.0271  0.0266 | -1.0849 -1.0780 |  1.2110  1.3050
v_err    | -0.0092 |  0.0573 | -0.4540 |  0.1519
landing_rewards |    8.29 |    3.76 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.06
tracking_rewards |  -28.91 |    6.47 |  -55.62 |  -18.03
steps    |     375 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.08    0.09    0.05
a_f      |    0.01    0.09 |    0.66    1.83 |   -1.41   -3.14 |    1.50    3.14
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.04 |    0.03    0.03    0.03
w_rewards |   -0.66 |    0.36 |   -1.90 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.31 |    0.00 |    3.04
seeker_angles |   -0.00    0.00 |    0.09    0.09 |   -0.99   -1.00 |    0.98    1.00
cs_angles | -0.0010  0.0022 |  0.0943  0.0927 | -0.9901 -0.9989 |  0.9769  0.9995
optical_flow | -0.0001 -0.0001 |  0.0277  0.0270 | -1.2218 -1.2123 |  1.4890  1.5009
v_err    | -0.0087 |  0.0564 | -0.4540 |  0.1470
landing_rewards |    7.71 |    4.20 |    0.00 |   10.00
landing_margin |   -0.01 |    0.02 |   -0.08 |    0.06
tracking_rewards |  -28.44 |    5.58 |  -50.64 |  -17.63
steps    |     374 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.08    0.09    0.05
a_f      |   -0.03    0.14 |    0.62    1.82 |   -1.50   -3.11 |    1.47    3.14
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.05   -0.03   -0.03 |    0.04    0.03    0.03
w_rewards |   -0.64 |    0.38 |   -1.88 |   -0.03
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.32 |    0.31 |    0.00 |    3.06
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -1.00 |    0.99    0.98
cs_angles |  0.0031  0.0024 |  0.0931  0.0949 | -0.9919 -0.9956 |  0.9869  0.9841
optical_flow | -0.0003 -0.0001 |  0.0274  0.0274 | -1.5589 -0.9668 |  1.0249  1.3886
v_err    | -0.0090 |  0.0571 | -0.4527 |  0.1470
landing_rewards |    7.45 |    4.36 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.10
tracking_rewards |  -28.45 |    6.08 |  -55.01 |  -16.57
steps    |     374 |  

attitude |   -0.09    0.04   -0.02 |    1.13    0.65    1.80 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.08 |    0.08    0.08    0.05
a_f      |    0.05   -0.03 |    0.65    1.79 |   -1.42   -3.13 |    1.47    3.14
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.04 |    0.04    0.03    0.03
w_rewards |   -0.64 |    0.36 |   -1.64 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.32 |    0.00 |    3.10
seeker_angles |    0.00    0.00 |    0.10    0.10 |   -0.98   -1.00 |    0.98    1.00
cs_angles |  0.0048  0.0014 |  0.0964  0.0995 | -0.9827 -0.9998 |  0.9838  0.9980
optical_flow |  0.0001 -0.0001 |  0.0268  0.0251 | -1.5174 -1.0892 |  1.1637  1.2648
v_err    | -0.0089 |  0.0573 | -0.4512 |  0.1981
landing_rewards |    7.90 |    4.07 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.01   -0.02    0.05 |    1.15    0.65    1.83 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.09 |    0.08    0.08    0.05
a_f      |   -0.02    0.06 |    0.67    1.82 |   -1.48   -3.14 |    1.54    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.04    0.03    0.03
w_rewards |   -0.59 |    0.36 |   -1.93 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.32 |    0.00 |    3.12
seeker_angles |    0.00   -0.00 |    0.10    0.10 |   -0.99   -1.00 |    0.99    1.00
cs_angles |  0.0007 -0.0000 |  0.0983  0.0961 | -0.9914 -1.0000 |  0.9857  0.9982
optical_flow | -0.0000 -0.0002 |  0.0279  0.0257 | -1.0588 -0.9277 |  1.0367  1.1945
v_err    | -0.0092 |  0.0574 | -0.4516 |  0.1498
landing_rewards |    8.00 |    4.00 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.02    0.03    0.21 |    1.19    0.65    1.84 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.08 |    0.08    0.08    0.05
a_f      |    0.03    0.14 |    0.65    1.82 |   -1.44   -3.14 |    1.38    3.11
w_f      |   -0.00    0.00   -0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.04    0.03    0.03
w_rewards |   -0.64 |    0.38 |   -2.19 |   -0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.32 |    0.32 |    0.00 |    2.96
seeker_angles |    0.00    0.00 |    0.10    0.10 |   -0.99   -0.98 |    1.00    1.00
cs_angles |  0.0027  0.0020 |  0.0960  0.0961 | -0.9882 -0.9828 |  0.9976  0.9968
optical_flow | -0.0001 -0.0001 |  0.0290  0.0264 | -1.0727 -1.1386 |  1.3008  1.2506
v_err    | -0.0085 |  0.0571 | -0.4528 |  0.1365
landing_rewards |    8.19 |    3.85 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.02   -0.02    0.08 |    1.11    0.66    1.78 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.09    0.08    0.05
a_f      |   -0.02    0.10 |    0.66    1.76 |   -1.40   -3.13 |    1.43    3.12
w_f      |   -0.00    0.00    0.00 |    0.02    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.03    0.03    0.03
w_rewards |   -0.62 |    0.39 |   -2.21 |   -0.01
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.33 |    0.33 |    0.00 |    3.09
seeker_angles |    0.00    0.00 |    0.10    0.10 |   -0.99   -0.98 |    0.99    1.00
cs_angles |  0.0033  0.0041 |  0.0979  0.0980 | -0.9925 -0.9844 |  0.9906  0.9969
optical_flow | -0.0001 -0.0000 |  0.0285  0.0255 | -1.3703 -0.9855 |  1.0397  1.2835
v_err    | -0.0088 |  0.0573 | -0.4517 |  0.1628
landing_rewards |    7.87 |    4.09 |    0.00 |   10.00
landing_margin |   -0

norm_thrust |    1.02 |    0.78 |    0.00 |    3.46
fuel     |    1.81 |    0.23 |    1.29 |    2.67
rewards  |  -27.04 |   11.23 | -164.20 |  -12.02
fuel_rewards |   -5.19 |    0.67 |   -7.65 |   -3.73
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.89 |   13.41 |    0.01 |  851.45
norm_af  |    1.76 |    0.87 |    0.05 |    3.31
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.03    0.05    0.02 |    1.21    0.65    1.85 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.08 |    0.08    0.08    0.08
a_f      |    0.05   -0.01 |    0.67    1.84 |   -1.41   -3.12 |    1.46    3.13
w_f      |   -0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.

ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0022   0.0098   8.0871   2.2896   2.8947
Update Cnt = 1000    ET =   1086.7   Stats:  Mean, Std, Min, Max
r_f      |   12.39   -3.73   -4.76 |  184.03  180.42  200.86 | -379.52 -394.12 -385.33 |  386.55  389.13  387.25
v_f      |   -0.00   -0.00   -0.00 |    0.05    0.05    0.05 |   -0.10   -0.15   -0.11 |    0.12    0.12    0.14
r_i      |   31.01  -53.33  -10.08 |  688.28  686.40  746.38 |-1294.06-1320.23-1313.92 | 1294.26 1304.74 1296.70
v_i      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.10    0.09
norm_rf  |    0.40 |    0.17 |    0.09 |    1.13
norm_vf  |    0.08 |    0.02 |    0.03 |    0.17
gs_f     |    1.28 |    2.11 |    0.01 |   19.88
thrust   |   -0.00    0.00   -0.00 |    0.73    0.73    0.73 |   -3.45   -3.46   -3.46 |    3.46    3.44    3.45
norm_thrust |    1.00 |    0.78 |    0.00 |    3.46
fuel     |    1.77 |    0.23 |    1.33 |    2.58
rewards  |  -25.92 

ADV1:  0.003984422698973924 0.013236755844246492 0.06591610513728141 -0.10514347214768016
ADV2:  -0.010240421904834362 0.9218347240380346 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2687   0.7307   3.8812  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0055   0.0032   0.0122   8.0871   2.2896   2.8947
***** Episode 31327, Mean R = -25.7  Std R = 9.0  Min R = -46.5
PolicyLoss: -0.0138
Policy_Beta: 0.1
Policy_Entropy: 0.119
Policy_KL: 0.0012
Policy_SD: 0.577
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 1.1e+07
VF_0_ExplainedVarNew: 0.971
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 0.0132


ADV1:  0.0030342872942472855 0.01275806624778258 0.08886422916736231 -0.09362408386335391
ADV2:  -0.011430472716347733 0.9099495994485967 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3583   0.6083   3.5621  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0032   0.0018   0.0076   8.0871   2.2896   2.8947
U

ADV1:  -0.0020374283200408206 0.015280196424467079 0.054976232632356015 -0.0967217664281646
ADV2:  0.0167947887494811 0.9355573915411601 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6105   0.6185   3.1175  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0015   0.0057   8.0871   2.2896   2.8947
***** Episode 31606, Mean R = -25.6  Std R = 8.7  Min R = -42.4
PolicyLoss: -0.0116
Policy_Beta: 0.1
Policy_Entropy: 0.12
Policy_KL: 0.00131
Policy_SD: 0.572
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.11e+07
VF_0_ExplainedVarNew: 0.957
VF_0_ExplainedVarOld: 0.953
VF_0_Loss : 0.0129


ADV1:  0.0017837727274478737 0.012335734017765552 0.08179603994894961 -0.07012093615703759
ADV2:  -0.007052524464574147 0.9286224497235281 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5119   1.6736   8.5194  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0016   0.0061   8.0871   2.2896   2.8947


ADV1:  0.00010265703123411934 0.016517756179533088 0.08604259841854417 -0.15368794742506542
ADV2:  0.007041710633021504 0.9194102023054959 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4794   0.7001   3.3445  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0004   0.0018   8.0871   2.2896   2.8947
***** Episode 31885, Mean R = -28.1  Std R = 9.6  Min R = -45.9
PolicyLoss: -0.012
Policy_Beta: 0.1
Policy_Entropy: 0.12
Policy_KL: 0.00109
Policy_SD: 0.604
Policy_lr_mult: 0.198
Steps: 1.13e+04
TotalSteps: 1.13e+07
VF_0_ExplainedVarNew: 0.962
VF_0_ExplainedVarOld: 0.951
VF_0_Loss : 0.0108


ADV1:  0.0034861212415341703 0.014631532764223841 0.07422575760146977 -0.1621667921402956
ADV2:  0.0003846870297055398 0.8803574315766916 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4309   1.2168   6.4214  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0042   0.0025   0.0091   8.0871   2.2896   2.8947


ADV1:  0.0012939219952828598 0.01476984194204196 0.06557970806278848 -0.0848358565720696
ADV2:  0.002172289360208282 0.9261749931714643 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6378   0.8181   3.7251  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0034   8.0871   2.2896   2.8947
***** Episode 32164, Mean R = -27.4  Std R = 9.4  Min R = -50.8
PolicyLoss: -0.013
Policy_Beta: 0.1
Policy_Entropy: 0.121
Policy_KL: 0.00118
Policy_SD: 0.598
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.14e+07
VF_0_ExplainedVarNew: 0.964
VF_0_ExplainedVarOld: 0.962
VF_0_Loss : 0.0109


ADV1:  0.0005686047882237429 0.01464352348782192 0.08619405831500854 -0.19024316591236023
ADV2:  0.009654357808060033 0.8777712897511641 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5418   1.0706   5.4605  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0020   8.0871   2.2896   2.8947
***

ADV1:  -0.0009972676893204974 0.011858557701462923 0.05580323288838073 -0.11243757843336011
ADV2:  0.022359850046611587 0.8859754437382246 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5096   1.9162   8.2923  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0024   8.0871   2.2896   2.8947
***** Episode 32443, Mean R = -24.2  Std R = 7.1  Min R = -38.0
PolicyLoss: -0.0223
Policy_Beta: 0.1
Policy_Entropy: 0.124
Policy_KL: 0.00107
Policy_SD: 0.555
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.15e+07
VF_0_ExplainedVarNew: 0.973
VF_0_ExplainedVarOld: 0.971
VF_0_Loss : 0.00738


ADV1:  0.002065720424414006 0.011529692311240588 0.07222993602731698 -0.06025684282022159
ADV2:  -0.00512775419829971 0.9342294903248817 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1917   0.8476   4.2405  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0014   0.0053   8.0871   2.2896   2.894

ADV1:  -0.0034055183288878273 0.01408881022115952 0.08779760770531514 -0.1113388825542132
ADV2:  0.020654588604933626 0.9117085076691601 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3646   0.5709   3.2462  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0036   0.0020   0.0089   8.0871   2.2896   2.8947
***** Episode 32722, Mean R = -24.5  Std R = 7.4  Min R = -45.4
PolicyLoss: -0.00741
Policy_Beta: 0.1
Policy_Entropy: 0.123
Policy_KL: 0.00138
Policy_SD: 0.576
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.16e+07
VF_0_ExplainedVarNew: 0.961
VF_0_ExplainedVarOld: 0.957
VF_0_Loss : 0.0116


ADV1:  0.0020182637407578094 0.014949207116806985 0.2999903512639215 -0.11101294421127
ADV2:  -0.0010653885475380392 0.8344623196211259 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1323   0.6432   3.2474  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0012   0.0054   8.0871   2.2896   2.8947
*

ADV1:  0.0030773224030647204 0.023861333232052886 0.5032336618079252 -0.11264573588031257
ADV2:  -0.025375202536381036 0.7669868679326145 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3674   0.7600   4.0505  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0035   0.0021   0.0080   8.0871   2.2896   2.8947
***** Episode 33001, Mean R = -24.0  Std R = 7.9  Min R = -51.7
PolicyLoss: 0.016
Policy_Beta: 0.1
Policy_Entropy: 0.124
Policy_KL: 0.00153
Policy_SD: 0.564
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.17e+07
VF_0_ExplainedVarNew: 0.945
VF_0_ExplainedVarOld: 0.886
VF_0_Loss : 0.016


ADV1:  0.0010155545470128895 0.014874374527200127 0.0755425983858839 -0.0917747152436954
ADV2:  -0.0033855861511536945 0.9272528491587066 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0322   0.3629   2.1156  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0007   0.0030   8.0871   2.2896   2.8947
**

ADV1:  0.0028712582893418363 0.012893790757514593 0.14401698073480218 -0.05596096760622271
ADV2:  -0.015154479043021552 0.9248930544579308 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5173   0.6014   3.4715  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0031   0.0018   0.0072   8.0871   2.2896   2.8947
***** Episode 33280, Mean R = -25.3  Std R = 6.6  Min R = -45.1
PolicyLoss: -0.00367
Policy_Beta: 0.1
Policy_Entropy: 0.121
Policy_KL: 0.00106
Policy_SD: 0.588
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.18e+07
VF_0_ExplainedVarNew: 0.969
VF_0_ExplainedVarOld: 0.966
VF_0_Loss : 0.0165


ADV1:  -0.00342431257281174 0.01595719769708318 0.1099434850369512 -0.20989915048746555
ADV2:  0.02617649071505546 0.8914152785126118 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6161   1.0420   5.3723  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0039   0.0024   0.0087   8.0871   2.2896   2.8947
*

ADV1:  0.001045652339752024 0.012748956300534504 0.07827691968154782 -0.09015445437948874
ADV2:  0.008930053348796 0.8802511032188429 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8735   0.4013   2.1146  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0027   8.0871   2.2896   2.8947
***** Episode 33559, Mean R = -22.6  Std R = 7.0  Min R = -44.9
PolicyLoss: -0.0191
Policy_Beta: 0.1
Policy_Entropy: 0.125
Policy_KL: 0.00109
Policy_SD: 0.559
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.19e+07
VF_0_ExplainedVarNew: 0.969
VF_0_ExplainedVarOld: 0.964
VF_0_Loss : 0.0146


ADV1:  -0.0020799190326980903 0.012262755429173992 0.07412566254908615 -0.07104972538212731
ADV2:  0.016428785968766187 0.9302972773922663 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6788   0.7364   3.7813  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0013   0.0053   8.0871   2.2896   2.8947
**

cs_angles |  0.0024  0.0016 |  0.0945  0.0991 | -0.9974 -0.9954 |  0.9997  0.9845
optical_flow | -0.0001 -0.0001 |  0.0292  0.0267 | -1.1892 -1.1393 |  1.3270  0.9732
v_err    | -0.0088 |  0.0565 | -0.4512 |  0.1394
landing_rewards |    8.45 |    3.62 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.06
tracking_rewards |  -28.19 |    5.84 |  -49.61 |  -17.41
steps    |     374 |      19 |     334 |     415
***** Episode 33838, Mean R = -27.1  Std R = 8.1  Min R = -43.4
PolicyLoss: -0.0132
Policy_Beta: 0.1
Policy_Entropy: 0.124
Policy_KL: 0.00106
Policy_SD: 0.586
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.2e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.962
VF_0_Loss : 0.0161


ADV1:  -0.0003359580316280699 0.013875610895883215 0.08848006887726112 -0.11143684135687892
ADV2:  0.011468854106136506 0.9107777761551399 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0595   0.7517   3.8136  22.3072  13.2140  10.5845
ValFun  Gradients: u/s

theta_cv |    0.32 |    0.31 |    0.00 |    3.07
seeker_angles |    0.00    0.00 |    0.09    0.10 |   -0.99   -1.00 |    1.00    1.00
cs_angles |  0.0012  0.0031 |  0.0935  0.0976 | -0.9947 -0.9988 |  0.9952  0.9981
optical_flow |  0.0002 -0.0002 |  0.0290  0.0268 | -1.2202 -1.4345 |  1.2723  1.2644
v_err    | -0.0091 |  0.0567 | -0.4521 |  0.1550
landing_rewards |    8.26 |    3.79 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.05
tracking_rewards |  -28.27 |    6.26 |  -71.31 |  -18.34
steps    |     376 |      21 |     332 |     416
***** Episode 34148, Mean R = -25.9  Std R = 12.1  Min R = -74.6
PolicyLoss: -0.00811
Policy_Beta: 0.1
Policy_Entropy: 0.126
Policy_KL: 0.00136
Policy_SD: 0.57
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.21e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.955
VF_0_Loss : 0.0151


ADV1:  -0.0008980475720542141 0.013766496164636221 0.06941444917140327 -0.09644755431751295
ADV2:  0.013358506296226225 0.92493743787021

attitude |   -0.10    0.06   -0.00 |    1.17    0.67    1.82 |   -3.14   -1.55   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.08    0.08    0.05
a_f      |    0.04    0.01 |    0.66    1.81 |   -1.47   -3.07 |    1.54    3.11
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.03    0.03    0.03
w_rewards |   -0.60 |    0.35 |   -1.88 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.30 |    0.00 |    2.90
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -1.00 |    1.00    1.00
cs_angles |  0.0025  0.0003 |  0.0947  0.0922 | -0.9961 -0.9967 |  0.9993  0.9983
optical_flow |  0.0000 -0.0001 |  0.0285  0.0249 | -1.2957 -1.0382 |  1.5366  0.9248
v_err    | -0.0089 |  0.0568 | -0.4518 |  0.1635
landing_rewards |    8.52 |    3.55 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.01   -0.01   -0.06 |    1.15    0.65    1.84 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.08 |    0.09    0.08    0.05
a_f      |   -0.00   -0.07 |    0.65    1.85 |   -1.50   -3.14 |    1.47    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.04   -0.03 |    0.04    0.03    0.03
w_rewards |   -0.62 |    0.43 |   -3.53 |   -0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.31 |    0.00 |    2.96
seeker_angles |    0.00   -0.00 |    0.09    0.09 |   -0.99   -0.99 |    0.99    0.99
cs_angles |  0.0005 -0.0024 |  0.0930  0.0939 | -0.9863 -0.9873 |  0.9945  0.9888
optical_flow | -0.0001 -0.0001 |  0.0279  0.0253 | -0.9304 -1.1412 |  1.3880  1.2185
v_err    | -0.0090 |  0.0569 | -0.4524 |  0.1640
landing_rewards |    8.29 |    3.76 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.03   -0.04   -0.05 |    1.22    0.67    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.09    0.08    0.05
a_f      |   -0.04    0.00 |    0.67    1.81 |   -1.44   -3.14 |    1.40    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.04 |    0.03    0.02    0.02
w_rewards |   -0.62 |    0.40 |   -3.35 |   -0.02
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.32 |    0.31 |    0.00 |    3.08
seeker_angles |    0.00    0.00 |    0.09    0.10 |   -1.00   -1.00 |    0.99    0.98
cs_angles |  0.0002  0.0022 |  0.0947  0.0963 | -0.9983 -1.0000 |  0.9875  0.9814
optical_flow | -0.0000 -0.0001 |  0.0287  0.0252 | -1.3653 -1.1692 |  1.2377  1.0164
v_err    | -0.0095 |  0.0570 | -0.5002 |  0.1282
landing_rewards |    8.16 |    3.87 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.02    0.03   -0.01 |    1.21    0.65    1.84 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.09    0.08    0.05
a_f      |    0.04    0.00 |    0.66    1.83 |   -1.40   -3.10 |    1.46    3.12
w_f      |   -0.00   -0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.03    0.03    0.03
w_rewards |   -0.61 |    0.36 |   -2.56 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.30 |    0.00 |    3.01
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -0.99 |    1.00    0.98
cs_angles |  0.0014  0.0004 |  0.0912  0.0905 | -0.9912 -0.9886 |  0.9984  0.9822
optical_flow | -0.0001 -0.0003 |  0.0272  0.0248 | -1.2227 -0.8619 |  1.5127  1.1363
v_err    | -0.0091 |  0.0566 | -0.4544 |  0.1509
landing_rewards |    8.00 |    4.00 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.08    0.08    0.05
a_f      |    0.07   -0.20 |    0.67    1.74 |   -1.41   -3.13 |    1.46    3.12
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.04 |    0.03    0.03    0.02
w_rewards |   -0.62 |    0.36 |   -1.98 |   -0.01
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.31 |    0.00 |    2.93
seeker_angles |   -0.00    0.00 |    0.09    0.09 |   -0.99   -0.99 |    0.98    1.00
cs_angles | -0.0007  0.0004 |  0.0925  0.0937 | -0.9855 -0.9913 |  0.9762  0.9966
optical_flow |  0.0001 -0.0002 |  0.0289  0.0270 | -1.9199 -1.6514 |  1.4519  1.0914
v_err    | -0.0088 |  0.0569 | -0.4593 |  0.1573
landing_rewards |    8.61 |    3.46 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.09 |    0.10
tracking_rewards |  -27.19 |    5.54 |  -47.39 |  -17.44
steps    |     376 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.08   -0.09 |    0.08    0.08    0.06
a_f      |   -0.00   -0.02 |    0.65    1.86 |   -1.35   -3.13 |    1.54    3.11
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.04   -0.03 |    0.03    0.04    0.02
w_rewards |   -0.69 |    0.43 |   -2.89 |   -0.02
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.31 |    0.00 |    3.04
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -0.99 |    0.98    1.00
cs_angles |  0.0006  0.0028 |  0.0938  0.0916 | -0.9982 -0.9949 |  0.9759  0.9996
optical_flow |  0.0000 -0.0001 |  0.0287  0.0269 | -1.1734 -1.0188 |  1.1996  1.0119
v_err    | -0.0087 |  0.0572 | -0.4936 |  0.1419
landing_rewards |    8.48 |    3.59 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.04
tracking_rewards |  -26.97 |    5.78 |  -53.66 |  -15.06
steps    |     376 |  

attitude |   -0.01   -0.02    0.22 |    1.13    0.67    1.82 |   -3.14   -1.52   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.08    0.09    0.05
a_f      |   -0.01    0.26 |    0.68    1.81 |   -1.47   -3.14 |    1.52    3.12
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.02    0.03    0.03
w_rewards |   -0.70 |    0.40 |   -1.93 |   -0.01
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.31 |    0.32 |    0.00 |    3.03
seeker_angles |   -0.00    0.00 |    0.09    0.09 |   -0.99   -1.00 |    0.98    0.96
cs_angles | -0.0005  0.0012 |  0.0948  0.0946 | -0.9916 -0.9979 |  0.9837  0.9602
optical_flow |  0.0001 -0.0002 |  0.0278  0.0254 | -1.0761 -1.2719 |  1.3756  1.2476
v_err    | -0.0083 |  0.0566 | -0.4521 |  0.1414
landing_rewards |    8.90 |    3.12 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.01    0.03    0.02 |    1.15    0.63    1.82 |   -3.14   -1.53   -3.14 |    3.14    1.52    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.09    0.08    0.05
a_f      |    0.04    0.02 |    0.63    1.81 |   -1.45   -3.13 |    1.42    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.03    0.02    0.02
w_rewards |   -0.66 |    0.38 |   -2.30 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.30 |    0.00 |    3.03
seeker_angles |   -0.00   -0.00 |    0.09    0.09 |   -1.00   -1.00 |    0.99    1.00
cs_angles | -0.0009 -0.0004 |  0.0889  0.0891 | -0.9969 -0.9969 |  0.9918  0.9954
optical_flow |  0.0001 -0.0001 |  0.0286  0.0268 | -1.2731 -1.2223 |  1.2218  1.0667
v_err    | -0.0081 |  0.0565 | -0.4520 |  0.1381
landing_rewards |    8.65 |    3.42 |    0.00 |   10.00
landing_margin |   -0

glideslope |    2.82 |   12.71 |    0.01 |  913.60
norm_af  |    1.74 |    0.92 |    0.14 |    3.33
norm_wf  |    0.02 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.05    0.07    0.08 |    1.19    0.70    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.08    0.08    0.05
a_f      |    0.08    0.10 |    0.70    1.83 |   -1.50   -3.07 |    1.52    3.11
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.03    0.02    0.03
w_rewards |   -0.65 |    0.36 |   -1.81 |   -0.01
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.31 |    0.00 |    2.92
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -1.00 |    1.

thrust   |   -0.00    0.00    0.00 |    0.71    0.71    0.71 |   -3.46   -3.44   -3.46 |    3.46    3.46    3.46
norm_thrust |    0.96 |    0.77 |    0.00 |    3.46
fuel     |    1.71 |    0.21 |    1.23 |    2.39
rewards  |  -23.84 |    7.64 |  -54.66 |  -10.60
fuel_rewards |   -4.91 |    0.59 |   -6.83 |   -3.53
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.87 |   13.02 |    0.00 |  369.82
norm_af  |    1.73 |    0.88 |    0.06 |    3.32
norm_wf  |    0.02 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.02   -0.05   -0.05 |    1.23    0.65    1.84 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.08 |    0.09    0.08    0.05
a_f      |   -0.05   -0.06 |    0.65

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4463   0.7894   3.2155  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0054   0.0031   0.0102   8.0871   2.2896   2.8947
Update Cnt = 1210    ET =   1112.2   Stats:  Mean, Std, Min, Max
r_f      |  -16.09    0.39   -0.07 |  192.42  174.88  198.81 | -535.78 -408.39 -621.14 |  387.12  391.46  399.90
v_f      |    0.00   -0.00    0.01 |    0.05    0.05    0.08 |   -0.11   -0.12   -0.11 |    0.15    0.28    1.01
r_i      |  -39.23    7.97  -26.67 |  699.50  648.98  769.22 |-1354.73-1308.03-1343.99 | 1294.43 1376.67 1346.74
v_i      |    0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.10    0.10
norm_rf  |    2.38 |   36.10 |    0.01 |  636.99
norm_vf  |    0.08 |    0.06 |    0.04 |    1.06
gs_f     |    1.29 |    1.70 |    0.01 |   11.44
thrust   |   -0.01   -0.00    0.00 |    0.72    0.72    0.72 |   -3.46   -3.45   -3.46 |    3.46    3.46    3.46
norm_thrust |    

ADV1:  -0.003463988621020602 0.014054104142643796 0.06614138698671757 -0.07760489101841427
ADV2:  0.026355777987226693 0.9255343408819455 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9407   0.8338   4.4403  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0038   0.0021   0.0088   8.0871   2.2896   2.8947
***** Episode 37837, Mean R = -23.4  Std R = 6.8  Min R = -37.9
PolicyLoss: -0.0122
Policy_Beta: 0.1
Policy_Entropy: 0.131
Policy_KL: 0.00142
Policy_SD: 0.558
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.35e+07
VF_0_ExplainedVarNew: 0.961
VF_0_ExplainedVarOld: 0.959
VF_0_Loss : 0.014


ADV1:  0.0030407878449965255 0.01505510347422596 0.13226771733396664 -0.1444562537544002
ADV2:  -0.0034495238272911847 0.8832472573284262 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2160   0.5221   2.6322  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0018   0.0078   8.0871   2.2896   2.8947


ADV1:  0.001237528644215599 0.011039172708274973 0.05768502863189662 -0.07021423063800475
ADV2:  0.011173387530490636 0.8810277602863646 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3696   0.7973   3.3111  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0008   0.0033   8.0871   2.2896   2.8947
***** Episode 38116, Mean R = -22.9  Std R = 5.7  Min R = -36.2
PolicyLoss: -0.0234
Policy_Beta: 0.1
Policy_Entropy: 0.131
Policy_KL: 0.0011
Policy_SD: 0.569
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.36e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.0149


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0035078207731465963 0.014329164779125617 0.1047019985955363 -0.11388010695752526
ADV2:  0.0192490500964832 0.9081172505971964 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3173   1.5683   6.7803  22.3072  13.2140  10.5845
ValFun  Gradie

***** Episode 38364, Mean R = -25.2  Std R = 5.9  Min R = -39.4
PolicyLoss: -0.0182
Policy_Beta: 0.1
Policy_Entropy: 0.131
Policy_KL: 0.0016
Policy_SD: 0.567
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.37e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 0.0159


ADV1:  0.0034785815974929827 0.012714051955511315 0.05876533898362596 -0.1666550211783343
ADV2:  -0.0029572919837722094 0.8361348803175379 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2346   0.9447   4.6035  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0036   0.0023   0.0090   8.0871   2.2896   2.8947
***** Episode 38395, Mean R = -25.1  Std R = 8.6  Min R = -48.8
PolicyLoss: -0.0221
Policy_Beta: 0.1
Policy_Entropy: 0.13
Policy_KL: 0.000845
Policy_SD: 0.58
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.37e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.971
VF_0_Loss : 0.016


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6587   1.4935   7.4315  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0009   0.0035   8.0871   2.2896   2.8947
***** Episode 38643, Mean R = -22.8  Std R = 5.8  Min R = -38.0
PolicyLoss: -0.0135
Policy_Beta: 0.1
Policy_Entropy: 0.133
Policy_KL: 0.00132
Policy_SD: 0.552
Policy_lr_mult: 0.198
Steps: 1.14e+04
TotalSteps: 1.38e+07
VF_0_ExplainedVarNew: 0.97
VF_0_ExplainedVarOld: 0.966
VF_0_Loss : 0.0159


ADV1:  0.0012326214800552594 0.012224093674256207 0.060467027152735775 -0.07127518441206115
ADV2:  0.009666801509893071 0.8995146939229686 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6591   0.7920   3.4827  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0009   0.0033   8.0871   2.2896   2.8947
***** Episode 38674, Mean R = -25.6  Std R = 8.1  Min R = -46.2
PolicyLoss: -0.0204
Policy_Beta: 0.1
Policy_Entropy: 0.133
Policy_KL: 0.00107
Poli

ADV1:  -0.0007717711160893916 0.014376088834586352 0.11054290939306749 -0.21984736884725853
ADV2:  0.01370256435023212 0.8689995858603503 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9868   0.9454   4.4801  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0009   0.0035   8.0871   2.2896   2.8947
***** Episode 38922, Mean R = -23.8  Std R = 5.8  Min R = -34.3
PolicyLoss: -0.0142
Policy_Beta: 0.1
Policy_Entropy: 0.136
Policy_KL: 0.00135
Policy_SD: 0.551
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.39e+07
VF_0_ExplainedVarNew: 0.965
VF_0_ExplainedVarOld: 0.958
VF_0_Loss : 0.0167


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.0005398610046928724 0.013382652364177227 0.08983888687878105 -0.07798325661464739
ADV2:  0.0014771866041186992 0.9265762879847198 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5401   0.7576   3.4064  22.3072  13.2140  10.5845
ValFun  G

ADV1:  0.0006788827511996628 0.011448496633885932 0.23156430938039774 -0.0954511138156866
ADV2:  -0.004245675982298544 0.8774039587203426 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2090   0.8033   4.1516  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0017   8.0871   2.2896   2.8947
***** Episode 39201, Mean R = -23.3  Std R = 7.7  Min R = -49.0
PolicyLoss: -0.00332
Policy_Beta: 0.1
Policy_Entropy: 0.135
Policy_KL: 0.000861
Policy_SD: 0.559
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.4e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.974
VF_0_Loss : 0.015


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.0014055102744160882 0.010972409773129093 0.05717158763544067 -0.07896612506106909
ADV2:  0.0039007337079645776 0.9031048162301953 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2262   0.6784   2.9202  22.3072  13.2140  10.5845
ValFun  G

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0036991687577540224 0.014205207645415817 0.11264137505693689 -0.180870305958318
ADV2:  0.024849605574364508 0.8913629357624495 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8599   0.3974   2.2648  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0040   0.0025   0.0093   8.0871   2.2896   2.8947
***** Episode 39480, Mean R = -24.4  Std R = 7.7  Min R = -39.9
PolicyLoss: -0.0108
Policy_Beta: 0.1
Policy_Entropy: 0.135
Policy_KL: 0.00101
Policy_SD: 0.555
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.41e+07
VF_0_ExplainedVarNew: 0.969
VF_0_ExplainedVarOld: 0.963
VF_0_Loss : 0.0146


ADV1:  0.00021098229935253922 0.01363877586875894 0.07668752391571187 -0.12612580829213504
ADV2:  0.012256901591122155 0.8896433547713873 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0556   1.6197   8.1869  22.3072  13.2140  10.5845
ValFun  Gra

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.00023602094664593832 0.018132967324797435 0.0692085890654991 -0.3294841674125366
ADV2:  0.025605803496132312 0.7295412139049221 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4191   0.7700   3.8872  22.3072  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0010   0.0039   8.0871   2.2896   2.8947
***** Episode 39759, Mean R = -25.3  Std R = 10.5  Min R = -58.2
PolicyLoss: -0.0309
Policy_Beta: 0.1
Policy_Entropy: 0.131
Policy_KL: 0.000827
Policy_SD: 0.578
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.42e+07
VF_0_ExplainedVarNew: 0.967
VF_0_ExplainedVarOld: 0.951
VF_0_Loss : 0.0157


ADV1:  0.001014400408048085 0.011851546567809412 0.07226052675943961 -0.06767445121600306
ADV2:  0.007134095112793695 0.8937680581931049 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0723   0.4720   2.5255  22.3072  13.2140  10.5845
ValFun  Gr

cs_angles |  0.0041  0.0021 |  0.0909  0.0917 | -0.9927 -0.9948 |  0.9808  0.9685
optical_flow |  0.0001 -0.0000 |  0.0265  0.0257 | -1.1314 -1.2437 |  0.9861  1.1130
v_err    | -0.0089 |  0.0566 | -0.4537 |  0.1460
landing_rewards |    8.61 |    3.46 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.04
tracking_rewards |  -26.39 |    5.84 |  -50.38 |  -16.47
steps    |     375 |      21 |     334 |     416
***** Episode 40038, Mean R = -23.6  Std R = 6.5  Min R = -36.5
PolicyLoss: -0.0241
Policy_Beta: 0.1
Policy_Entropy: 0.133
Policy_KL: 0.000795
Policy_SD: 0.57
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.43e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 0.0176


ADV1:  -0.0011259850578987322 0.011328609881524752 0.11297060319270047 -0.11406091502341259
ADV2:  0.017063029828043436 0.8699819755457554 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1530   0.3888   2.2546  22.3072  13.2140  10.5845
ValFun  Gradients: u/

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.08 |    0.08    0.08    0.05
a_f      |   -0.03    0.11 |    0.65    1.81 |   -1.41   -3.14 |    1.46    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.04 |    0.03    0.03    0.03
w_rewards |   -0.65 |    0.37 |   -2.06 |   -0.02
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.31 |    0.00 |    3.01
seeker_angles |    0.01    0.00 |    0.09    0.09 |   -0.97   -1.00 |    1.00    0.98
cs_angles |  0.0063  0.0029 |  0.0924  0.0885 | -0.9723 -0.9968 |  0.9992  0.9834
optical_flow |  0.0000 -0.0002 |  0.0283  0.0272 | -1.2514 -1.0512 |  1.2593  1.0628
v_err    | -0.0090 |  0.0565 | -0.4526 |  0.1492
landing_rewards |    8.94 |    3.08 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.06
tracking_rewards |  -26.25 |    5.49 |  -48.44 |  -16.29
steps    |     376 |  

attitude |   -0.02   -0.03   -0.08 |    1.15    0.61    1.77 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.08 |    0.08    0.08    0.05
a_f      |   -0.03   -0.05 |    0.63    1.78 |   -1.46   -3.14 |    1.48    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.03    0.03    0.03
w_rewards |   -0.66 |    0.37 |   -1.95 |   -0.01
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.31 |    0.00 |    3.00
seeker_angles |    0.01    0.00 |    0.09    0.09 |   -0.98   -1.00 |    0.98    1.00
cs_angles |  0.0059  0.0040 |  0.0928  0.0927 | -0.9840 -0.9995 |  0.9849  0.9963
optical_flow |  0.0000 -0.0001 |  0.0271  0.0265 | -1.2927 -1.0066 |  1.0431  1.2751
v_err    | -0.0087 |  0.0563 | -0.4533 |  0.1679
landing_rewards |    8.71 |    3.35 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.10   -0.04   -0.07 |    1.29    0.65    1.92 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.09    0.08    0.05
a_f      |   -0.04   -0.02 |    0.64    1.94 |   -1.37   -3.14 |    1.48    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.04    0.03    0.03
w_rewards |   -0.67 |    0.37 |   -1.93 |   -0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.31 |    0.00 |    2.96
seeker_angles |    0.01    0.00 |    0.10    0.09 |   -1.00   -0.99 |    0.99    0.99
cs_angles |  0.0074  0.0010 |  0.0956  0.0918 | -0.9976 -0.9902 |  0.9927  0.9869
optical_flow | -0.0000 -0.0001 |  0.0268  0.0263 | -1.3393 -1.0421 |  1.0729  1.0317
v_err    | -0.0090 |  0.0565 | -0.4533 |  0.1418
landing_rewards |    8.52 |    3.55 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.08 |    0.09    0.08    0.05
a_f      |    0.02   -0.20 |    0.65    1.96 |   -1.48   -3.14 |    1.50    3.12
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.04 |    0.03    0.03    0.03
w_rewards |   -0.65 |    0.36 |   -2.16 |   -0.02
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.31 |    0.00 |    3.01
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -0.99 |    0.99    0.99
cs_angles |  0.0047  0.0027 |  0.0935  0.0932 | -0.9881 -0.9865 |  0.9894  0.9928
optical_flow | -0.0001  0.0000 |  0.0277  0.0265 | -1.0637 -1.2562 |  1.4196  1.6382
v_err    | -0.0087 |  0.0566 | -0.4519 |  0.1384
landing_rewards |    8.45 |    3.62 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.03
tracking_rewards |  -26.36 |    5.77 |  -55.77 |  -16.23
steps    |     373 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.06   -0.08 |    0.08    0.08    0.05
a_f      |   -0.04    0.08 |    0.64    1.85 |   -1.52   -3.11 |    1.34    3.11
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.03    0.03    0.03
w_rewards |   -0.62 |    0.35 |   -2.55 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.31 |    0.00 |    2.89
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -1.00 |    0.99    0.98
cs_angles |  0.0031  0.0023 |  0.0931  0.0890 | -0.9934 -0.9962 |  0.9922  0.9811
optical_flow | -0.0001 -0.0001 |  0.0261  0.0275 | -1.3016 -1.4780 |  1.0870  1.1095
v_err    | -0.0087 |  0.0567 | -0.4525 |  0.1231
landing_rewards |    8.29 |    3.76 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.04
tracking_rewards |  -26.18 |    5.59 |  -48.15 |  -14.78
steps    |     375 |  

attitude |    0.05   -0.00    0.01 |    1.13    0.69    1.75 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.08 |    0.10    0.08    0.05
a_f      |   -0.00    0.02 |    0.68    1.77 |   -1.51   -3.13 |    1.53    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.04 |    0.04    0.03    0.02
w_rewards |   -0.63 |    0.39 |   -2.50 |   -0.01
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.30 |    0.31 |    0.00 |    2.95
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -0.98 |    1.00    1.00
cs_angles |  0.0034  0.0049 |  0.0915  0.0917 | -0.9998 -0.9820 |  0.9951  0.9967
optical_flow | -0.0001  0.0001 |  0.0270  0.0266 | -1.1541 -1.2586 |  1.2215  1.0597
v_err    | -0.0087 |  0.0575 | -0.4526 |  0.2560
landing_rewards |    8.97 |    3.04 |    0.00 |   10.00
landing_margin |   -0

rewards  |  -22.20 |    9.08 | -137.47 |  -10.90
fuel_rewards |   -4.76 |    0.66 |   -9.85 |   -3.24
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.09 |   12.96 |    0.01 |  477.22
norm_af  |    1.78 |    0.89 |    0.05 |    3.20
norm_wf  |    0.02 |    0.01 |    0.00 |    0.05
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.11   -0.05    0.08 |    1.19    0.66    1.89 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.07   -0.08 |    0.09    0.08    0.05
a_f      |   -0.04    0.05 |    0.66    1.88 |   -1.51   -3.12 |    1.45    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.02   -0.04 |    0.04    0.03    0.02
w_rewards |   -0.65 |    0.45 |   -5.08 |    0.00
w_pena

ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0041   0.0024   0.0091   8.0871   2.2896   2.8947
Update Cnt = 1370    ET =    984.1   Stats:  Mean, Std, Min, Max
r_f      |   -6.36   -8.21    1.11 |  184.75  169.05  207.37 | -393.74 -369.20 -391.72 |  387.56  366.85  388.97
v_f      |    0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.13   -0.11   -0.13 |    0.11    0.13    0.13
r_i      |  -51.18  -53.84   21.02 |  686.58  649.59  773.67 |-1336.64-1290.56-1270.61 | 1323.68 1225.35 1253.22
v_i      |    0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.09 |    0.09    0.09    0.09
norm_rf  |    0.29 |    0.12 |    0.05 |    0.81
norm_vf  |    0.08 |    0.02 |    0.04 |    0.16
gs_f     |    1.27 |    2.38 |    0.01 |   34.33
thrust   |   -0.00    0.00    0.00 |    0.70    0.70    0.70 |   -3.43   -3.46   -3.46 |    3.45    3.44    3.46
norm_thrust |    0.95 |    0.77 |    0.00 |    3.46
fuel     |    1.64 |    0.21 |    1.16 |    2.64
rewards  |  -22.86 

ADV1:  0.00043726328975732384 0.012860566590675769 0.0799659788367722 -0.0924781260420734
ADV2:  0.011224121129470506 0.8924396076593561 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1277   1.0583   5.3977  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0012   8.0871   2.2896   2.8947
***** Episode 42797, Mean R = -23.6  Std R = 8.7  Min R = -45.0
PolicyLoss: -0.0183
Policy_Beta: 0.1
Policy_Entropy: 0.138
Policy_KL: 0.00149
Policy_SD: 0.556
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.53e+07
VF_0_ExplainedVarNew: 0.972
VF_0_ExplainedVarOld: 0.969
VF_0_Loss : 0.0144


ADV1:  0.0020053224436001804 0.011546044033031557 0.059608686673060296 -0.12726552187987017
ADV2:  -0.006142017906121621 0.9156037959371435 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9104   1.2822   6.2019  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0015   0.0055   8.0871   2.2896   2.894

ADV1:  -0.0034842983121391854 0.01250683896827857 0.05900417688283971 -0.08223852765450279
ADV2:  0.03307977278462883 0.9125463972301554 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.3254   2.6709  12.4321  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0040   0.0023   0.0089   8.0871   2.2896   2.8947
***** Episode 43076, Mean R = -24.3  Std R = 6.7  Min R = -38.8
PolicyLoss: -0.015
Policy_Beta: 0.1
Policy_Entropy: 0.139
Policy_KL: 0.00087
Policy_SD: 0.563
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.55e+07
VF_0_ExplainedVarNew: 0.972
VF_0_ExplainedVarOld: 0.969
VF_0_Loss : 0.0162


ADV1:  0.0013439695069332436 0.010865746075317389 0.07964495546222433 -0.09038671282369415
ADV2:  0.007542365909893002 0.8840928173895181 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7731   0.8459   4.3275  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0010   0.0035   8.0871   2.2896   2.8947
*

ADV1:  0.0032138332782626297 0.009978120496187317 0.05836046941437251 -0.0795537528956538
ADV2:  -0.016372261911074732 0.9119561403968569 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.8249   2.1837  10.3460  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0022   0.0082   8.0871   2.2896   2.8947
***** Episode 43355, Mean R = -21.1  Std R = 6.4  Min R = -38.8
PolicyLoss: -0.0121
Policy_Beta: 0.1
Policy_Entropy: 0.135
Policy_KL: 0.000864
Policy_SD: 0.566
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.56e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 0.0178


ADV1:  -0.0003958101186614647 0.009592519784790303 0.044805595321236624 -0.061964136639318754
ADV2:  0.019673076560996875 0.8922432504317559 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9073   1.1898   6.0882  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0022   8.0871   2.2896   2.

ADV1:  0.0018944494091473285 0.010132111949648854 0.09036063067869976 -0.0636932692940908
ADV2:  -0.0028705627376708013 0.8769312507954775 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8531   1.0006   4.5468  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0013   0.0052   8.0871   2.2896   2.8947
***** Episode 43634, Mean R = -21.6  Std R = 6.1  Min R = -36.9
PolicyLoss: -0.0131
Policy_Beta: 0.1
Policy_Entropy: 0.135
Policy_KL: 0.0011
Policy_SD: 0.553
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.57e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.979
VF_0_Loss : 0.0126


ADV1:  -0.00078192568501106 0.010357452859979816 0.061896169107423765 -0.1957663653186641
ADV2:  0.020521870099766058 0.8484272788614793 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7011   1.4398   6.7204  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0019   8.0871   2.2896   2.8947


ADV1:  -0.00101089331227096 0.011528561981768968 0.11505816486322484 -0.07736370235963357
ADV2:  0.016063914666359744 0.8946174829999349 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7403   1.2515   6.5627  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0009   0.0034   8.0871   2.2896   2.8947
***** Episode 43913, Mean R = -21.4  Std R = 7.4  Min R = -40.5
PolicyLoss: -0.0126
Policy_Beta: 0.1
Policy_Entropy: 0.134
Policy_KL: 0.001
Policy_SD: 0.568
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.58e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.972
VF_0_Loss : 0.0199


ADV1:  -0.00020717130281622424 0.011874527761477339 0.047991652659649706 -0.17334567975102266
ADV2:  0.021275524026646342 0.8419388851094718 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7643   2.0231  10.0629  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0004   0.0019   8.0871   2.2896   2.8947

ADV1:  -0.002229691387046438 0.010616883750316497 0.04909349332253143 -0.059702904762816186
ADV2:  0.023249330665689377 0.9258091388458318 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7256   0.8352   3.9804  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0015   0.0056   8.0871   2.2896   2.8947
***** Episode 44192, Mean R = -22.1  Std R = 6.1  Min R = -34.0
PolicyLoss: -0.0138
Policy_Beta: 0.1
Policy_Entropy: 0.135
Policy_KL: 0.000979
Policy_SD: 0.549
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.59e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.0127


ADV1:  0.0029176783237954865 0.012789553541957226 0.12623203179039943 -0.2756827500495367
ADV2:  -0.009638732230217538 0.8035897874103108 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2724   0.4903   2.5828  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0034   0.0020   0.0075   8.0871   2.2896   2.89

ADV1:  0.0018763729294855398 0.011380469074086037 0.05815529386902133 -0.06345531401206239
ADV2:  0.0014708432031824304 0.9060309505270793 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5826   1.7120   8.7146  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0013   0.0048   8.0871   2.2896   2.8947
***** Episode 44471, Mean R = -21.4  Std R = 6.8  Min R = -39.8
PolicyLoss: -0.0176
Policy_Beta: 0.1
Policy_Entropy: 0.136
Policy_KL: 0.000847
Policy_SD: 0.552
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.6e+07
VF_0_ExplainedVarNew: 0.976
VF_0_ExplainedVarOld: 0.973
VF_0_Loss : 0.0116


ADV1:  -4.7806510511602375e-05 0.01130541779657784 0.05503610691863813 -0.21625474702337366
ADV2:  0.022845694322378533 0.7956053900468223 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1207   0.5726   2.4828  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0018   8.0871   2.2896   2.89

ADV1:  -7.228712388732014e-05 0.009727830971666986 0.1258678193902088 -0.07184903097760398
ADV2:  0.012745709850111954 0.8343662038349532 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1996   0.7241   3.6276  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0012   8.0871   2.2896   2.8947
***** Episode 44750, Mean R = -21.6  Std R = 6.7  Min R = -40.4
PolicyLoss: -0.0157
Policy_Beta: 0.1
Policy_Entropy: 0.138
Policy_KL: 0.000858
Policy_SD: 0.555
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.61e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.0124


ADV1:  -0.0013566255607924136 0.011061114485677558 0.0679867510889009 -0.07607399281195884
ADV2:  0.02679017766969922 0.8668423556129213 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4469   0.8224   4.3551  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0010   0.0035   8.0871   2.2896   2.8947

ADV1:  0.0002560141754126307 0.00940424580313295 0.08371289310873442 -0.07000385822192456
ADV2:  0.010805201485963038 0.8784713768324017 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0831   0.8043   4.0072  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0003   0.0011   8.0871   2.2896   2.8947
***** Episode 45029, Mean R = -20.9  Std R = 6.6  Min R = -40.1
PolicyLoss: -0.0178
Policy_Beta: 0.1
Policy_Entropy: 0.138
Policy_KL: 0.00116
Policy_SD: 0.561
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.62e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.00961


ADV1:  -0.003015011195588614 0.012085799835720496 0.0699497437348679 -0.08742333127407653
ADV2:  0.022971807798980674 0.9436796957236113 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9215   0.3718   2.3476  24.4317  13.2140  10.5845
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0022   0.0079   8.0871   2.2896   2.8947


cs_angles |  0.0012  0.0010 |  0.0886  0.0871 | -0.9945 -0.9898 |  0.9829  0.9837
optical_flow | -0.0000  0.0000 |  0.0274  0.0258 | -1.3460 -1.3255 |  0.9295  1.2235
v_err    | -0.0088 |  0.0563 | -0.4533 |  0.1231
landing_rewards |    8.71 |    3.35 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.06
tracking_rewards |  -25.07 |    4.81 |  -49.96 |  -16.60
steps    |     375 |      20 |     331 |     421
***** Episode 45308, Mean R = -20.3  Std R = 5.8  Min R = -34.2
PolicyLoss: -0.014
Policy_Beta: 0.1
Policy_Entropy: 0.137
Policy_KL: 0.00146
Policy_SD: 0.543
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 1.63e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.00843


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0007670483261036098 0.013797874175036038 0.08366535309178152 -0.36852675857522554
ADV2:  0.0249140020365373 0.7096307071138579 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/

attitude |    0.01    0.01   -0.06 |    1.13    0.65    1.80 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.07   -0.07 |    0.08    0.08    0.07
a_f      |    0.01   -0.08 |    0.65    1.80 |   -1.46   -3.09 |    1.36    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.03    0.03    0.02
w_rewards |   -0.54 |    0.35 |   -2.38 |   -0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.31 |    0.00 |    2.99
seeker_angles |    0.00    0.01 |    0.09    0.09 |   -0.99   -1.00 |    0.99    0.99
cs_angles |  0.0019  0.0061 |  0.0890  0.0889 | -0.9887 -0.9998 |  0.9922  0.9863
optical_flow | -0.0002 -0.0001 |  0.0267  0.0260 | -1.0949 -1.1361 |  1.1447  1.0874
v_err    | -0.0094 |  0.0581 | -0.6334 |  0.1253
landing_rewards |    9.16 |    2.77 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.08    0.08    0.05
a_f      |    0.00    0.08 |    0.70    1.89 |   -1.50   -3.13 |    1.47    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.54 |    0.35 |   -2.25 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.30 |    0.00 |    3.05
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -0.97 |    0.99    0.99
cs_angles |  0.0002  0.0044 |  0.0854  0.0886 | -0.9941 -0.9692 |  0.9900  0.9934
optical_flow | -0.0001  0.0000 |  0.0287  0.0272 | -1.3490 -1.0735 |  1.3913  1.3910
v_err    | -0.0091 |  0.0574 | -0.4532 |  0.1262
landing_rewards |    8.94 |    3.08 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.07 |    0.05
tracking_rewards |  -25.14 |    4.62 |  -44.56 |  -15.99
steps    |     375 |  

attitude |    0.02    0.02    0.13 |    1.28    0.64    1.94 |   -3.14   -1.57   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.08 |    0.09    0.08    0.05
a_f      |    0.02    0.20 |    0.64    1.93 |   -1.44   -3.13 |    1.45    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.55 |    0.33 |   -2.05 |   -0.01
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.30 |    0.00 |    2.97
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -0.99 |    0.99    1.00
cs_angles |  0.0016  0.0020 |  0.0868  0.0891 | -0.9986 -0.9884 |  0.9909  0.9976
optical_flow | -0.0000 -0.0001 |  0.0267  0.0270 | -1.3637 -0.9258 |  1.0435  1.2482
v_err    | -0.0090 |  0.0571 | -0.4535 |  0.1532
landing_rewards |    9.03 |    2.96 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.01    0.00    0.00 |    0.70    0.71    0.70 |   -3.44   -3.46   -3.46 |    3.40    3.44    3.42
norm_thrust |    0.95 |    0.77 |    0.00 |    3.46
fuel     |    1.65 |    0.20 |    1.15 |    2.24
rewards  |  -21.52 |    6.56 |  -46.28 |  -10.29
fuel_rewards |   -4.72 |    0.57 |   -6.40 |   -3.29
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.83 |   12.67 |    0.01 |  427.03
norm_af  |    1.76 |    0.89 |    0.04 |    3.35
norm_wf  |    0.02 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.04    0.02    0.29 |    1.20    0.66    1.83 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.08    0.07    0.05
a_f      |    0.01    0.36 |    0.68

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8923   0.8977   4.3561  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0008   8.0871   2.2896   2.8947
Update Cnt = 1510    ET =    936.9   Stats:  Mean, Std, Min, Max
r_f      |   -1.34   40.93   16.05 |  181.32  162.52  201.64 | -385.37 -389.59 -382.51 |  391.16  383.09  371.40
v_f      |   -0.00   -0.01   -0.00 |    0.05    0.04    0.05 |   -0.13   -0.13   -0.12 |    0.11    0.08    0.14
r_i      |   17.12  108.82   51.89 |  701.89  608.11  772.92 |-1309.69-1260.22-1352.21 | 1329.02 1273.22 1286.17
v_i      |   -0.00   -0.01   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.09    0.08    0.10
norm_rf  |    0.26 |    0.12 |    0.04 |    0.73
norm_vf  |    0.08 |    0.02 |    0.02 |    0.15
gs_f     |    1.30 |    1.76 |    0.02 |   21.29
thrust   |   -0.00    0.00    0.00 |    0.70    0.72    0.71 |   -3.46   -3.44   -3.46 |    3.45    3.46    3.45
norm_thrust |    

ADV1:  -0.00931710585510295 0.018078134538255932 0.520901188967682 -0.12134403326245635
ADV2:  0.02981501819146723 0.8707706922384069 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3293   1.3885   5.9609  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0095   0.0059   0.0237   8.0871   2.2896   2.8947
***** Episode 47137, Mean R = -21.8  Std R = 5.9  Min R = -37.7
PolicyLoss: -0.00149
Policy_Beta: 0.1
Policy_Entropy: 0.138
Policy_KL: 0.000845
Policy_SD: 0.556
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.7e+07
VF_0_ExplainedVarNew: 0.956
VF_0_ExplainedVarOld: 0.933
VF_0_Loss : 0.00802


ADV1:  0.0016848300380529913 0.01603100931118868 0.15622610125809963 -0.14636978781490884
ADV2:  -0.017254482151440396 0.7885775676113176 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4546   0.5460   3.0319  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0032   0.0016   0.0072   8.0871   2.2896   2.8947
U

ADV1:  0.0018560857800639621 0.01126375303920588 0.06141518004514962 -0.12541311582773895
ADV2:  0.0009923287677927708 0.893654097723396 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1739   1.0908   5.2670  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0014   0.0060   8.0871   2.2896   2.8947
***** Episode 47416, Mean R = -21.1  Std R = 6.8  Min R = -42.7
PolicyLoss: -0.0172
Policy_Beta: 0.1
Policy_Entropy: 0.138
Policy_KL: 0.00116
Policy_SD: 0.562
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.71e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.972
VF_0_Loss : 0.0116


ADV1:  0.0015145084941788373 0.011786788406851309 0.08268614207494385 -0.1344387395947052
ADV2:  0.008694478166265849 0.8566497462566511 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1791   0.4166   2.2405  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0010   0.0039   8.0871   2.2896   2.8947
*

ADV1:  0.003132576388837493 0.009884503185317218 0.08381313827274972 -0.10138477624686416
ADV2:  -0.006691524243240588 0.8622556740148858 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8740   1.1912   6.3413  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0035   0.0022   0.0079   8.0871   2.2896   2.8947
***** Episode 47695, Mean R = -22.7  Std R = 7.9  Min R = -41.0
PolicyLoss: -0.0191
Policy_Beta: 0.1
Policy_Entropy: 0.136
Policy_KL: 0.00137
Policy_SD: 0.572
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.72e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00921


ADV1:  -0.001013615262210497 0.011158836554486854 0.05962289921630959 -0.09427144830364448
ADV2:  0.016976788368496067 0.8979271923742095 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2833   0.6428   3.0589  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0013   0.0048   8.0871   2.2896   2.894

ADV1:  0.0009335745275837876 0.008321539591625942 0.07595774431922281 -0.04965605855575905
ADV2:  -0.00632540566500874 0.8642347217570356 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4070   0.6662   3.5446  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0024   8.0871   2.2896   2.8947
***** Episode 47974, Mean R = -18.0  Std R = 5.3  Min R = -29.9
PolicyLoss: -0.007
Policy_Beta: 0.1
Policy_Entropy: 0.14
Policy_KL: 0.00106
Policy_SD: 0.55
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.73e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.0116


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0017651599436646023 0.01158032694382012 0.11947186792841757 -0.07987078951236637
ADV2:  0.021285910176886715 0.8794393634548551 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5600   0.8894   4.8994  29.5271  16.8478  11.1535
ValFun  Gradi

ADV1:  0.00013090894131275908 0.011322060945631459 0.06526944002064375 -0.07833932597770642
ADV2:  0.012687945049073373 0.8951273107523076 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.0995   1.7934   9.0439  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0004   8.0871   2.2896   2.8947
***** Episode 48253, Mean R = -21.3  Std R = 6.2  Min R = -32.9
PolicyLoss: -0.0177
Policy_Beta: 0.1
Policy_Entropy: 0.142
Policy_KL: 0.000809
Policy_SD: 0.551
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.74e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.972
VF_0_Loss : 0.00937


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.0010668584006881532 0.010279889392905977 0.0678517276147419 -0.07795964551429341
ADV2:  0.007296031296092521 0.8750939462693947 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3733   0.9193   4.9303  29.5271  16.8478  11.1535
ValFun  

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -6.0458302685797504e-05 0.0098791894423839 0.14683485646434125 -0.07983505666255947
ADV2:  0.016891502432870225 0.8340027124896056 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3326   0.6032   3.0006  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0004   8.0871   2.2896   2.8947
***** Episode 48532, Mean R = -21.6  Std R = 8.0  Min R = -47.9
PolicyLoss: -0.0207
Policy_Beta: 0.1
Policy_Entropy: 0.142
Policy_KL: 0.0011
Policy_SD: 0.559
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.75e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.0106


ADV1:  -0.001724310481542604 0.01134021990721238 0.14546115699570694 -0.05158423655811477
ADV2:  0.015720874046524693 0.9256760116703452 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6602   1.1468   5.9628  29.5271  16.8478  11.1535
ValFun  Grad

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0008949277515990642 0.013230815837632656 0.15437499294694756 -0.2029369253738761
ADV2:  0.012352086997523505 0.813013637445074 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8569   0.7551   3.7154  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0025   8.0871   2.2896   2.8947
***** Episode 48811, Mean R = -23.9  Std R = 7.0  Min R = -42.1
PolicyLoss: -0.012
Policy_Beta: 0.1
Policy_Entropy: 0.139
Policy_KL: 0.00161
Policy_SD: 0.566
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 1.76e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.969
VF_0_Loss : 0.0101


ADV1:  0.00323633482533092 0.009361680654333715 0.2085509272007227 -0.05181143917935591
ADV2:  -0.03894569240451178 0.8142110601481007 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3855   1.1377   5.4414  29.5271  16.8478  11.1535
ValFun  Gradien

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0019446387298995957 0.013752555863610636 0.05414865812331948 -0.3293028542061651
ADV2:  0.03478953825068257 0.7335700746452108 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3018   0.6892   2.9651  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0032   0.0017   0.0064   8.0871   2.2896   2.8947
***** Episode 49090, Mean R = -21.7  Std R = 8.5  Min R = -53.3
PolicyLoss: -0.0309
Policy_Beta: 0.1
Policy_Entropy: 0.138
Policy_KL: 0.00108
Policy_SD: 0.561
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 1.77e+07
VF_0_ExplainedVarNew: 0.977
VF_0_ExplainedVarOld: 0.965
VF_0_Loss : 0.00664


ADV1:  0.0027987327704189963 0.01364650082450708 0.06480846332032747 -0.3167387250471202
ADV2:  0.004423208157388842 0.750870672847547 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8194   0.4051   1.8844  29.5271  16.8478  11.1535
ValFun  Gradi

***** Episode 49338, Mean R = -22.4  Std R = 6.9  Min R = -36.6
PolicyLoss: -0.0193
Policy_Beta: 0.1
Policy_Entropy: 0.139
Policy_KL: 0.00151
Policy_SD: 0.569
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.78e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.971
VF_0_Loss : 0.00981


ADV1:  -0.0006313027619382639 0.010677638937393678 0.049046822292348635 -0.07089687975694076
ADV2:  0.016980779162883566 0.9046328153392258 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0237   0.7124   3.9855  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0004   0.0016   8.0871   2.2896   2.8947
***** Episode 49369, Mean R = -20.8  Std R = 6.3  Min R = -36.6
PolicyLoss: -0.0166
Policy_Beta: 0.1
Policy_Entropy: 0.141
Policy_KL: 0.000966
Policy_SD: 0.55
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.78e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.00913


ADV1:  -0.0001719865261911684 0.009564697543903274 0.

optical_flow | -0.0002 -0.0000 |  0.0269  0.0258 | -1.3398 -1.3567 |  1.1975  1.0944
v_err    | -0.0084 |  0.0554 | -0.4513 |  0.1245
landing_rewards |    9.13 |    2.82 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.05
tracking_rewards |  -24.18 |    4.68 |  -38.87 |  -15.26
steps    |     376 |      21 |     333 |     416
***** Episode 49648, Mean R = -20.7  Std R = 6.6  Min R = -43.0
PolicyLoss: -0.0169
Policy_Beta: 0.1
Policy_Entropy: 0.14
Policy_KL: 0.00104
Policy_SD: 0.557
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.79e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.00789


ADV1:  -0.0013150041791151119 0.010134114218378308 0.04402948091323142 -0.1273176038968612
ADV2:  0.030634148143051366 0.8385791435809242 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3831   0.6578   3.4975  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0009   0.0034   8.0871   2.2896   2.8947
*

attitude |   -0.03   -0.03   -0.00 |    1.23    0.67    1.86 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.08 |    0.08    0.07    0.05
a_f      |   -0.04   -0.01 |    0.66    1.85 |   -1.44   -3.12 |    1.43    3.12
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.03    0.02    0.02
w_rewards |   -0.48 |    0.33 |   -1.75 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.31 |    0.00 |    3.12
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.99   -1.00 |    0.97    1.00
cs_angles |  0.0020  0.0028 |  0.0848  0.0886 | -0.9929 -0.9991 |  0.9746  0.9952
optical_flow | -0.0001 -0.0001 |  0.0249  0.0254 | -1.0378 -1.1050 |  0.9752  1.1417
v_err    | -0.0086 |  0.0558 | -0.4535 |  0.1418
landing_rewards |    9.23 |    2.67 |    0.00 |   10.00
landing_margin |   -0

rewards  |  -21.05 |    8.37 | -114.93 |   -9.37
fuel_rewards |   -4.58 |    0.58 |   -6.93 |   -0.57
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.90 |   12.93 |    0.00 |  449.22
norm_af  |    1.76 |    0.88 |    0.12 |    3.36
norm_wf  |    0.02 |    0.01 |    0.00 |    0.11
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.08   -0.02    0.16 |    1.20    0.66    1.86 |   -3.14   -1.56   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.08 |    0.08    0.08    0.05
a_f      |   -0.02    0.20 |    0.65    1.85 |   -1.43   -3.13 |    1.35    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.03   -0.04 |    0.04    0.03    0.03
w_rewards |   -0.48 |    0.34 |   -2.08 |    0.00
w_pena

Update Cnt = 1630    ET =    891.0   Stats:  Mean, Std, Min, Max
r_f      |   11.14    8.16   -1.91 |  180.38  179.58  197.48 | -390.42 -393.77 -382.93 |  393.37  377.15  375.43
v_f      |   -0.00   -0.00    0.00 |    0.05    0.04    0.05 |   -0.10   -0.11   -0.12 |    0.10    0.08    0.10
r_i      |   26.06   49.98  -39.03 |  691.33  643.18  769.67 |-1328.12-1285.41-1270.66 | 1297.99 1252.78 1299.93
v_i      |   -0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.07    0.09
norm_rf  |    0.25 |    0.10 |    0.03 |    0.56
norm_vf  |    0.07 |    0.02 |    0.03 |    0.14
gs_f     |    1.29 |    1.69 |    0.01 |   13.22
thrust   |    0.00    0.00    0.00 |    0.69    0.69    0.68 |   -3.36   -3.45   -3.45 |    3.46    3.44    3.43
norm_thrust |    0.91 |    0.76 |    0.00 |    3.46
fuel     |    1.59 |    0.19 |    1.20 |    2.21
rewards  |  -20.35 |    6.84 |  -62.05 |  -10.54
fuel_rewards |   -4.57 |    0.55 |   -6.37 |   -3.44
glideslope_rewards |

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3879   0.6077   3.2175  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0009   0.0033   8.0871   2.2896   2.8947
***** Episode 50857, Mean R = -20.0  Std R = 5.8  Min R = -36.3
PolicyLoss: -0.0069
Policy_Beta: 0.1
Policy_Entropy: 0.145
Policy_KL: 0.000803
Policy_SD: 0.539
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.84e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 0.0056


ADV1:  0.002932008069269654 0.009682191125943953 0.04590172127569592 -0.12369724878647059
ADV2:  -0.0036797207388180315 0.8393881026203541 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7800   0.9195   4.7523  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0037   0.0023   0.0078   8.0871   2.2896   2.8947
Update Cnt = 1640    ET =    891.2   Stats:  Mean, Std, Min, Max
r_f      |   11.41   14.43    5.13 |  186.77  164.20  198.67 | -393.02 -391.61 

ADV1:  -0.004893016996526256 0.011021846157219854 0.05291723253552333 -0.11662918745412554
ADV2:  0.05001448965887421 0.8894518347312509 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7627   1.1896   5.5623  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0057   0.0034   0.0126   8.0871   2.2896   2.8947
***** Episode 51136, Mean R = -21.0  Std R = 6.4  Min R = -36.2
PolicyLoss: -0.0205
Policy_Beta: 0.1
Policy_Entropy: 0.142
Policy_KL: 0.00122
Policy_SD: 0.547
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.85e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.00549


ADV1:  0.0018001950151063106 0.00905510646539366 0.07874904119436454 -0.05180583915129355
ADV2:  -0.011576247881444556 0.8888904114714509 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2596   1.4180   7.3501  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0012   0.0047   8.0871   2.2896   2.8947

ADV1:  -0.0013494960490059652 0.010164950204919646 0.037747604291988424 -0.20230901718823102
ADV2:  0.03243224616391049 0.7983446938474414 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.0002   1.6052   8.9081  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0010   0.0037   8.0871   2.2896   2.8947
***** Episode 51415, Mean R = -19.1  Std R = 6.6  Min R = -38.5
PolicyLoss: -0.026
Policy_Beta: 0.1
Policy_Entropy: 0.141
Policy_KL: 0.00133
Policy_SD: 0.556
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 1.86e+07
VF_0_ExplainedVarNew: 0.981
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 0.00532


ADV1:  -0.001928070268185237 0.011498937503964144 0.05382368880651095 -0.06391449294529658
ADV2:  0.022129060656556867 0.9229393586565326 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9820   1.2618   6.1302  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0025   0.0015   0.0052   8.0871   2.2896   2.894

ADV1:  -0.003328888920641414 0.009595216746229509 0.044606867164968776 -0.06004095968728963
ADV2:  0.038469804370133066 0.8902375895604888 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4938   1.1221   5.2994  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0041   0.0024   0.0086   8.0871   2.2896   2.8947
***** Episode 51694, Mean R = -21.6  Std R = 6.5  Min R = -34.5
PolicyLoss: -0.0211
Policy_Beta: 0.1
Policy_Entropy: 0.142
Policy_KL: 0.000941
Policy_SD: 0.559
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.87e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.00415


ADV1:  0.004783806913140466 0.008966623208897776 0.055559134685185974 -0.06142612571595421
ADV2:  -0.021038590618139275 0.8729649324805169 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4242   0.8089   3.8996  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0054   0.0032   0.0123   8.0871   2.2896   2.

ADV1:  -0.001790840555137855 0.009822996540529235 0.04827682450273485 -0.09107396464297302
ADV2:  0.023456858448586228 0.9124406060890289 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0228   1.3625   6.3115  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0015   0.0059   8.0871   2.2896   2.8947
***** Episode 51973, Mean R = -20.8  Std R = 6.2  Min R = -36.8
PolicyLoss: -0.0144
Policy_Beta: 0.1
Policy_Entropy: 0.143
Policy_KL: 0.000965
Policy_SD: 0.555
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.88e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.00378


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.0019211625373514749 0.008355728873551018 0.0475234461737532 -0.07759724498858378
ADV2:  0.000260934671010896 0.8817759074069518 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8964   0.9637   5.0659  29.5271  16.8478  11.1535
ValFun  G

ADV1:  -0.00024248515654426905 0.010090497225129363 0.05415126539501247 -0.07267202421960062
ADV2:  0.017162344142685575 0.8672831020405642 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5746   0.6304   3.2612  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0009   8.0871   2.2896   2.8947
***** Episode 52252, Mean R = -22.6  Std R = 8.3  Min R = -44.4
PolicyLoss: -0.0198
Policy_Beta: 0.1
Policy_Entropy: 0.141
Policy_KL: 0.00105
Policy_SD: 0.574
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.89e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.00478


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0005533297236743128 0.008628212384361 0.0433635745833148 -0.06304153104467196
ADV2:  0.023713855815249017 0.859431604729276 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1504   0.2875   1.9640  29.5271  16.8478  11.1535
ValFun  Gra

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.00012068294769102543 0.008615620678063303 0.04087163895805115 -0.05509532678026041
ADV2:  0.016477668103192587 0.8961575975390358 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4005   0.5881   2.7076  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0019   8.0871   2.2896   2.8947
***** Episode 52531, Mean R = -19.2  Std R = 5.1  Min R = -31.3
PolicyLoss: -0.0194
Policy_Beta: 0.1
Policy_Entropy: 0.145
Policy_KL: 0.000905
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 1.9e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.00455


ADV1:  0.0007510705302827722 0.009234631283494454 0.041670361860280336 -0.10387345289012084
ADV2:  0.01704102969011312 0.8398684060823636 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4301   0.8295   4.4444  29.5271  16.8478  11.1535
ValFun  

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.0032870060276365084 0.007666431690424189 0.05693783654485962 -0.07499933844468465
ADV2:  -0.02427011636519551 0.879559008652759 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7385   1.5892   8.3311  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0039   0.0025   0.0085   8.0871   2.2896   2.8947
***** Episode 52810, Mean R = -19.6  Std R = 5.3  Min R = -34.0
PolicyLoss: -0.014
Policy_Beta: 0.1
Policy_Entropy: 0.143
Policy_KL: 0.00107
Policy_SD: 0.554
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 1.91e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.00418


ADV1:  -0.004454094078632705 0.011419776279117977 0.04101263420843315 -0.07898633723990041
ADV2:  0.042800545119838496 0.9020442329576215 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1591   1.4475   6.9561  29.5271  16.8478  11.1535
ValFun  Grad

***** Episode 53058, Mean R = -20.6  Std R = 5.7  Min R = -34.1
PolicyLoss: -0.025
Policy_Beta: 0.1
Policy_Entropy: 0.146
Policy_KL: 0.0016
Policy_SD: 0.549
Policy_lr_mult: 0.198
Steps: 1.14e+04
TotalSteps: 1.92e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.00396


ADV1:  0.0030043146547445872 0.006530440459058738 0.061148788181067615 -0.05455663171638486
ADV2:  -0.029444437607415178 0.8968815821535981 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2633   0.4299   2.1686  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0040   0.0023   0.0087   8.0871   2.2896   2.8947
***** Episode 53089, Mean R = -21.4  Std R = 7.3  Min R = -41.3
PolicyLoss: -0.00851
Policy_Beta: 0.1
Policy_Entropy: 0.143
Policy_KL: 0.00114
Policy_SD: 0.565
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 1.92e+07
VF_0_ExplainedVarNew: 0.994
VF_0_ExplainedVarOld: 0.993
VF_0_Loss : 0.00386


ADV1:  -0.0026612947482308395 0.00891608562161168 0.045

a_f      |    0.03    0.03 |    0.64    1.83 |   -1.48   -3.14 |    1.43    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.03    0.03    0.02
w_rewards |   -0.48 |    0.34 |   -2.27 |   -0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.31 |    0.00 |    3.01
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -1.00 |    1.00    0.99
cs_angles |  0.0016  0.0032 |  0.0866  0.0871 | -0.9904 -0.9971 |  0.9965  0.9892
optical_flow | -0.0000 -0.0000 |  0.0268  0.0273 | -1.2033 -1.4639 |  1.2971  1.2400
v_err    | -0.0095 |  0.0569 | -0.4509 |  0.1152
landing_rewards |    9.32 |    2.51 |    0.00 |   10.00
landing_margin |   -0.03 |    0.02 |   -0.07 |    0.03
tracking_rewards |  -24.43 |    4.79 |  -44.29 |  -14.85
steps    |     375 |      20 |     330 |     417
***** Episode 53368, Mean R = -19.7  Std R = 4.9  Min R = -31.2
PolicyLoss: -0.00308
P

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.07    0.08    0.05
a_f      |   -0.11    0.12 |    0.66    1.79 |   -1.55   -3.14 |    1.49    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.03    0.03    0.03
w_rewards |   -0.46 |    0.27 |   -1.33 |   -0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.31 |    0.00 |    2.93
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.97   -1.00 |    0.98    0.99
cs_angles |  0.0050  0.0011 |  0.0862  0.0871 | -0.9717 -0.9977 |  0.9819  0.9944
optical_flow | -0.0001 -0.0002 |  0.0266  0.0266 | -0.9868 -1.2591 |  1.2473  1.2250
v_err    | -0.0096 |  0.0565 | -0.4525 |  0.1328
landing_rewards |    9.16 |    2.77 |    0.00 |   10.00
landing_margin |   -0.03 |    0.02 |   -0.08 |    0.06
tracking_rewards |  -24.24 |    4.74 |  -42.04 |  -15.55
steps    |     378 |  

attitude |    0.05    0.03    0.10 |    1.28    0.71    1.90 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.08 |    0.09    0.07    0.05
a_f      |    0.03    0.08 |    0.71    1.92 |   -1.43   -3.14 |    1.48    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.03 |    0.03    0.03    0.03
w_rewards |   -0.45 |    0.30 |   -2.20 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.30 |    0.00 |    3.05
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -1.00   -0.99 |    0.99    1.00
cs_angles |  0.0021  0.0039 |  0.0849  0.0895 | -0.9970 -0.9885 |  0.9940  0.9981
optical_flow | -0.0002 -0.0000 |  0.0257  0.0281 | -1.2272 -1.1158 |  1.1489  1.1863
v_err    | -0.0097 |  0.0571 | -0.4546 |  0.1215
landing_rewards |    9.42 |    2.34 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.09    0.08    0.05
a_f      |   -0.02    0.16 |    0.68    1.85 |   -1.48   -3.14 |    1.53    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.03    0.03    0.03
w_rewards |   -0.46 |    0.32 |   -2.64 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.31 |    0.00 |    2.96
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.99   -0.99 |    0.99    1.00
cs_angles |  0.0023  0.0040 |  0.0840  0.0892 | -0.9914 -0.9938 |  0.9899  0.9981
optical_flow | -0.0000  0.0000 |  0.0253  0.0278 | -1.4870 -1.5351 |  1.0738  1.2575
v_err    | -0.0095 |  0.0562 | -0.4514 |  0.1255
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0.03 |    0.02 |   -0.06 |    0.05
tracking_rewards |  -24.16 |    4.78 |  -41.14 |  -15.20
steps    |     375 |  

attitude |    0.09    0.04   -0.13 |    1.14    0.68    1.75 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.08 |    0.08    0.08    0.05
a_f      |    0.04   -0.11 |    0.68    1.74 |   -1.40   -3.13 |    1.52    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.03    0.03    0.03
w_rewards |   -0.50 |    0.35 |   -2.73 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.29 |    0.31 |    0.00 |    3.01
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -0.99 |    0.99    1.00
cs_angles |  0.0014  0.0040 |  0.0857  0.0935 | -0.9923 -0.9881 |  0.9892  0.9986
optical_flow | -0.0001 -0.0001 |  0.0254  0.0258 | -1.1551 -0.8969 |  0.9614  1.2256
v_err    | -0.0096 |  0.0569 | -0.4532 |  0.4337
landing_rewards |    9.42 |    2.34 |    0.00 |   10.00
landing_margin |    0

attitude |   -0.02    0.01   -0.16 |    1.18    0.62    1.90 |   -3.14   -1.55   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.08 |    0.08    0.07    0.05
a_f      |    0.02   -0.13 |    0.62    1.90 |   -1.52   -3.13 |    1.44    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.49 |    0.30 |   -2.30 |   -0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.31 |    0.00 |    3.00
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.99   -1.00 |    1.00    1.00
cs_angles |  0.0005  0.0045 |  0.0834  0.0859 | -0.9898 -0.9964 |  0.9999  0.9966
optical_flow |  0.0000 -0.0001 |  0.0249  0.0268 | -0.9900 -1.1162 |  1.1519  1.1816
v_err    | -0.0093 |  0.0562 | -0.4519 |  0.1131
landing_rewards |    9.19 |    2.72 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.09    0.08    0.05
a_f      |    0.03    0.11 |    0.64    1.78 |   -1.53   -3.14 |    1.54    3.06
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.03    0.03    0.02
w_rewards |   -0.50 |    0.35 |   -3.40 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.31 |    0.00 |    3.09
seeker_angles |    0.00    0.01 |    0.09    0.09 |   -0.99   -0.99 |    0.99    0.97
cs_angles |  0.0008  0.0055 |  0.0877  0.0881 | -0.9944 -0.9895 |  0.9855  0.9666
optical_flow | -0.0001 -0.0000 |  0.0246  0.0257 | -0.8900 -1.0522 |  1.0782  1.1917
v_err    | -0.0094 |  0.0565 | -0.4525 |  0.1992
landing_rewards |    9.13 |    2.82 |    0.00 |   10.00
landing_margin |   -0.03 |    0.02 |   -0.07 |    0.03
tracking_rewards |  -24.88 |    5.12 |  -50.84 |  -15.63
steps    |     377 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.08 |    0.08    0.08    0.05
a_f      |    0.08    0.02 |    0.64    1.86 |   -1.33   -3.13 |    1.54    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.03   -0.02 |    0.03    0.03    0.03
w_rewards |   -0.57 |    0.48 |   -5.39 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.28 |    0.31 |    0.00 |    2.94
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -1.00 |    1.00    0.99
cs_angles |  0.0030  0.0031 |  0.0861  0.0863 | -0.9962 -0.9982 |  0.9996  0.9875
optical_flow | -0.0001 -0.0000 |  0.0276  0.0266 | -1.2537 -1.2760 |  1.2196  1.2735
v_err    | -0.0093 |  0.0571 | -0.4523 |  0.4661
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |    3.64 |   46.24 |   -0.08 |  669.04
tracking_rewards |  -24.26 |    5.43 |  -55.96 |  -16.09
steps    |     375 |  

attitude |    0.03   -0.09    0.06 |    1.24    0.64    1.92 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.08 |    0.09    0.07    0.06
a_f      |   -0.09    0.06 |    0.64    1.91 |   -1.42   -3.14 |    1.42    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.55 |    0.53 |   -6.63 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.29 |    0.32 |    0.00 |    3.13
seeker_angles |    0.00    0.01 |    0.09    0.09 |   -1.00   -0.99 |    1.00    1.00
cs_angles |  0.0009  0.0089 |  0.0859  0.0896 | -0.9997 -0.9911 |  0.9965  0.9973
optical_flow | -0.0002 -0.0001 |  0.0257  0.0268 | -1.1654 -1.3481 |  1.3800  1.1796
v_err    | -0.0093 |  0.0565 | -0.4529 |  0.1162
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.07 |    0.09    0.08    0.08
a_f      |    0.01   -0.20 |    0.64    1.84 |   -1.33   -3.10 |    1.46    3.12
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.02   -0.02 |    0.03    0.03    0.04
w_rewards |   -0.58 |    0.49 |   -3.91 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.32 |    0.00 |    3.01
seeker_angles |    0.00    0.01 |    0.08    0.09 |   -0.99   -1.00 |    0.92    0.99
cs_angles |  0.0014  0.0074 |  0.0832  0.0904 | -0.9937 -0.9980 |  0.9242  0.9871
optical_flow | -0.0000  0.0001 |  0.0259  0.0261 | -0.9530 -0.9886 |  1.1176  1.4954
v_err    | -0.0095 |  0.0574 | -0.4534 |  0.1653
landing_rewards |    9.26 |    2.62 |    0.00 |   10.00
landing_margin |    3.17 |   56.23 |   -0.07 |  991.67
tracking_rewards |  -24.51 |    5.51 |  -57.84 |  -11.99
steps    |     377 |  

attitude |   -0.01    0.01    0.13 |    1.17    0.65    1.81 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.08 |    0.10    0.08    0.05
a_f      |    0.00    0.18 |    0.65    1.80 |   -1.45   -3.10 |    1.43    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.03    0.03
w_rewards |   -0.58 |    0.44 |   -4.79 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.31 |    0.00 |    3.10
seeker_angles |    0.00    0.01 |    0.09    0.08 |   -0.99   -0.99 |    0.98    0.99
cs_angles |  0.0005  0.0066 |  0.0875  0.0832 | -0.9920 -0.9940 |  0.9762  0.9924
optical_flow | -0.0001  0.0001 |  0.0254  0.0266 | -1.2126 -1.0883 |  1.1152  1.2140
v_err    | -0.0091 |  0.0572 | -0.4533 |  0.1171
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.01    0.01    0.00 |    0.70    0.69    0.70 |   -3.45   -3.43   -3.43 |    3.45    3.46    3.45
norm_thrust |    0.93 |    0.77 |    0.00 |    3.46
fuel     |    1.64 |    0.28 |    0.24 |    4.20
rewards  |  -21.21 |   13.51 | -173.66 |   -9.91
fuel_rewards |   -4.69 |    0.80 |  -12.03 |   -0.69
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.93 |   13.19 |    0.01 |  262.91
norm_af  |    1.70 |    0.86 |    0.06 |    3.31
norm_wf  |    0.02 |    0.01 |    0.00 |    0.10
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.02    0.04    0.08 |    1.11    0.67    1.77 |   -3.14   -1.55   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.09   -0.07 |    0.08    0.08    0.05
a_f      |    0.04    0.04 |    0.68

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.9652   1.8896   7.8267  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0011   8.0871   2.2896   2.8947
Update Cnt = 1840    ET =   1206.6   Stats:  Mean, Std, Min, Max
r_f      |   16.06   -3.00   -6.22 |  200.27  161.16  197.94 | -383.19 -392.79 -389.77 |  399.67  386.83  388.73
v_f      |   -0.01   -0.00    0.00 |    0.04    0.04    0.05 |   -0.10   -0.10   -0.11 |    0.08    0.09    0.10
r_i      |   80.05    2.99  -34.56 |  725.79  615.24  756.28 |-1345.63-1334.78-1237.79 | 1351.57 1264.59 1273.83
v_i      |   -0.01   -0.00    0.00 |    0.05    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.09    0.10
norm_rf  |    0.23 |    0.09 |    0.04 |    0.56
norm_vf  |    0.07 |    0.02 |    0.03 |    0.13
gs_f     |    1.33 |    2.37 |    0.01 |   27.77
thrust   |   -0.00   -0.00   -0.00 |    0.67    0.69    0.68 |   -3.46   -3.46   -3.46 |    3.44    3.46    3.44
norm_thrust |    

ADV1:  -0.00024918762479894267 0.02263971965866307 1.2430322946208672 -0.3404051222095116
ADV2:  -0.002664098760417023 0.3580888936765292 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.4957   0.1877   1.0169  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0007   0.0028   8.0871   2.2896   2.8947
***** Episode 57367, Mean R = -19.5  Std R = 5.9  Min R = -38.8
PolicyLoss: 0.00262
Policy_Beta: 0.1
Policy_Entropy: 0.146
Policy_KL: 0.000748
Policy_SD: 0.545
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.08e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.905
VF_0_Loss : 0.00924


ADV1:  -0.0017316859688115392 0.013914977947881572 0.09126578841474381 -0.2366138086488936
ADV2:  0.022451545750484095 0.7606307189225818 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7629   1.0772   5.9265  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0012   0.0047   8.0871   2.2896   2.89

ADV1:  -0.000908330631177495 0.011362882852604481 0.10842426757007134 -0.23690210796588396
ADV2:  0.020356063327629893 0.7880558659049394 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4450   0.6293   3.0423  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0027   8.0871   2.2896   2.8947
***** Episode 57646, Mean R = -20.5  Std R = 6.5  Min R = -36.7
PolicyLoss: -0.0192
Policy_Beta: 0.1
Policy_Entropy: 0.144
Policy_KL: 0.00097
Policy_SD: 0.553
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.09e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.00539


ADV1:  -0.0004592887380819743 0.011142186877320291 0.054876925554477096 -0.07215321858085072
ADV2:  0.02000016750280854 0.8913912691017754 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2790   1.1308   5.1215  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0012   8.0871   2.2896   2.894

ADV1:  0.0006661963847865823 0.006533591837537778 0.04798881586507581 -0.055780971839518356
ADV2:  -0.010057934847463493 0.9009752722214124 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.7041   2.6376   9.9665  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0019   8.0871   2.2896   2.8947
***** Episode 57925, Mean R = -19.2  Std R = 5.9  Min R = -37.4
PolicyLoss: -0.000969
Policy_Beta: 0.1
Policy_Entropy: 0.146
Policy_KL: 0.000905
Policy_SD: 0.562
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.1e+07
VF_0_ExplainedVarNew: 0.993
VF_0_ExplainedVarOld: 0.991
VF_0_Loss : 0.00515


ADV1:  -0.002133223490693514 0.012179669760674068 0.12984219587696028 -0.2829904811335985
ADV2:  0.03173912347281085 0.7386274868461136 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2150   0.5427   3.2795  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0025   0.0014   0.0054   8.0871   2.2896   2.8

ADV1:  -0.00033249964847719495 0.006211322967198435 0.05273350503073643 -0.04646235399902565
ADV2:  0.00045566975691969393 0.904958801826596 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2297   0.6203   3.3872  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0012   8.0871   2.2896   2.8947
***** Episode 58204, Mean R = -19.1  Std R = 4.8  Min R = -28.8
PolicyLoss: 9.03e-05
Policy_Beta: 0.1
Policy_Entropy: 0.145
Policy_KL: 0.001
Policy_SD: 0.556
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.11e+07
VF_0_ExplainedVarNew: 0.993
VF_0_ExplainedVarOld: 0.992
VF_0_Loss : 0.00565


ADV1:  -0.0028806896367310065 0.011472503971606396 0.0470501551107545 -0.08033494787111636
ADV2:  0.03851455869037367 0.8798494836683782 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   6.5189   4.9272  16.6021  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0033   0.0021   0.0074   8.0871   2.2896   2.89

ADV1:  -0.000719587060427279 0.009425112844757095 0.04118468490845972 -0.11693345293829616
ADV2:  0.03252236999197883 0.8174214030305916 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.9548   2.2096   9.3424  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0018   8.0871   2.2896   2.8947
***** Episode 58483, Mean R = -18.7  Std R = 7.1  Min R = -40.0
PolicyLoss: -0.0319
Policy_Beta: 0.1
Policy_Entropy: 0.147
Policy_KL: 0.00092
Policy_SD: 0.555
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.12e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.00608


ADV1:  -0.000588213729198114 0.00907419070983795 0.05345716352085761 -0.08704948815616698
ADV2:  0.018296028240857895 0.875995538032196 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   5.0807   3.4055  13.9090  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0016   8.0871   2.2896   2.8947
*

ADV1:  -0.0023284229062112936 0.013819444774990466 0.07343587471482049 -0.28549759059165125
ADV2:  0.032630392081193234 0.7103998711338477 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8733   0.3167   1.7417  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0025   0.0015   0.0059   8.0871   2.2896   2.8947
***** Episode 58762, Mean R = -21.5  Std R = 7.7  Min R = -41.7
PolicyLoss: -0.0253
Policy_Beta: 0.1
Policy_Entropy: 0.144
Policy_KL: 0.001
Policy_SD: 0.567
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.13e+07
VF_0_ExplainedVarNew: 0.976
VF_0_ExplainedVarOld: 0.968
VF_0_Loss : 0.00534


ADV1:  2.789281013266259e-05 0.009526569614548633 0.11086320441579794 -0.16551133607008373
ADV2:  0.016210428016914354 0.8034081987195899 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6291   0.7595   3.9119  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0003   0.0011   8.0871   2.2896   2.8947

ADV1:  -0.00015291603810165707 0.008211012316692972 0.07262608237242105 -0.08013982947863851
ADV2:  0.017932567939170214 0.8413948843766869 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3755   1.4556   6.6343  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0014   8.0871   2.2896   2.8947
***** Episode 59041, Mean R = -19.6  Std R = 6.1  Min R = -39.5
PolicyLoss: -0.0208
Policy_Beta: 0.1
Policy_Entropy: 0.144
Policy_KL: 0.00108
Policy_SD: 0.557
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.15e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.00563


ADV1:  0.0007451619974445253 0.008535406863720415 0.06940716140282771 -0.17521803096764033
ADV2:  0.012678007633578545 0.7893698946769037 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.8572   1.7010   8.3992  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0019   8.0871   2.2896   2.8

ADV1:  0.0004923598288403604 0.03225421631515804 0.6013467008089076 -0.12073749130521721
ADV2:  -0.04918424568961564 0.47373262953078377 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1022   0.5234   2.4524  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0028   0.0015   0.0061   8.0871   2.2896   2.8947
***** Episode 59320, Mean R = -20.9  Std R = 13.0  Min R = -86.5
PolicyLoss: 0.05
Policy_Beta: 0.1
Policy_Entropy: 0.145
Policy_KL: 0.000911
Policy_SD: 0.561
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.16e+07
VF_0_ExplainedVarNew: 0.948
VF_0_ExplainedVarOld: 0.827
VF_0_Loss : 0.0213


ADV1:  0.001349090282567587 0.013352117699603129 0.11907483035760696 -0.09961099711078186
ADV2:  -0.00915142368700383 0.9044799678789482 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.1440   2.5989  10.8341  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0010   0.0047   8.0871   2.2896   2.8947
**

ADV1:  0.00025586644737374167 0.011821939552245165 0.06272729301679408 -0.12166804900243744
ADV2:  0.012093603721216472 0.8971093053507527 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6858   1.3897   7.1017  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0009   8.0871   2.2896   2.8947
***** Episode 59599, Mean R = -22.6  Std R = 7.7  Min R = -40.1
PolicyLoss: -0.0179
Policy_Beta: 0.1
Policy_Entropy: 0.144
Policy_KL: 0.00111
Policy_SD: 0.567
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.17e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.00855


ADV1:  0.0021488610971317373 0.0068811458132428905 0.0865257036401037 -0.06041572067728612
ADV2:  -0.026789833335409907 0.8560325156696079 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6976   0.9165   4.9194  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0015   0.0058   8.0871   2.2896   2.8

cs_angles | -0.0005  0.0067 |  0.0831  0.0864 | -0.9972 -0.9789 |  0.9677  0.9809
optical_flow | -0.0001 -0.0002 |  0.0249  0.0265 | -1.3479 -1.0326 |  1.2017  1.4441
v_err    | -0.0095 |  0.0566 | -0.4535 |  0.1576
landing_rewards |    9.42 |    2.34 |    0.00 |   10.00
landing_margin |   -0.02 |    0.02 |   -0.06 |    0.04
tracking_rewards |  -23.58 |    4.96 |  -44.01 |  -15.27
steps    |     377 |      20 |     331 |     418
***** Episode 59878, Mean R = -18.7  Std R = 5.9  Min R = -32.3
PolicyLoss: -0.0139
Policy_Beta: 0.1
Policy_Entropy: 0.146
Policy_KL: 0.00142
Policy_SD: 0.559
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.18e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.969
VF_0_Loss : 0.00855


ADV1:  0.0027096201681945076 0.008204805148492873 0.060971952887663106 -0.1714214761049747
ADV2:  -0.01514569746112414 0.7721933022909218 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5862   0.8865   5.0039  29.5271  16.8478  11.1535
ValFun  Gradients: u/s

attitude |    0.03   -0.07    0.08 |    1.28    0.62    1.93 |   -3.14   -1.54   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.08 |    0.09    0.07    0.05
a_f      |   -0.07    0.13 |    0.62    1.92 |   -1.46   -3.14 |    1.43    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.04   -0.03   -0.03 |    0.03    0.02    0.02
w_rewards |   -0.48 |    0.34 |   -2.81 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.03
seeker_angles |   -0.00    0.00 |    0.09    0.08 |   -0.99   -0.99 |    0.99    0.95
cs_angles | -0.0003  0.0042 |  0.0869  0.0822 | -0.9943 -0.9933 |  0.9927  0.9536
optical_flow | -0.0001 -0.0000 |  0.0252  0.0254 | -1.1100 -1.2233 |  1.2267  1.2179
v_err    | -0.0096 |  0.0568 | -0.4530 |  0.2143
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.06   -0.05   -0.01 |    1.24    0.68    1.86 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.07 |    0.09    0.07    0.06
a_f      |   -0.06    0.07 |    0.68    1.86 |   -1.49   -3.13 |    1.44    3.11
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.02   -0.03 |    0.03    0.03    0.02
w_rewards |   -0.47 |    0.33 |   -2.77 |   -0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.30 |    0.00 |    3.04
seeker_angles |   -0.01    0.00 |    0.08    0.09 |   -1.00   -1.00 |    0.99    0.98
cs_angles | -0.0054  0.0038 |  0.0814  0.0853 | -0.9986 -0.9998 |  0.9920  0.9831
optical_flow |  0.0000  0.0001 |  0.0264  0.0272 | -1.2512 -1.0454 |  1.2702  1.2364
v_err    | -0.0096 |  0.0570 | -0.4571 |  0.1821
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |    3

attitude |   -0.03   -0.04   -0.02 |    1.18    0.63    1.87 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.07    0.07    0.05
a_f      |   -0.04    0.04 |    0.63    1.89 |   -1.40   -3.12 |    1.50    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.46 |    0.32 |   -2.24 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.31 |    0.00 |    2.98
seeker_angles |    0.00    0.00 |    0.09    0.08 |   -1.00   -1.00 |    0.99    0.97
cs_angles |  0.0023  0.0046 |  0.0853  0.0848 | -0.9985 -0.9977 |  0.9862  0.9737
optical_flow | -0.0000  0.0000 |  0.0265  0.0257 | -1.1734 -1.0318 |  1.2823  1.0556
v_err    | -0.0093 |  0.0569 | -0.4525 |  0.1194
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.02   -0.04    0.13 |    1.24    0.66    1.88 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.09    0.07    0.05
a_f      |   -0.04    0.12 |    0.65    1.87 |   -1.44   -3.13 |    1.38    3.12
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.03    0.02    0.03
w_rewards |   -0.48 |    0.33 |   -1.78 |   -0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.31 |    0.00 |    3.03
seeker_angles |    0.00    0.01 |    0.08    0.09 |   -1.00   -1.00 |    1.00    0.99
cs_angles |  0.0015  0.0063 |  0.0843  0.0859 | -0.9967 -0.9964 |  0.9978  0.9901
optical_flow | -0.0001 -0.0002 |  0.0254  0.0260 | -1.1651 -1.1872 |  0.9713  1.3215
v_err    | -0.0091 |  0.0570 | -0.4524 |  0.1206
landing_rewards |    9.32 |    2.51 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00    0.00   -0.00 |    0.69    0.70    0.69 |   -3.44   -3.44   -3.46 |    3.45    3.42    3.46
norm_thrust |    0.93 |    0.76 |    0.00 |    3.46
fuel     |    1.60 |    0.21 |    1.14 |    2.23
rewards  |  -19.63 |    5.75 |  -40.72 |   -8.86
fuel_rewards |   -4.58 |    0.59 |   -6.39 |   -3.28
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.89 |   12.78 |    0.01 |  532.10
norm_af  |    1.76 |    0.89 |    0.14 |    3.25
norm_wf  |    0.02 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.00   -0.06    0.02 |    1.22    0.65    1.87 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.08    0.08    0.05
a_f      |   -0.06    0.11 |    0.65

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0600   1.0227   4.6343  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0017   8.0871   2.2896   2.8947
Update Cnt = 1990    ET =   1047.3   Stats:  Mean, Std, Min, Max
r_f      |    1.02  -16.37   -9.86 |  180.23  166.05  200.98 | -391.24 -365.09 -385.57 |  378.17  371.76  380.58
v_f      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.11   -0.09   -0.11 |    0.09    0.09    0.13
r_i      |    5.72  -51.32  -47.19 |  665.60  657.61  772.90 |-1251.50-1361.91-1293.30 | 1261.66 1246.53 1297.88
v_i      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.10   -0.10 |    0.09    0.10    0.10
norm_rf  |    0.24 |    0.09 |    0.05 |    0.62
norm_vf  |    0.07 |    0.02 |    0.04 |    0.14
gs_f     |    1.58 |    5.00 |    0.01 |   83.35
thrust   |   -0.01    0.00    0.01 |    0.69    0.70    0.68 |   -3.42   -3.37   -3.44 |    3.46    3.45    3.45
norm_thrust |    

ADV1:  0.00019091628553641798 0.00812272251332068 0.06911652715966887 -0.0534713739847586
ADV2:  0.0043961769914270445 0.8719372377952136 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.1603   1.7415   7.8438  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0006   8.0871   2.2896   2.8947
***** Episode 62017, Mean R = -19.2  Std R = 4.8  Min R = -29.6
PolicyLoss: -0.0097
Policy_Beta: 0.1
Policy_Entropy: 0.15
Policy_KL: 0.0013
Policy_SD: 0.548
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.26e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.0124


ADV1:  -0.002510803656873772 0.012119131454417446 0.06601263205516328 -0.0749171335352938
ADV2:  0.02785663633783256 0.9064541578392278 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.1643   1.9870   9.4046  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0018   0.0065   8.0871   2.2896   2.8947
Upd

ADV1:  0.0007965651056853899 0.007254309714909076 0.05685777729864905 -0.12300391610752182
ADV2:  0.014143453552659158 0.7846208601016478 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8786   1.1599   5.4612  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0006   0.0022   8.0871   2.2896   2.8947
***** Episode 62296, Mean R = -19.6  Std R = 6.4  Min R = -34.1
PolicyLoss: -0.027
Policy_Beta: 0.1
Policy_Entropy: 0.148
Policy_KL: 0.000815
Policy_SD: 0.558
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.27e+07
VF_0_ExplainedVarNew: 0.992
VF_0_ExplainedVarOld: 0.99
VF_0_Loss : 0.00783


ADV1:  0.0005628789160980766 0.006252822875131442 0.05191470347589899 -0.07988934242982437
ADV2:  -0.0010794077209030492 0.8430930075557004 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2933   0.5065   2.1780  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0004   0.0017   8.0871   2.2896   2.89

ADV1:  0.00024149867336140023 0.008300501080113659 0.19597390948795335 -0.06316461835109174
ADV2:  -0.012292533595384509 0.8020993282831669 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6744   0.8111   4.5411  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0004   0.0017   8.0871   2.2896   2.8947
***** Episode 62575, Mean R = -18.5  Std R = 6.0  Min R = -36.5
PolicyLoss: 0.00753
Policy_Beta: 0.1
Policy_Entropy: 0.15
Policy_KL: 0.000777
Policy_SD: 0.553
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.28e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.0111


ADV1:  -0.0018449119463048648 0.006808718738897533 0.08576700252622954 -0.08163304787083203
ADV2:  0.02284433162909017 0.8468817873222866 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2574   1.1076   5.1592  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0014   0.0049   8.0871   2.2896   2.894

ADV1:  0.001031620303428432 0.009399759247373494 0.04461531043428296 -0.09066361181534133
ADV2:  0.013464883943273795 0.8709528860473869 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7511   0.7814   3.9449  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0007   0.0027   8.0871   2.2896   2.8947
***** Episode 62854, Mean R = -20.1  Std R = 4.4  Min R = -28.8
PolicyLoss: -0.0243
Policy_Beta: 0.1
Policy_Entropy: 0.148
Policy_KL: 0.00122
Policy_SD: 0.557
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.29e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00947


ADV1:  0.0008372487237421345 0.008732592415089453 0.11758180515392086 -0.19758527126655345
ADV2:  0.007475775780589613 0.7809518505727331 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6736   1.2537   6.5633  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0025   8.0871   2.2896   2.8947

ADV1:  -0.0018611938522890641 0.014510405699379763 0.17361417972390514 -0.10093900812618745
ADV2:  -0.005095964888707623 0.8386107142274193 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4348   0.6929   3.5273  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0011   0.0051   8.0871   2.2896   2.8947
***** Episode 63133, Mean R = -20.3  Std R = 5.2  Min R = -32.1
PolicyLoss: 0.0117
Policy_Beta: 0.1
Policy_Entropy: 0.148
Policy_KL: 0.000956
Policy_SD: 0.56
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.3e+07
VF_0_ExplainedVarNew: 0.966
VF_0_ExplainedVarOld: 0.957
VF_0_Loss : 0.000636


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.0007840107026724787 0.01647621440446819 0.31026491507428733 -0.18219971341576635
ADV2:  -0.024808611194355873 0.6783819908104152 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3264   0.5871   2.7718  29.5271  16.8478  11.1535
ValFun  

ADV1:  0.0009384200196617226 0.010422931301157847 0.16644232775803885 -0.09443335242518669
ADV2:  -0.0030953388327170962 0.8203651583786596 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2989   0.6109   3.0797  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0005   0.0024   8.0871   2.2896   2.8947
***** Episode 63412, Mean R = -19.5  Std R = 5.2  Min R = -35.9
PolicyLoss: -0.00652
Policy_Beta: 0.1
Policy_Entropy: 0.148
Policy_KL: 0.000838
Policy_SD: 0.554
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.31e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 0.00337


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.00033095401265113817 0.009719472538694473 0.16453159588889363 -0.1509771254981656
ADV2:  0.009286594483961673 0.7443025215334366 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7795   1.0757   5.0643  29.5271  16.8478  11.1535
ValF

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -1.180273362386869e-05 0.008163739197080988 0.07474134595487791 -0.11777434575727974
ADV2:  0.01678897719027337 0.8638981622373277 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4234   0.6796   3.7249  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0017   8.0871   2.2896   2.8947
***** Episode 63691, Mean R = -18.9  Std R = 4.2  Min R = -29.9
PolicyLoss: -0.021
Policy_Beta: 0.1
Policy_Entropy: 0.152
Policy_KL: 0.00102
Policy_SD: 0.542
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.32e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.00213


ADV1:  0.0009605302737339032 0.008491190723732412 0.0807195432164215 -0.1251131291349491
ADV2:  0.010307353055172344 0.7820464372081131 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5289   0.6405   3.7722  29.5271  16.8478  11.1535
ValFun  Grad

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.00239613156188997 0.008346511406601812 0.09314621566017817 -0.07173273242592249
ADV2:  -0.009259471506830652 0.8206562643453301 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7877   0.9953   5.3850  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0017   0.0063   8.0871   2.2896   2.8947
***** Episode 63970, Mean R = -20.5  Std R = 6.5  Min R = -33.3
PolicyLoss: -0.0184
Policy_Beta: 0.1
Policy_Entropy: 0.149
Policy_KL: 0.00127
Policy_SD: 0.556
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.33e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.00204


ADV1:  -0.0022089778398001656 0.011355242139606212 0.0574747977826916 -0.07667465254639722
ADV2:  0.03400575179300207 0.877278932505339 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0518   0.9297   4.0332  29.5271  16.8478  11.1535
ValFun  Grad

***** Episode 64218, Mean R = -20.0  Std R = 6.3  Min R = -32.7
PolicyLoss: -0.0238
Policy_Beta: 0.1
Policy_Entropy: 0.149
Policy_KL: 0.000802
Policy_SD: 0.555
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 2.34e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 0.00214


ADV1:  0.002311506377562911 0.008600028480024962 0.059570060795100965 -0.07929582372090495
ADV2:  -0.002255686025336824 0.8752158706453587 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.7866   2.2145   9.0362  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0015   0.0061   8.0871   2.2896   2.8947
***** Episode 64249, Mean R = -20.1  Std R = 5.1  Min R = -31.5
PolicyLoss: -0.0223
Policy_Beta: 0.1
Policy_Entropy: 0.15
Policy_KL: 0.00121
Policy_SD: 0.553
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.34e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.00214


ADV1:  0.00040846470918796284 0.009289485002098455 0.2

seeker_angles |   -0.00    0.00 |    0.08    0.09 |   -1.00   -0.99 |    1.00    1.00
cs_angles | -0.0008  0.0023 |  0.0840  0.0857 | -0.9981 -0.9928 |  0.9959  0.9984
optical_flow | -0.0001 -0.0001 |  0.0262  0.0267 | -1.3226 -1.5231 |  1.0852  1.2760
v_err    | -0.0095 |  0.0561 | -0.4548 |  0.1761
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0.03 |    0.02 |   -0.07 |    0.01
tracking_rewards |  -23.59 |    4.92 |  -50.44 |  -14.67
steps    |     379 |      21 |     335 |     420
***** Episode 64528, Mean R = -19.8  Std R = 7.0  Min R = -39.8
PolicyLoss: -0.0248
Policy_Beta: 0.1
Policy_Entropy: 0.148
Policy_KL: 0.00135
Policy_SD: 0.55
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.35e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.00129


ADV1:  -0.0005741489305345551 0.007294628288691743 0.03377650224536105 -0.06540225815906103
ADV2:  0.023462146002790608 0.8697996779055599 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max 

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |   -0.02    0.14 |    0.68    1.84 |   -1.54   -3.10 |    1.46    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.04 |    0.03    0.02    0.03
w_rewards |   -0.42 |    0.28 |   -1.61 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.10
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    0.99    0.99
cs_angles | -0.0023  0.0033 |  0.0828  0.0810 | -0.9938 -0.9929 |  0.9886  0.9929
optical_flow | -0.0001 -0.0001 |  0.0250  0.0252 | -1.2036 -1.0413 |  1.1291  1.0583
v_err    | -0.0095 |  0.0561 | -0.4531 |  0.1154
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0.03 |    0.02 |   -0.07 |    0.03
tracking_rewards |  -22.98 |    4.48 |  -41.78 |  -14.88
steps    |     377 |  

thrust   |   -0.01    0.01   -0.00 |    0.69    0.69    0.69 |   -3.44   -3.44   -3.46 |    3.46    3.32    3.46
norm_thrust |    0.92 |    0.76 |    0.00 |    3.46
fuel     |    1.60 |    0.20 |    1.22 |    2.46
rewards  |  -19.21 |    5.99 |  -41.65 |   -9.61
fuel_rewards |   -4.59 |    0.57 |   -7.03 |   -3.48
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.90 |   12.94 |    0.01 | 1184.93
norm_af  |    1.63 |    0.90 |    0.02 |    3.25
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.08   -0.03   -0.19 |    1.08    0.63    1.74 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.07 |    0.09    0.08    0.05
a_f      |   -0.02   -0.14 |    0.64

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   5.0542   2.9161  11.1135  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0008   0.0032   8.0871   2.2896   2.8947
Update Cnt = 2110    ET =   1097.7   Stats:  Mean, Std, Min, Max
r_f      |   -0.49   13.19  -10.10 |  182.44  168.52  198.07 | -390.65 -390.98 -395.31 |  388.86  371.03  390.38
v_f      |   -0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.10 |    0.10    0.09    0.13
r_i      |   21.51   39.76  -24.65 |  681.09  670.50  747.67 |-1280.15-1257.93-1279.68 | 1322.21 1254.62 1274.06
v_i      |   -0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.09    0.10
norm_rf  |    0.22 |    0.09 |    0.02 |    0.50
norm_vf  |    0.07 |    0.02 |    0.03 |    0.14
gs_f     |    1.29 |    2.45 |    0.01 |   29.29
thrust   |   -0.00    0.00   -0.01 |    0.69    0.69    0.70 |   -3.43   -3.42   -3.43 |    3.40    3.45    3.40
norm_thrust |    

ADV1:  0.0027349259058126276 0.0064565289353864345 0.0653334527230392 -0.06173835789328419
ADV2:  -0.02121614211388959 0.8352148387063236 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6723   0.9156   5.1108  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0036   0.0021   0.0077   8.0871   2.2896   2.8947
***** Episode 65737, Mean R = -15.8  Std R = 4.2  Min R = -24.7
PolicyLoss: -0.0168
Policy_Beta: 0.1
Policy_Entropy: 0.153
Policy_KL: 0.00101
Policy_SD: 0.535
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.4e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.99
VF_0_Loss : 0.00151


ADV1:  -0.0022810155075969766 0.009019847420092974 0.05230186961996558 -0.15066758557683602
ADV2:  0.04039007051372903 0.7964849764320007 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2540   1.0177   4.7216  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0025   0.0015   0.0059   8.0871   2.2896   2.8947


ADV1:  -0.001161065657287522 0.009094208731666737 0.06007740937022388 -0.05896548401420042
ADV2:  0.027019024291027004 0.8637568479791966 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6829   0.8762   4.4753  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0008   0.0034   8.0871   2.2896   2.8947
***** Episode 66016, Mean R = -17.7  Std R = 4.8  Min R = -28.0
PolicyLoss: -0.0223
Policy_Beta: 0.1
Policy_Entropy: 0.153
Policy_KL: 0.000986
Policy_SD: 0.546
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.41e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.00122


ADV1:  0.0010993122988913096 0.007988300472158396 0.05089266744399146 -0.05913815926213506
ADV2:  0.0071056347445477884 0.8848157675492608 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2818   0.6235   3.3702  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0029   8.0871   2.2896   2.8

ADV1:  -5.649885681319038e-06 0.008833989315279253 0.055099595616585895 -0.08140875530311986
ADV2:  0.026698777240577905 0.8082670842017292 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6034   0.9076   4.9586  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0014   8.0871   2.2896   2.8947
***** Episode 66295, Mean R = -20.3  Std R = 5.2  Min R = -32.3
PolicyLoss: -0.0314
Policy_Beta: 0.1
Policy_Entropy: 0.149
Policy_KL: 0.00083
Policy_SD: 0.556
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.42e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.00102


ADV1:  -0.000900173292423721 0.011910211027249165 0.1970369104284876 -0.14822605209501338
ADV2:  0.008243502064366411 0.7746351211459541 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8160   1.0026   4.6583  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0025   8.0871   2.2896   2.89

***** Episode 66543, Mean R = -19.0  Std R = 5.0  Min R = -31.7
PolicyLoss: -0.0217
Policy_Beta: 0.1
Policy_Entropy: 0.152
Policy_KL: 0.00103
Policy_SD: 0.548
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.43e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.00136


ADV1:  5.1805080194731934e-05 0.007505171388364458 0.03934613411911647 -0.05966790968788299
ADV2:  0.022267624458892802 0.8488596437627957 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2112   0.9373   4.5471  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0003   8.0871   2.2896   2.8947
***** Episode 66574, Mean R = -17.8  Std R = 5.2  Min R = -32.5
PolicyLoss: -0.0272
Policy_Beta: 0.1
Policy_Entropy: 0.151
Policy_KL: 0.000946
Policy_SD: 0.536
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.43e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.00121


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.001

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4893   1.2820   5.8327  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0025   0.0016   0.0059   8.0871   2.2896   2.8947
***** Episode 66822, Mean R = -21.3  Std R = 6.9  Min R = -42.4
PolicyLoss: -0.0096
Policy_Beta: 0.1
Policy_Entropy: 0.15
Policy_KL: 0.000925
Policy_SD: 0.56
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.44e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00168


ADV1:  0.0020453193399294876 0.008435297096194762 0.04849675623609506 -0.05367565423155618
ADV2:  -0.0017455217792381014 0.8735303873786538 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6603   0.7043   3.1041  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0014   0.0052   8.0871   2.2896   2.8947
***** Episode 66853, Mean R = -19.5  Std R = 5.8  Min R = -32.3
PolicyLoss: -0.0172
Policy_Beta: 0.1
Policy_Entropy: 0.15
Policy_KL: 0.00103
Pol

ADV1:  -0.002901658125004438 0.009120103495031106 0.0720485576162872 -0.08221693044651235
ADV2:  0.03762074301909551 0.8160177566294252 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0063   0.9788   4.3877  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0032   0.0018   0.0075   8.0871   2.2896   2.8947
***** Episode 67101, Mean R = -18.4  Std R = 5.1  Min R = -29.7
PolicyLoss: -0.0193
Policy_Beta: 0.1
Policy_Entropy: 0.153
Policy_KL: 0.000968
Policy_SD: 0.542
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.45e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.00132


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0004578534208066078 0.008444392561525895 0.04631827678876416 -0.11538792969820633
ADV2:  0.03450595522036532 0.7681502235045841 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4781   0.9614   4.9361  29.5271  16.8478  11.1535
ValFun  Gr

ADV1:  0.0015439933847417636 0.019198879059681206 0.1837275270438264 -0.4571448992047277
ADV2:  0.02089573703820901 0.4721824594738376 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2434   0.6754   3.5439  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0009   0.0045   8.0871   2.2896   2.8947
***** Episode 67380, Mean R = -19.8  Std R = 8.1  Min R = -58.6
PolicyLoss: -0.0297
Policy_Beta: 0.1
Policy_Entropy: 0.151
Policy_KL: 0.000982
Policy_SD: 0.558
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.46e+07
VF_0_ExplainedVarNew: 0.962
VF_0_ExplainedVarOld: 0.943
VF_0_Loss : 0.00356


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0005044447083771162 0.009890101845081226 0.09912065496815697 -0.09011383552995689
ADV2:  0.00510875176223622 0.7894637152040964 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4362   0.8109   4.1108  29.5271  16.8478  11.1535
ValFun  Gra

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.003570423785584354 0.010630412471906566 0.16842113000449804 -0.0977479207800544
ADV2:  -0.01673541021182218 0.807293429784155 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8281   1.1899   5.6526  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0046   0.0027   0.0091   8.0871   2.2896   2.8947
***** Episode 67659, Mean R = -18.7  Std R = 4.8  Min R = -32.9
PolicyLoss: -0.0107
Policy_Beta: 0.1
Policy_Entropy: 0.153
Policy_KL: 0.00104
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.2e+04
TotalSteps: 2.47e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.0043


ADV1:  0.0019830327818820023 0.010532517116117007 0.15666578867795888 -0.06858292873309985
ADV2:  -0.026038624120093497 0.772129475268035 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8793   1.0186   5.1601  29.5271  16.8478  11.1535
ValFun  Gradien

optical_flow | -0.0001 -0.0000 |  0.0253  0.0252 | -1.1204 -0.9062 |  1.1680  1.0505
v_err    | -0.0102 |  0.0576 | -0.6793 |  0.1459
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0.03 |    0.02 |   -0.07 |    0.02
tracking_rewards |  -23.07 |    6.55 | -101.67 |  -14.62
steps    |     381 |      20 |     338 |     438
***** Episode 67938, Mean R = -19.4  Std R = 6.4  Min R = -37.9
PolicyLoss: -0.00155
Policy_Beta: 0.0667
Policy_Entropy: 0.151
Policy_KL: 0.00469
Policy_SD: 0.554
Policy_lr_mult: 0.198
Steps: 1.2e+04
TotalSteps: 2.48e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.00417


ADV1:  0.001730842928054183 0.009497881328156528 0.09682010313809516 -0.09106319993745216
ADV2:  -0.0028309579758413078 0.8721946914266923 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   9.1712   5.7403  19.1021  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0014   0.0044   8.0871   2.2896   2.8

attitude |    0.01    0.00    0.10 |    1.17    0.63    1.79 |   -3.14   -1.55   -3.14 |    3.14    1.52    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |    0.00    0.10 |    0.64    1.78 |   -1.49   -3.12 |    1.40    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.03    0.04    0.02
w_rewards |   -0.43 |    0.27 |   -2.53 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.01
seeker_angles |   -0.00    0.00 |    0.08    0.09 |   -0.97   -0.97 |    0.97    1.00
cs_angles | -0.0013  0.0039 |  0.0829  0.0861 | -0.9683 -0.9659 |  0.9677  0.9961
optical_flow | -0.0000  0.0001 |  0.0238  0.0253 | -1.1671 -1.2238 |  1.1025  1.3714
v_err    | -0.0096 |  0.0560 | -0.4535 |  0.1103
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.09   -0.04   -0.04 |    1.17    0.66    1.82 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.09    0.07    0.05
a_f      |   -0.04   -0.08 |    0.67    1.82 |   -1.54   -3.14 |    1.42    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.04 |    0.03    0.02    0.03
w_rewards |   -0.47 |    0.32 |   -2.67 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.32 |    0.00 |    3.00
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -1.00 |    0.99    1.00
cs_angles |  0.0022  0.0031 |  0.0857  0.0882 | -0.9996 -0.9998 |  0.9910  0.9999
optical_flow | -0.0003  0.0000 |  0.0263  0.0266 | -1.3190 -1.2484 |  0.9735  1.3455
v_err    | -0.0097 |  0.0565 | -0.4534 |  0.1515
landing_rewards |    9.52 |    2.15 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.16    0.03    0.22 |    1.12    0.68    1.78 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |    0.02    0.21 |    0.67    1.76 |   -1.56   -3.13 |    1.39    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.02   -0.03 |    0.03    0.03    0.03
w_rewards |   -0.42 |    0.30 |   -2.63 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.04
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.97   -0.99 |    0.97    1.00
cs_angles |  0.0040  0.0024 |  0.0808  0.0852 | -0.9685 -0.9906 |  0.9711  0.9986
optical_flow | -0.0001 -0.0001 |  0.0253  0.0251 | -1.4467 -1.0467 |  1.1705  0.9775
v_err    | -0.0098 |  0.0555 | -0.4532 |  0.1292
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |    2

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.08 |    0.08    0.07    0.05
a_f      |   -0.07    0.07 |    0.64    1.77 |   -1.50   -3.14 |    1.38    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.03 |    0.03    0.03    0.03
w_rewards |   -0.45 |    0.32 |   -1.70 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.28 |    0.31 |    0.00 |    2.99
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -1.00   -1.00 |    1.00    0.98
cs_angles |  0.0014  0.0020 |  0.0867  0.0866 | -0.9988 -0.9991 |  0.9989  0.9842
optical_flow | -0.0002 -0.0002 |  0.0250  0.0258 | -1.2860 -1.2209 |  0.9951  1.2035
v_err    | -0.0096 |  0.0563 | -0.4527 |  0.1311
landing_rewards |    9.32 |    2.51 |    0.00 |   10.00
landing_margin |   -0.03 |    0.02 |   -0.07 |    0.06
tracking_rewards |  -23.65 |    5.17 |  -49.38 |  -15.32
steps    |     377 |  

attitude |    0.01    0.02    0.01 |    1.20    0.65    1.86 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.07 |    0.07    0.07    0.05
a_f      |    0.02    0.05 |    0.65    1.85 |   -1.45   -3.14 |    1.47    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.03
w_rewards |   -0.41 |    0.24 |   -1.15 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.05
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -0.97 |    0.97    0.98
cs_angles |  0.0011  0.0036 |  0.0847  0.0843 | -0.9846 -0.9657 |  0.9654  0.9764
optical_flow | -0.0003 -0.0001 |  0.0256  0.0261 | -1.0480 -1.0846 |  1.2609  1.2849
v_err    | -0.0091 |  0.0565 | -0.6041 |  0.1344
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.04    0.02    0.02 |    1.23    0.66    1.88 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.08    0.08    0.05
a_f      |    0.01    0.05 |    0.67    1.89 |   -1.39   -3.10 |    1.56    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.02    0.02    0.03
w_rewards |   -0.40 |    0.29 |   -2.15 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.00
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    0.99    0.99
cs_angles |  0.0032  0.0046 |  0.0836  0.0831 | -0.9930 -0.9975 |  0.9923  0.9881
optical_flow | -0.0001 -0.0002 |  0.0255  0.0260 | -1.1706 -1.3554 |  1.1857  0.9202
v_err    | -0.0092 |  0.0563 | -0.4531 |  0.1537
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.08 |    0.09    0.08    0.05
a_f      |   -0.03    0.03 |    0.65    1.87 |   -1.50   -3.12 |    1.34    3.11
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.02   -0.03 |    0.02    0.02    0.05
w_rewards |   -0.42 |    0.34 |   -3.47 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.32 |    0.00 |    3.08
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.99   -1.00 |    1.00    0.99
cs_angles |  0.0003  0.0024 |  0.0849  0.0876 | -0.9877 -0.9980 |  0.9986  0.9919
optical_flow | -0.0000 -0.0000 |  0.0251  0.0253 | -1.1122 -1.1772 |  1.2332  1.2989
v_err    | -0.0094 |  0.0570 | -0.5826 |  0.1103
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |    3.20 |   56.70 |   -0.07 |  999.82
tracking_rewards |  -23.66 |    5.63 |  -70.13 |  -14.10
steps    |     378 |  

attitude |    0.04    0.03   -0.07 |    1.10    0.68    1.77 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.08    0.08    0.05
a_f      |    0.03   -0.05 |    0.69    1.78 |   -1.51   -3.11 |    1.48    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.03 |    0.03    0.03    0.02
w_rewards |   -0.39 |    0.28 |   -2.53 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    2.94
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    0.99    0.99
cs_angles |  0.0002  0.0022 |  0.0848  0.0828 | -0.9941 -0.9964 |  0.9915  0.9934
optical_flow | -0.0002 -0.0000 |  0.0247  0.0247 | -1.1722 -1.1229 |  1.3775  1.1123
v_err    | -0.0089 |  0.0558 | -0.4527 |  0.1069
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.07    0.07   -0.10 |    1.27    0.68    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.08 |    0.08    0.07    0.05
a_f      |    0.07   -0.05 |    0.68    1.85 |   -1.44   -3.13 |    1.55    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.03    0.02    0.02
w_rewards |   -0.40 |    0.26 |   -1.99 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.02
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    0.99    0.98
cs_angles | -0.0002  0.0026 |  0.0844  0.0830 | -0.9930 -0.9861 |  0.9893  0.9776
optical_flow | -0.0001  0.0001 |  0.0240  0.0254 | -1.3597 -1.2060 |  1.0160  1.1883
v_err    | -0.0091 |  0.0559 | -0.4516 |  0.1215
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.08   -0.01    0.05 |    1.25    0.69    1.87 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.08   -0.07 |    0.08    0.09    0.07
a_f      |   -0.01    0.10 |    0.68    1.86 |   -1.45   -3.13 |    1.55    3.12
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.03 |    0.02    0.02    0.03
w_rewards |   -0.45 |    0.65 |   -9.92 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.02
seeker_angles |    0.00    0.00 |    0.09    0.08 |   -1.00   -0.99 |    0.99    1.00
cs_angles |  0.0004  0.0025 |  0.0863  0.0844 | -0.9998 -0.9875 |  0.9949  0.9962
optical_flow |  0.0001 -0.0001 |  0.0254  0.0252 | -1.2415 -1.1899 |  1.1068  1.2577
v_err    | -0.0099 |  0.0596 | -0.7201 |  0.2809
landing_rewards |    9.39 |    2.40 |    0.00 |   10.00
landing_margin |    2

thrust   |    0.00   -0.00   -0.00 |    0.68    0.68    0.69 |   -3.46   -3.45   -3.46 |    3.46    3.42    3.46
norm_thrust |    0.90 |    0.76 |    0.00 |    3.46
fuel     |    1.55 |    0.20 |    1.04 |    2.70
rewards  |  -18.71 |    6.46 |  -70.80 |   -8.47
fuel_rewards |   -4.43 |    0.58 |   -7.73 |   -2.98
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.81 |   12.38 |    0.01 |  117.31
norm_af  |    1.85 |    0.89 |    0.12 |    3.34
norm_wf  |    0.01 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.02    0.03   -0.08 |    1.25    0.65    1.95 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.07   -0.07 |    0.08    0.08    0.05
a_f      |    0.05   -0.14 |    0.65

ADV1:  0.0003736285000676489 0.00818605655145576 0.06031748943756432 -0.06537488976806821
ADV2:  0.005022836062900914 0.8943854334555911 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0277   0.9939   5.0373  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0013   8.0871   2.2896   2.8947
Update Cnt = 2310    ET =   1028.0   Stats:  Mean, Std, Min, Max
r_f      |   10.36   -3.78   27.12 |  184.55  169.47  203.83 | -387.96 -382.74 -357.64 |  389.80  395.08  393.15
v_f      |   -0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.09 |    0.11    0.11    0.10
r_i      |   51.43  -36.86   80.22 |  691.68  634.45  771.84 |-1295.48-1271.95-1252.95 | 1354.00 1306.03 1314.68
v_i      |   -0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.08   -0.09   -0.10 |    0.09    0.10    0.10
norm_rf  |    0.21 |    0.08 |    0.02 |    0.49
norm_vf  |    0.08 |    0.01 |    0.04 |    0.13
gs_f     |    1.65 |    3.40 |   

ADV1:  -0.0011249561444091932 0.009899971136921983 0.08433949018317793 -0.0639110384280775
ADV2:  0.01861962853906054 0.8882273986838823 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3382   1.0383   5.3353  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0007   0.0030   8.0871   2.2896   2.8947
***** Episode 71937, Mean R = -19.5  Std R = 5.7  Min R = -32.1
PolicyLoss: -0.0142
Policy_Beta: 0.1
Policy_Entropy: 0.156
Policy_KL: 0.00103
Policy_SD: 0.544
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.63e+07
VF_0_ExplainedVarNew: 0.983
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.00234


ADV1:  0.0013475676591895953 0.007704914531224782 0.04819656551170104 -0.062248008325846205
ADV2:  -0.0019721900460216812 0.8915723841746244 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0425   1.0871   6.0990  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0017   0.0009   0.0036   8.0871   2.2896   2.8

ADV1:  0.0004226981251964952 0.008880131887504037 0.06394257834148143 -0.06890436541399814
ADV2:  0.014123816767594721 0.8554492160066945 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6478   0.9733   5.0655  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0007   0.0026   8.0871   2.2896   2.8947
***** Episode 72216, Mean R = -17.7  Std R = 5.4  Min R = -32.0
PolicyLoss: -0.0221
Policy_Beta: 0.1
Policy_Entropy: 0.155
Policy_KL: 0.000913
Policy_SD: 0.53
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.64e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.0036


ADV1:  0.0019762271243452104 0.009407562722642244 0.06990416923623155 -0.06721149374933189
ADV2:  0.0011935325170759257 0.8614301534543849 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   5.7320   4.1946  16.3229  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0015   0.0059   8.0871   2.2896   2.894

ADV1:  -0.0008851840192025418 0.009996633572355015 0.06062007478743242 -0.09808291597365071
ADV2:  0.020094188598743193 0.8809133843765242 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9009   0.7167   3.9097  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0007   0.0025   8.0871   2.2896   2.8947
***** Episode 72495, Mean R = -18.2  Std R = 5.6  Min R = -30.6
PolicyLoss: -0.0187
Policy_Beta: 0.1
Policy_Entropy: 0.157
Policy_KL: 0.00107
Policy_SD: 0.529
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.65e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 0.0024


ADV1:  7.908861748235285e-05 0.01006256518044818 0.19507376341157423 -0.09253123279211767
ADV2:  -0.0011415660203249116 0.7528213183938797 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0786   0.6990   3.5556  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0001   0.0005   8.0871   2.2896   2.894

***** Episode 72743, Mean R = -18.8  Std R = 5.8  Min R = -32.0
PolicyLoss: -0.00746
Policy_Beta: 0.1
Policy_Entropy: 0.158
Policy_KL: 0.00108
Policy_SD: 0.536
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 2.66e+07
VF_0_ExplainedVarNew: 0.976
VF_0_ExplainedVarOld: 0.972
VF_0_Loss : 0.00303


ADV1:  0.0018155766419349145 0.007322614985119517 0.05974949526215312 -0.06664278448320798
ADV2:  -0.016074323347021573 0.8547389715328095 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8529   1.3124   6.8250  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0015   0.0056   8.0871   2.2896   2.8947
***** Episode 72774, Mean R = -16.4  Std R = 4.0  Min R = -26.6
PolicyLoss: -0.00736
Policy_Beta: 0.1
Policy_Entropy: 0.156
Policy_KL: 0.00115
Policy_SD: 0.541
Policy_lr_mult: 0.198
Steps: 1.13e+04
TotalSteps: 2.66e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 0.00307


ADV1:  4.166667757378955e-05 0.007299474419890623 0.0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.6326   2.0713  11.2011  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0006   0.0024   8.0871   2.2896   2.8947
***** Episode 73022, Mean R = -19.3  Std R = 5.4  Min R = -36.9
PolicyLoss: -0.0324
Policy_Beta: 0.1
Policy_Entropy: 0.152
Policy_KL: 0.00118
Policy_SD: 0.556
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.67e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.00578


ADV1:  -0.0023140185416670113 0.02779090186511911 0.30538272275619893 -0.6912183187476741
ADV2:  0.027253395128854503 0.4570747029804802 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.8772   0.4727   2.1199  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0025   0.0014   0.0056   8.0871   2.2896   2.8947
***** Episode 73053, Mean R = -22.3  Std R = 24.6  Min R = -154.1
PolicyLoss: -0.025
Policy_Beta: 0.1
Policy_Entropy: 0.154
Policy_KL: 0.000775
Pol

ADV1:  0.0008090503128722259 0.009630640918284927 0.07205279863303399 -0.08576579433908582
ADV2:  0.011734626576752465 0.8346746838961044 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8847   0.8784   3.4578  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0013   0.0045   8.0871   2.2896   2.8947
***** Episode 73301, Mean R = -19.3  Std R = 5.5  Min R = -33.6
PolicyLoss: -0.0219
Policy_Beta: 0.1
Policy_Entropy: 0.155
Policy_KL: 0.000978
Policy_SD: 0.55
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.68e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.00302


ADV1:  0.0019156994957499308 0.010454544687337385 0.07841321589634409 -0.0795131555126668
ADV2:  -9.87374619170068e-06 0.8838331734295782 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5439   1.2448   5.3630  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0012   0.0051   8.0871   2.2896   2.894

ADV1:  -0.0009331543289472416 0.0063424340151249595 0.05843074366871237 -0.06251885384250422
ADV2:  0.00915191197516421 0.8685037190774828 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.6029   3.8600  14.6155  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0025   8.0871   2.2896   2.8947
***** Episode 73580, Mean R = -16.9  Std R = 4.2  Min R = -29.9
PolicyLoss: -0.000181
Policy_Beta: 0.1
Policy_Entropy: 0.155
Policy_KL: 0.00063
Policy_SD: 0.541
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 2.69e+07
VF_0_ExplainedVarNew: 0.992
VF_0_ExplainedVarOld: 0.991
VF_0_Loss : 0.00435


ADV1:  -0.0033685636450420764 0.010139631116768789 0.07001615892262125 -0.06513665961520546
ADV2:  0.04704828884200893 0.8647802689508718 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.9883   2.1415   8.8419  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0041   0.0025   0.0089   8.0871   2.2896   2.

ADV1:  0.00044320971759999583 0.008418093586263475 0.047324154423866394 -0.06967960698765846
ADV2:  0.017930142710751266 0.844962383140647 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0387   0.5415   2.3379  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0013   8.0871   2.2896   2.8947
***** Episode 73859, Mean R = -17.9  Std R = 5.0  Min R = -31.8
PolicyLoss: -0.0274
Policy_Beta: 0.1
Policy_Entropy: 0.155
Policy_KL: 0.00111
Policy_SD: 0.556
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 2.7e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.00394


ADV1:  -0.0030971359743794686 0.010344496466202977 0.056480701066379146 -0.10199997051194831
ADV2:  0.03674049102424477 0.8672483150100379 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0027   1.0384   4.4639  29.5271  16.8478  11.1535
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0038   0.0022   0.0084   8.0871   2.2896   2.89

seeker_angles |   -0.00    0.00 |    0.08    0.09 |   -0.97   -1.00 |    0.99    0.98
cs_angles | -0.0017  0.0011 |  0.0819  0.0852 | -0.9730 -1.0000 |  0.9923  0.9806
optical_flow | -0.0001 -0.0000 |  0.0232  0.0271 | -0.9285 -1.2550 |  1.0026  1.2083
v_err    | -0.0094 |  0.0559 | -0.4582 |  0.1206
landing_rewards |    9.42 |    2.34 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.07 |    0.02
tracking_rewards |  -22.69 |    4.62 |  -46.85 |  -15.05
steps    |     377 |      20 |     328 |     420
***** Episode 74138, Mean R = -19.0  Std R = 6.0  Min R = -34.7
PolicyLoss: -0.0179
Policy_Beta: 0.1
Policy_Entropy: 0.157
Policy_KL: 0.00102
Policy_SD: 0.548
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.71e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.976
VF_0_Loss : 0.00429


ADV1:  0.0027749847587677616 0.007411546743242607 0.05382807622782931 -0.08460263680141317
ADV2:  -0.020315922984943693 0.8849071524398913 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max

attitude |   -0.06   -0.00   -0.16 |    1.19    0.63    1.84 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.07 |    0.09    0.07    0.06
a_f      |    0.01   -0.22 |    0.63    1.83 |   -1.51   -3.14 |    1.51    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.03   -0.03 |    0.03    0.02    0.04
w_rewards |   -0.39 |    0.42 |   -5.64 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    3.06
seeker_angles |    0.00    0.01 |    0.08    0.08 |   -0.99   -0.99 |    0.99    1.00
cs_angles |  0.0035  0.0071 |  0.0827  0.0844 | -0.9944 -0.9895 |  0.9883  0.9955
optical_flow | -0.0002 -0.0001 |  0.0248  0.0250 | -1.1629 -1.0718 |  1.1046  1.0952
v_err    | -0.0093 |  0.0561 | -0.4517 |  0.1002
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |    2

attitude |   -0.10   -0.01   -0.04 |    1.27    0.70    1.87 |   -3.14   -1.57   -3.14 |    3.14    1.53    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |   -0.02    0.02 |    0.70    1.85 |   -1.41   -3.11 |    1.52    3.11
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.38 |    0.30 |   -2.61 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.02
seeker_angles |    0.00    0.00 |    0.09    0.08 |   -0.99   -1.00 |    0.99    0.98
cs_angles |  0.0009  0.0020 |  0.0852  0.0838 | -0.9911 -0.9974 |  0.9936  0.9845
optical_flow | -0.0001 -0.0001 |  0.0234  0.0254 | -0.9121 -1.1236 |  1.0569  1.1463
v_err    | -0.0095 |  0.0560 | -0.4534 |  0.1205
landing_rewards |    9.52 |    2.15 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.01    0.04   -0.20 |    1.16    0.66    1.77 |   -3.14   -1.54   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.09    0.07    0.05
a_f      |    0.05   -0.20 |    0.65    1.76 |   -1.31   -3.12 |    1.44    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.38 |    0.31 |   -3.58 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.09
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.99   -1.00 |    1.00    0.94
cs_angles |  0.0020  0.0035 |  0.0821  0.0856 | -0.9872 -0.9985 |  0.9953  0.9406
optical_flow | -0.0000 -0.0000 |  0.0247  0.0256 | -1.1156 -1.2057 |  1.1185  0.9521
v_err    | -0.0095 |  0.0558 | -0.4601 |  0.1998
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.04    0.01   -0.12 |    1.15    0.66    1.77 |   -3.14   -1.54   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |    0.01   -0.22 |    0.66    1.77 |   -1.46   -3.13 |    1.52    3.07
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.39 |    0.25 |   -1.49 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.09
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -1.00   -1.00 |    1.00    0.99
cs_angles |  0.0012  0.0006 |  0.0828  0.0861 | -0.9950 -0.9995 |  0.9961  0.9943
optical_flow | -0.0000  0.0000 |  0.0246  0.0255 | -1.1424 -1.2686 |  1.0743  1.4546
v_err    | -0.0096 |  0.0558 | -0.4534 |  0.1188
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.02    0.05   -0.13 |    1.19    0.65    1.85 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.07 |    0.08    0.08    0.05
a_f      |    0.05   -0.08 |    0.66    1.84 |   -1.44   -3.12 |    1.52    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.02   -0.03 |    0.02    0.02    0.02
w_rewards |   -0.42 |    0.28 |   -2.43 |   -0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    2.98
seeker_angles |    0.00    0.00 |    0.09    0.08 |   -0.98   -0.97 |    1.00    0.98
cs_angles |  0.0021  0.0020 |  0.0868  0.0827 | -0.9800 -0.9696 |  0.9975  0.9837
optical_flow | -0.0001 -0.0001 |  0.0243  0.0255 | -1.3440 -1.1086 |  1.0679  1.2352
v_err    | -0.0096 |  0.0562 | -0.4516 |  0.2413
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |    2

attitude |    0.03   -0.05    0.12 |    1.19    0.66    1.82 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.08    0.07    0.07
a_f      |   -0.05    0.13 |    0.66    1.80 |   -1.54   -3.12 |    1.50    3.11
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.02    0.04    0.02
w_rewards |   -0.39 |    0.32 |   -2.67 |   -0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    3.02
seeker_angles |   -0.00    0.00 |    0.08    0.09 |   -1.00   -0.99 |    0.99    0.99
cs_angles | -0.0008  0.0011 |  0.0779  0.0860 | -0.9991 -0.9854 |  0.9872  0.9928
optical_flow | -0.0002  0.0000 |  0.0237  0.0262 | -0.8813 -1.1883 |  1.0329  1.1946
v_err    | -0.0097 |  0.0560 | -0.4537 |  0.1095
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.07    0.02    0.14 |    1.17    0.67    1.82 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.09    0.07    0.05
a_f      |    0.03    0.08 |    0.67    1.81 |   -1.51   -3.11 |    1.49    3.11
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.02    0.02    0.02
w_rewards |   -0.45 |    0.29 |   -1.97 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.01
seeker_angles |   -0.00   -0.00 |    0.08    0.08 |   -0.99   -0.97 |    0.99    1.00
cs_angles | -0.0001 -0.0008 |  0.0817  0.0841 | -0.9926 -0.9709 |  0.9929  0.9993
optical_flow | -0.0000  0.0000 |  0.0233  0.0256 | -1.2011 -1.0198 |  1.0749  1.2661
v_err    | -0.0095 |  0.0560 | -0.4519 |  0.1900
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |    0.04    0.03 |    0.62    1.77 |   -1.42   -3.14 |    1.50    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.03    0.03    0.02
w_rewards |   -0.43 |    0.34 |   -4.07 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.98
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.99   -0.97 |    0.94    0.98
cs_angles | -0.0003  0.0026 |  0.0807  0.0829 | -0.9887 -0.9672 |  0.9354  0.9801
optical_flow | -0.0001 -0.0002 |  0.0227  0.0263 | -1.1827 -1.1356 |  0.8819  1.3837
v_err    | -0.0096 |  0.0561 | -0.4530 |  0.1345
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.07 |    0.03
tracking_rewards |  -22.52 |    4.57 |  -47.69 |  -13.80
steps    |     379 |  

attitude |   -0.02   -0.04    0.13 |    1.24    0.64    1.91 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |   -0.04    0.12 |    0.64    1.89 |   -1.48   -3.14 |    1.53    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.44 |    0.28 |   -1.74 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    3.07
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    0.95    0.98
cs_angles | -0.0019  0.0026 |  0.0801  0.0832 | -0.9868 -0.9972 |  0.9508  0.9761
optical_flow | -0.0001 -0.0001 |  0.0221  0.0233 | -0.9923 -1.1200 |  1.0337  0.9356
v_err    | -0.0094 |  0.0554 | -0.4522 |  0.1538
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.04    0.02   -0.12 |    1.11    0.67    1.71 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.06   -0.07 |    0.08    0.08    0.07
a_f      |    0.02   -0.12 |    0.67    1.72 |   -1.48   -3.12 |    1.52    3.11
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.02   -0.03 |    0.03    0.03    0.02
w_rewards |   -0.42 |    0.33 |   -2.67 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.32 |    0.00 |    3.02
seeker_angles |   -0.00    0.00 |    0.09    0.09 |   -0.99   -1.00 |    0.99    1.00
cs_angles | -0.0004  0.0018 |  0.0857  0.0898 | -0.9927 -0.9951 |  0.9892  0.9981
optical_flow | -0.0002  0.0001 |  0.0245  0.0252 | -1.2852 -1.2051 |  1.1463  1.2531
v_err    | -0.0100 |  0.0568 | -0.6060 |  0.2113
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |    3

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.07 |    0.08    0.08    0.05
a_f      |   -0.04   -0.05 |    0.66    1.87 |   -1.43   -3.13 |    1.47    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.03   -0.03 |    0.03    0.03    0.02
w_rewards |   -0.43 |    0.33 |   -2.72 |   -0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.32 |    0.00 |    3.01
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.99   -0.98 |    0.95    1.00
cs_angles |  0.0023  0.0017 |  0.0817  0.0854 | -0.9929 -0.9782 |  0.9542  0.9986
optical_flow | -0.0001 -0.0001 |  0.0242  0.0269 | -1.2228 -1.1084 |  1.0875  1.4310
v_err    | -0.0097 |  0.0562 | -0.4516 |  0.1233
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |    3.03 |   53.69 |   -0.06 |  946.84
tracking_rewards |  -22.77 |    4.97 |  -46.16 |  -12.85
steps    |     376 |  

attitude |    0.06    0.01   -0.13 |    1.15    0.66    1.79 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.08    0.08    0.05
a_f      |    0.02   -0.17 |    0.66    1.80 |   -1.41   -3.14 |    1.48    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.02    0.03    0.01
w_rewards |   -0.41 |    0.30 |   -2.50 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.32 |    0.00 |    3.02
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.97 |    0.97    0.99
cs_angles |  0.0005  0.0026 |  0.0841  0.0807 | -0.9893 -0.9746 |  0.9709  0.9899
optical_flow | -0.0000  0.0000 |  0.0222  0.0252 | -0.9368 -1.1740 |  0.8407  1.0048
v_err    | -0.0096 |  0.0563 | -0.4530 |  0.1079
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.00   -0.01   -0.12 |    1.21    0.60    1.89 |   -3.14   -1.54   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |   -0.02   -0.12 |    0.60    1.89 |   -1.42   -3.13 |    1.46    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.44 |    0.28 |   -2.38 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.32 |    0.00 |    3.07
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -0.97 |    0.89    0.97
cs_angles |  0.0012  0.0013 |  0.0854  0.0881 | -0.9889 -0.9748 |  0.8863  0.9744
optical_flow | -0.0001 -0.0001 |  0.0243  0.0253 | -1.0715 -1.1641 |  0.9845  1.2140
v_err    | -0.0093 |  0.0566 | -0.4525 |  0.1660
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.02   -0.03   -0.02 |    1.15    0.67    1.85 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.08    0.07    0.06
a_f      |   -0.02   -0.07 |    0.66    1.85 |   -1.47   -3.11 |    1.49    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.44 |    0.28 |   -1.66 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.32 |    0.00 |    2.96
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    0.98    1.00
cs_angles |  0.0003  0.0014 |  0.0836  0.0846 | -0.9945 -0.9999 |  0.9774  0.9962
optical_flow | -0.0002 -0.0001 |  0.0235  0.0261 | -1.1517 -1.1194 |  0.9284  1.1007
v_err    | -0.0090 |  0.0564 | -0.4526 |  0.1734
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0

glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.05 |   12.89 |    0.01 |  622.88
norm_af  |    1.70 |    0.94 |    0.01 |    3.34
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.07   -0.02   -0.18 |    1.19    0.68    1.81 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.07 |    0.08    0.08    0.05
a_f      |   -0.03   -0.21 |    0.68    1.81 |   -1.49   -3.13 |    1.49    3.12
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.02    0.03    0.01
w_rewards |   -0.44 |    0.29 |   -2.97 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.11
seeker_angles | 

attitude |    0.15   -0.03    0.02 |    1.13    0.62    1.85 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.08    0.07    0.05
a_f      |   -0.03    0.02 |    0.62    1.84 |   -1.33   -3.12 |    1.35    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.04    0.02
w_rewards |   -0.42 |    0.26 |   -1.79 |   -0.01
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.32 |    0.00 |    3.02
seeker_angles |   -0.00   -0.00 |    0.08    0.09 |   -0.99   -1.00 |    0.98    0.98
cs_angles | -0.0039 -0.0009 |  0.0823  0.0857 | -0.9905 -0.9979 |  0.9762  0.9788
optical_flow | -0.0000 -0.0001 |  0.0233  0.0249 | -1.1404 -1.1149 |  1.0850  1.3416
v_err    | -0.0089 |  0.0562 | -0.4534 |  0.1090
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.04    0.08    0.11 |    1.22    0.68    1.80 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.08 |    0.08    0.07    0.05
a_f      |    0.08    0.15 |    0.66    1.78 |   -1.36   -3.14 |    1.43    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.02    0.02    0.02
w_rewards |   -0.44 |    0.27 |   -1.70 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.32 |    0.00 |    2.89
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.99   -0.99 |    1.00    1.00
cs_angles |  0.0000  0.0036 |  0.0853  0.0858 | -0.9856 -0.9896 |  0.9999  0.9992
optical_flow | -0.0001 -0.0002 |  0.0237  0.0253 | -1.2534 -1.3082 |  1.2097  1.0907
v_err    | -0.0090 |  0.0565 | -0.4521 |  0.1158
landing_rewards |    9.42 |    2.34 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.00    0.00    0.29 |    1.25    0.66    1.86 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |    0.00    0.31 |    0.65    1.85 |   -1.55   -3.13 |    1.53    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.04   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.43 |    0.35 |   -4.46 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.32 |    0.00 |    2.98
seeker_angles |   -0.00   -0.00 |    0.08    0.09 |   -0.97   -1.00 |    0.98    1.00
cs_angles | -0.0020 -0.0011 |  0.0804  0.0874 | -0.9725 -0.9965 |  0.9758  0.9973
optical_flow | -0.0000  0.0000 |  0.0235  0.0247 | -1.1881 -1.1407 |  1.3865  1.6035
v_err    | -0.0090 |  0.0567 | -0.4535 |  0.2102
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.09    0.07    0.05
a_f      |   -0.00   -0.05 |    0.67    1.81 |   -1.48   -3.14 |    1.48    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.03 |    0.03    0.02    0.02
w_rewards |   -0.47 |    0.37 |   -3.46 |   -0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.11
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    1.00    0.99
cs_angles |  0.0005  0.0036 |  0.0799  0.0829 | -0.9930 -0.9981 |  0.9982  0.9897
optical_flow | -0.0001 -0.0002 |  0.0232  0.0259 | -1.2579 -1.6140 |  1.0685  1.1164
v_err    | -0.0094 |  0.0568 | -0.4513 |  0.1076
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.07 |    0.03
tracking_rewards |  -22.52 |    4.78 |  -42.63 |  -14.22
steps    |     376 |  

thrust   |   -0.00    0.00    0.00 |    0.70    0.69    0.70 |   -3.45   -3.39   -3.45 |    3.39    3.42    3.41
norm_thrust |    0.93 |    0.77 |    0.00 |    3.46
fuel     |    1.58 |    0.22 |    0.31 |    2.39
rewards  |  -18.75 |    8.47 | -117.24 |   -7.44
fuel_rewards |   -4.53 |    0.62 |   -6.84 |   -0.89
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.85 |   16.65 |    0.01 | 3678.15
norm_af  |    1.72 |    0.87 |    0.10 |    3.21
norm_wf  |    0.01 |    0.01 |    0.00 |    0.10
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.02   -0.02   -0.01 |    1.14    0.63    1.82 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |   -0.02   -0.00 |    0.63

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1356   1.5491   6.8366  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0008   0.0029   8.0871   2.2896   2.8947
Update Cnt = 2600    ET =   1106.9   Stats:  Mean, Std, Min, Max
r_f      |    5.06  -24.95  -11.25 |  190.57  170.97  197.91 | -383.51 -393.23 -392.08 |  396.82  390.15  395.77
v_f      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.10   -0.08   -0.10 |    0.09    0.10    0.09
r_i      |   24.97  -65.06  -59.31 |  691.10  673.74  738.37 |-1361.08-1293.91-1343.10 | 1359.35 1281.43 1264.55
v_i      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.09    0.10
norm_rf  |    0.20 |    0.09 |    0.02 |    0.44
norm_vf  |    0.07 |    0.01 |    0.04 |    0.12
gs_f     |    1.24 |    2.01 |    0.01 |   22.43
thrust   |    0.00    0.00    0.01 |    0.69    0.71    0.69 |   -3.44   -3.46   -3.37 |    3.46    3.43    3.43
norm_thrust |    

ADV1:  -0.0002732792969720121 0.013367637095336277 0.23543601322000102 -0.17627479424061376
ADV2:  0.003676503324603565 0.7829898919870437 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7622   0.7292   3.5657  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0008   8.0871   2.2896   2.8947
***** Episode 80927, Mean R = -19.7  Std R = 6.7  Min R = -41.8
PolicyLoss: -0.00552
Policy_Beta: 0.1
Policy_Entropy: 0.157
Policy_KL: 0.00105
Policy_SD: 0.563
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 2.97e+07
VF_0_ExplainedVarNew: 0.974
VF_0_ExplainedVarOld: 0.967
VF_0_Loss : 0.00406


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.0010340877529476254 0.010977404454445136 0.07973034327364698 -0.09679796011748337
ADV2:  0.0031511184281054192 0.854157333578144 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.1014   1.7950   8.6727  29.5271  16.8478  11.4563
ValFun 

ADV1:  0.004136052198904885 0.009364522203751039 0.07626418850178263 -0.06947575400541228
ADV2:  -0.013632795462276423 0.840324472225061 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.8789   1.6187   8.6585  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0053   0.0030   0.0111   8.0871   2.2896   2.8947
***** Episode 81206, Mean R = -17.9  Std R = 5.1  Min R = -35.0
PolicyLoss: -0.021
Policy_Beta: 0.1
Policy_Entropy: 0.159
Policy_KL: 0.00137
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 2.98e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.0027


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.003159976976245108 0.011741362702227792 0.0677899775953679 -0.07121711517249965
ADV2:  0.025696541444267203 0.9132773313516258 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6477   0.7483   3.2930  29.5271  16.8478  11.4563
ValFun  Gradie

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.00121409545349175 0.009605623929027408 0.07703353965879539 -0.127556020229449
ADV2:  0.028710133595998014 0.749601070710269 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4495   0.6886   3.5885  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0009   0.0033   8.0871   2.2896   2.8947
***** Episode 81485, Mean R = -19.4  Std R = 5.2  Min R = -34.6
PolicyLoss: -0.0254
Policy_Beta: 0.1
Policy_Entropy: 0.158
Policy_KL: 0.00109
Policy_SD: 0.545
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 2.99e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00261


ADV1:  0.0023538632108515193 0.009542448808197624 0.08585580591442565 -0.05040229560319792
ADV2:  -0.008705091925936428 0.8543751272184454 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3906   0.5609   3.1173  29.5271  16.8478  11.4563
ValFun  Grad

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0020166326573428615 0.009550737081443992 0.0590774465496936 -0.10147257766606321
ADV2:  0.03328889753766743 0.8361851535048433 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4023   0.7983   3.5228  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0023   0.0013   0.0053   8.0871   2.2896   2.8947
***** Episode 81764, Mean R = -17.4  Std R = 5.8  Min R = -31.3
PolicyLoss: -0.0218
Policy_Beta: 0.1
Policy_Entropy: 0.159
Policy_KL: 0.000833
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.00242


ADV1:  -0.0007031477092696372 0.010729525356148151 0.060055419874907534 -0.08192247156378546
ADV2:  0.02246656995036603 0.8670348117663749 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6630   1.5668   8.0582  29.5271  16.8478  11.4563
ValFun  Grad

***** Episode 82012, Mean R = -20.0  Std R = 9.3  Min R = -54.6
PolicyLoss: -0.0347
Policy_Beta: 0.1
Policy_Entropy: 0.159
Policy_KL: 0.000946
Policy_SD: 0.55
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 3.01e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.975
VF_0_Loss : 0.00188


ADV1:  0.0013054423935611585 0.009936247299379246 0.06466069762963955 -0.13488938249361393
ADV2:  0.00328693919906602 0.8190654447373649 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2496   1.4358   6.4310  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0035   8.0871   2.2896   2.8947
***** Episode 82043, Mean R = -18.3  Std R = 6.9  Min R = -37.9
PolicyLoss: -0.0184
Policy_Beta: 0.1
Policy_Entropy: 0.159
Policy_KL: 0.00112
Policy_SD: 0.548
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.01e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.00196


ADV1:  -0.0012682662654377832 0.014519001534380429 0.331

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0272   1.0687   5.5870  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0013   0.0046   8.0871   2.2896   2.8947
***** Episode 82291, Mean R = -17.5  Std R = 4.1  Min R = -27.1
PolicyLoss: -0.00224
Policy_Beta: 0.1
Policy_Entropy: 0.162
Policy_KL: 0.00116
Policy_SD: 0.538
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.02e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 0.00269


ADV1:  -0.0007058546312708244 0.010133906655841785 0.05196099228691625 -0.12069402842199634
ADV2:  0.0253275296987055 0.8517489534713848 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3649   0.7547   2.9508  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0007   0.0025   8.0871   2.2896   2.8947
***** Episode 82322, Mean R = -17.8  Std R = 5.2  Min R = -30.4
PolicyLoss: -0.0258
Policy_Beta: 0.1
Policy_Entropy: 0.161
Policy_KL: 0.000969
Po

ADV1:  0.001658038512262232 0.008876529256749068 0.07796475532656555 -0.19424682307558816
ADV2:  0.0071707668303151425 0.6781232643322647 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5456   1.4631   5.6984  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0011   0.0044   8.0871   2.2896   2.8947
***** Episode 82570, Mean R = -17.4  Std R = 4.5  Min R = -29.6
PolicyLoss: -0.026
Policy_Beta: 0.1
Policy_Entropy: 0.161
Policy_KL: 0.00116
Policy_SD: 0.546
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.03e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00175


ADV1:  -0.0014936955874462045 0.008627710241638855 0.07458125389483172 -0.13347951313499984
ADV2:  0.016441503991579377 0.8307737102313771 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6918   0.7171   3.8904  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0011   0.0045   8.0871   2.2896   2.894

ADV1:  0.0005546102184412509 0.009764922125295722 0.0983400592891997 -0.08286765696457443
ADV2:  0.00996388405494239 0.8495155891855042 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1783   1.0714   4.7537  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0004   0.0017   8.0871   2.2896   2.8947
***** Episode 82849, Mean R = -20.5  Std R = 5.8  Min R = -36.7
PolicyLoss: -0.019
Policy_Beta: 0.1
Policy_Entropy: 0.16
Policy_KL: 0.000937
Policy_SD: 0.562
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 3.04e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00172


ADV1:  -0.0015514328564654994 0.009301828861981587 0.10019412356744795 -0.05745376833567055
ADV2:  0.021434046376469576 0.8506862318685573 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7286   0.8305   3.9184  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0011   0.0041   8.0871   2.2896   2.8947


theta_cv |    0.27 |    0.31 |    0.00 |    3.01
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.95   -1.00 |    1.00    1.00
cs_angles |  0.0027  0.0032 |  0.0853  0.0878 | -0.9518 -0.9973 |  0.9952  0.9960
optical_flow | -0.0001 -0.0000 |  0.0233  0.0258 | -1.2621 -1.3059 |  1.2023  1.1734
v_err    | -0.0090 |  0.0569 | -0.4535 |  0.1980
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -23.13 |    5.10 |  -49.15 |  -14.48
steps    |     374 |      20 |     334 |     416
***** Episode 83128, Mean R = -17.0  Std R = 4.9  Min R = -28.2
PolicyLoss: -0.00859
Policy_Beta: 0.1
Policy_Entropy: 0.162
Policy_KL: 0.000974
Policy_SD: 0.532
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.05e+07
VF_0_ExplainedVarNew: 0.992
VF_0_ExplainedVarOld: 0.991
VF_0_Loss : 0.00176


ADV1:  -0.0005930258336904674 0.008230476245347852 0.0600263265970753 -0.15238741464658007
ADV2:  0.023255348081235992 0.7215481441096

attitude |    0.09   -0.01   -0.01 |    1.28    0.64    1.94 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.07 |    0.09    0.07    0.05
a_f      |   -0.02   -0.07 |    0.63    1.94 |   -1.48   -3.14 |    1.41    3.10
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.44 |    0.78 |  -12.96 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.32 |    0.00 |    3.12
seeker_angles |    0.00    0.00 |    0.09    0.09 |   -0.98   -0.99 |    0.97    0.98
cs_angles |  0.0020  0.0035 |  0.0855  0.0875 | -0.9751 -0.9948 |  0.9741  0.9803
optical_flow | -0.0001 -0.0001 |  0.0232  0.0255 | -1.4263 -1.0366 |  1.2683  1.1301
v_err    | -0.0098 |  0.0602 | -0.6448 |  0.2662
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0

thrust   |    0.00    0.00   -0.01 |    0.68    0.67    0.68 |   -3.41   -3.46   -3.46 |    3.35    3.46    3.37
norm_thrust |    0.90 |    0.76 |    0.00 |    3.46
fuel     |    1.52 |    0.18 |    1.12 |    2.07
rewards  |  -17.53 |    5.75 |  -42.03 |   -8.22
fuel_rewards |   -4.36 |    0.52 |   -5.92 |   -3.20
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.13 |   13.23 |    0.01 |  612.45
norm_af  |    1.77 |    0.92 |    0.15 |    3.39
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.02   -0.02   -0.21 |    1.26    0.67    1.86 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |   -0.03   -0.18 |    0.68

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4489   0.4652   2.4092  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0053   0.0031   0.0115   8.0871   2.2896   2.8947
Update Cnt = 2710    ET =   1279.3   Stats:  Mean, Std, Min, Max
r_f      |    5.28   -0.07   -8.62 |  188.75  169.67  198.93 | -392.27 -389.12 -390.61 |  392.18  375.40  375.02
v_f      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.10   -0.09 |    0.09    0.09    0.10
r_i      |   36.36    3.05  -31.59 |  685.00  658.85  767.76 |-1311.43-1368.97-1266.05 | 1290.41 1344.90 1317.50
v_i      |   -0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.10   -0.09 |    0.09    0.10    0.10
norm_rf  |    0.20 |    0.08 |    0.03 |    0.43
norm_vf  |    0.07 |    0.01 |    0.03 |    0.11
gs_f     |    1.23 |    1.60 |    0.02 |   11.99
thrust   |    0.00    0.00    0.00 |    0.67    0.68    0.67 |   -3.46   -3.46   -3.46 |    3.39    3.45    3.46
norm_thrust |    

ADV1:  0.0013675837373269806 0.007703382651265524 0.050748905557300605 -0.10801957368850704
ADV2:  0.0057446725946187 0.8500026201356945 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7551   0.6842   4.2098  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0010   0.0035   8.0871   2.2896   2.8947
***** Episode 84337, Mean R = -16.9  Std R = 4.1  Min R = -29.2
PolicyLoss: -0.0204
Policy_Beta: 0.1
Policy_Entropy: 0.159
Policy_KL: 0.00119
Policy_SD: 0.539
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 3.1e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.00121


ADV1:  -0.003019761665525087 0.009049630809376177 0.044981564151698405 -0.08148872663967976
ADV2:  0.03968765548332717 0.8796226853637638 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9205   1.2005   4.8704  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0035   0.0022   0.0079   8.0871   2.2896   2.8947
U

ADV1:  0.0012892747271407389 0.007925796106600528 0.19954080895168386 -0.08081968312358229
ADV2:  -0.019127571630648006 0.7628165612491663 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4265   1.7247   5.7907  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0016   0.0009   0.0035   8.0871   2.2896   2.8947
***** Episode 84616, Mean R = -18.6  Std R = 5.9  Min R = -33.3
PolicyLoss: 0.00361
Policy_Beta: 0.1
Policy_Entropy: 0.159
Policy_KL: 0.00084
Policy_SD: 0.559
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.11e+07
VF_0_ExplainedVarNew: 0.992
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 0.000975


ADV1:  -0.0019812972780905804 0.008542322102834943 0.05973865764145525 -0.10175301901446726
ADV2:  0.0342272340290011 0.8215010121335907 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6959   0.7601   3.3887  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0014   0.0052   8.0871   2.2896   2.89

***** Episode 84864, Mean R = -17.6  Std R = 6.6  Min R = -37.1
PolicyLoss: -0.00885
Policy_Beta: 0.1
Policy_Entropy: 0.16
Policy_KL: 0.000976
Policy_SD: 0.538
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.12e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.000384


ADV1:  -0.0005059564437109333 0.009348885015570366 0.06269596733777538 -0.11556993564322288
ADV2:  0.025997889230177252 0.7893114056536522 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8362   0.9203   5.1389  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0005   0.0021   8.0871   2.2896   2.8947
***** Episode 84895, Mean R = -19.4  Std R = 6.3  Min R = -37.4
PolicyLoss: -0.0276
Policy_Beta: 0.1
Policy_Entropy: 0.159
Policy_KL: 0.000957
Policy_SD: 0.557
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.12e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.000664


ADV1:  -0.0015158991334959268 0.011345034311080878

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6620   1.4891   5.2638  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0007   0.0027   8.0871   2.2896   2.8947
***** Episode 85143, Mean R = -17.5  Std R = 4.6  Min R = -29.5
PolicyLoss: -0.0161
Policy_Beta: 0.1
Policy_Entropy: 0.162
Policy_KL: 0.00134
Policy_SD: 0.531
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.13e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 0.000489


ADV1:  0.00015174597137188132 0.007774126530943788 0.057778052329278407 -0.0677410797294622
ADV2:  0.0035648496590798954 0.8780279796462935 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0287   1.2953   6.2527  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0014   8.0871   2.2896   2.8947
***** Episode 85174, Mean R = -18.4  Std R = 6.1  Min R = -38.5
PolicyLoss: -0.0085
Policy_Beta: 0.1
Policy_Entropy: 0.162
Policy_KL: 0.000974


ADV1:  0.0011567058271719003 0.007773449540523122 0.04556297780221852 -0.1210082487839369
ADV2:  0.01083956978190932 0.7944087496398051 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4549   1.0071   4.9938  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0009   0.0035   8.0871   2.2896   2.8947
***** Episode 85422, Mean R = -18.2  Std R = 6.2  Min R = -30.7
PolicyLoss: -0.0263
Policy_Beta: 0.1
Policy_Entropy: 0.163
Policy_KL: 0.0009
Policy_SD: 0.547
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.14e+07
VF_0_ExplainedVarNew: 0.993
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 0.000555


ADV1:  -0.0006729150804354238 0.007287275428454033 0.04594404098317453 -0.07777627447051216
ADV2:  0.023723490836888256 0.8431117003839179 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4428   1.7179   7.4360  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0027   8.0871   2.2896   2.8947

ADV1:  -0.001194204166405955 0.014453586752377033 0.3677428930952209 -0.2096821537268122
ADV2:  0.017875506116598723 0.6098519380984279 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0550   0.6480   3.5502  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0010   0.0034   8.0871   2.2896   2.8947
***** Episode 85701, Mean R = -19.2  Std R = 7.3  Min R = -41.7
PolicyLoss: -0.0147
Policy_Beta: 0.1
Policy_Entropy: 0.161
Policy_KL: 0.000819
Policy_SD: 0.543
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.15e+07
VF_0_ExplainedVarNew: 0.978
VF_0_ExplainedVarOld: 0.964
VF_0_Loss : 0.000997


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.0016107590905919682 0.009072814093069991 0.0816935548336245 -0.048227466571216515
ADV2:  -0.027615471889649176 0.837108200548519 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3246   0.5441   2.6798  29.5271  16.8478  11.4563
ValFun  G

ADV1:  0.0009981021846943623 0.008831495714842232 0.19445903953256116 -0.07611355234071415
ADV2:  -0.027918235138491027 0.7484445290733356 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4833   0.7718   3.7046  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0032   8.0871   2.2896   2.8947
***** Episode 85980, Mean R = -17.3  Std R = 5.2  Min R = -30.8
PolicyLoss: 0.0187
Policy_Beta: 0.1
Policy_Entropy: 0.159
Policy_KL: 0.000937
Policy_SD: 0.556
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 3.16e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00114


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.0010302812213969666 0.012351719038179837 0.2662416371637355 -0.1292506706485902
ADV2:  -0.015573867415687673 0.7266832684373352 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.9144   0.3502   1.8974  29.5271  16.8478  11.4563
ValFun  Gr

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.001939536686842751 0.009557659915407678 0.0603722094982041 -0.13429172889967544
ADV2:  0.03670579422055725 0.808906220469801 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1458   0.9945   5.2700  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0013   0.0051   8.0871   2.2896   2.8947
***** Episode 86259, Mean R = -16.9  Std R = 3.9  Min R = -24.4
PolicyLoss: -0.0251
Policy_Beta: 0.1
Policy_Entropy: 0.161
Policy_KL: 0.000879
Policy_SD: 0.542
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.17e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.000759


ADV1:  -0.00030562595033569796 0.009501069101317011 0.11565120751481728 -0.1013206394719488
ADV2:  0.027782606655211924 0.7606022791208755 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0393   1.5462   7.6861  29.5271  16.8478  11.4563
ValFun  Gr

seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.94   -1.00 |    0.92    0.99
cs_angles |  0.0016  0.0024 |  0.0830  0.0825 | -0.9404 -0.9957 |  0.9156  0.9947
optical_flow | -0.0001  0.0001 |  0.0228  0.0249 | -1.1554 -1.0655 |  1.0340  1.0891
v_err    | -0.0091 |  0.0570 | -0.4533 |  0.1018
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -22.50 |    4.77 |  -47.82 |  -14.67
steps    |     376 |      19 |     338 |     419
***** Episode 86538, Mean R = -18.1  Std R = 5.8  Min R = -34.1
PolicyLoss: -0.0222
Policy_Beta: 0.1
Policy_Entropy: 0.162
Policy_KL: 0.000939
Policy_SD: 0.547
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.18e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.981
VF_0_Loss : 0.000412


ADV1:  0.0023595550620236043 0.008407338427951834 0.06723801836628729 -0.06342566854933235
ADV2:  -0.007797478385923299 0.8736999999001435 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/M

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.07 |    0.08    0.08    0.05
a_f      |   -0.04   -0.00 |    0.68    1.83 |   -1.55   -3.13 |    1.54    3.11
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.03 |    0.03    0.02    0.02
w_rewards |   -0.38 |    0.27 |   -1.62 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.05
seeker_angles |   -0.00    0.00 |    0.08    0.09 |   -1.00   -0.99 |    0.97    0.99
cs_angles | -0.0032  0.0017 |  0.0818  0.0852 | -0.9987 -0.9935 |  0.9671  0.9909
optical_flow |  0.0000  0.0000 |  0.0227  0.0246 | -0.9201 -1.1271 |  1.0348  1.2550
v_err    | -0.0092 |  0.0569 | -0.4522 |  0.1114
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.07 |    0.05
tracking_rewards |  -22.53 |    5.06 |  -47.90 |  -14.59
steps    |     377 |  

attitude |    0.05   -0.05    0.19 |    1.15    0.63    1.86 |   -3.14   -1.54   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |   -0.04    0.15 |    0.64    1.86 |   -1.40   -3.14 |    1.37    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.02    0.02
w_rewards |   -0.38 |    0.25 |   -1.33 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.32 |    0.00 |    3.10
seeker_angles |   -0.00    0.00 |    0.08    0.09 |   -1.00   -0.99 |    0.98    1.00
cs_angles | -0.0010  0.0038 |  0.0808  0.0856 | -0.9970 -0.9930 |  0.9817  0.9990
optical_flow | -0.0002  0.0001 |  0.0230  0.0254 | -0.9479 -1.1840 |  1.0116  1.3267
v_err    | -0.0088 |  0.0562 | -0.4532 |  0.1085
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.04   -0.05   -0.01 |    1.22    0.65    1.87 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.07    0.07    0.05
a_f      |   -0.05   -0.02 |    0.66    1.88 |   -1.45   -3.13 |    1.45    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.03    0.02    0.02
w_rewards |   -0.39 |    0.29 |   -2.66 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.92
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.98   -1.00 |    0.99    0.95
cs_angles | -0.0031  0.0023 |  0.0802  0.0838 | -0.9802 -0.9999 |  0.9861  0.9497
optical_flow | -0.0001 -0.0001 |  0.0225  0.0244 | -1.1974 -0.9598 |  0.9989  0.9743
v_err    | -0.0092 |  0.0563 | -0.4534 |  0.1065
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.04    0.01   -0.07 |    1.22    0.67    1.85 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.09    0.07    0.05
a_f      |    0.01   -0.05 |    0.68    1.84 |   -1.42   -3.08 |    1.52    3.12
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.01 |    0.02    0.03    0.02
w_rewards |   -0.38 |    0.26 |   -1.82 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.32 |    0.00 |    3.05
seeker_angles |   -0.00    0.00 |    0.08    0.09 |   -0.99   -0.98 |    0.98    0.99
cs_angles | -0.0040  0.0008 |  0.0843  0.0851 | -0.9945 -0.9812 |  0.9813  0.9927
optical_flow | -0.0001  0.0000 |  0.0245  0.0259 | -1.3765 -1.0767 |  0.9529  1.1537
v_err    | -0.0090 |  0.0561 | -0.4520 |  0.1225
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00    0.01   -0.00 |    0.69    0.70    0.69 |   -3.45   -3.42   -3.46 |    3.46    3.45    3.44
norm_thrust |    0.92 |    0.77 |    0.00 |    3.46
fuel     |    1.57 |    0.20 |    1.19 |    2.86
rewards  |  -19.08 |    7.18 |  -70.36 |   -8.69
fuel_rewards |   -4.51 |    0.59 |   -8.22 |   -3.40
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.86 |   13.21 |    0.01 |  244.49
norm_af  |    1.83 |    0.87 |    0.04 |    3.33
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.07    0.00    0.03 |    1.25    0.69    1.90 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |    0.01    0.01 |    0.69

ADV1:  0.000495928722766091 0.010098445922675238 0.24992538739874448 -0.11429024998296256
ADV2:  -0.0014895455716123225 0.7503770555987997 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6672   1.5365   7.7011  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0007   0.0028   8.0871   2.2896   2.8947
Update Cnt = 2850    ET =   1088.9   Stats:  Mean, Std, Min, Max
r_f      |   12.97   -3.58    2.78 |  179.82  172.19  197.94 | -389.63 -393.62 -388.89 |  380.35  367.12  396.74
v_f      |    0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.12   -0.09 |    0.09    0.11    0.10
r_i      |   17.09  -16.50   22.37 |  684.23  642.96  760.38 |-1371.93-1260.87-1351.18 | 1315.96 1304.55 1304.94
v_i      |   -0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.10   -0.09 |    0.09    0.08    0.10
norm_rf  |    0.20 |    0.08 |    0.04 |    0.51
norm_vf  |    0.07 |    0.01 |    0.04 |    0.12
gs_f     |    1.24 |    1.62 | 

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.000755655946432926 0.008225153817221862 0.05179652407219498 -0.07215333743012409
ADV2:  0.030121163583529738 0.8273205119161241 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   8.9173   4.0253  15.4564  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0004   0.0019   8.0871   2.2896   2.8947
***** Episode 88677, Mean R = -16.6  Std R = 5.2  Min R = -37.0
PolicyLoss: -0.028
Policy_Beta: 0.0667
Policy_Entropy: 0.162
Policy_KL: 0.000683
Policy_SD: 0.523
Policy_lr_mult: 0.198
Steps: 1.21e+04
TotalSteps: 3.26e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.00046


ADV1:  0.0025470687372586907 0.006485364778786456 0.0721142636629355 -0.10572398623347656
ADV2:  -0.031106962678128378 0.8679635196238862 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3545   0.9203   5.1638  29.5271  16.8478  11.4563
ValFun

***** Episode 88925, Mean R = -17.2  Std R = 5.2  Min R = -26.0
PolicyLoss: -0.0274
Policy_Beta: 0.1
Policy_Entropy: 0.161
Policy_KL: 0.000813
Policy_SD: 0.543
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.27e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.0013


ADV1:  0.002735720061111748 0.006229642767678225 0.05697915376793353 -0.03853712052721203
ADV2:  -0.031736056239410414 0.9074489796317962 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7467   0.9460   5.0968  29.5271  16.8478  11.4563
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0031   0.0020   0.0072   8.0871   2.2896   2.8947
***** Episode 88956, Mean R = -16.6  Std R = 4.7  Min R = -27.5
PolicyLoss: -0.00365
Policy_Beta: 0.1
Policy_Entropy: 0.162
Policy_KL: 0.000953
Policy_SD: 0.536
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.27e+07
VF_0_ExplainedVarNew: 0.993
VF_0_ExplainedVarOld: 0.992
VF_0_Loss : 0.00115


ADV1:  -0.00043866568927969184 0.006187164620661133 0

ADV1:  0.0004146505547505592 0.007536291987378716 0.04311151228340848 -0.08029671532228355
ADV2:  0.02155839942135125 0.8358402191212655 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   8.0626   3.2982  15.3317  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0004   0.0019   8.0871   2.2896   2.8947
***** Episode 89204, Mean R = -17.9  Std R = 6.4  Min R = -31.9
PolicyLoss: -0.0284
Policy_Beta: 0.0667
Policy_Entropy: 0.163
Policy_KL: 0.000234
Policy_SD: 0.533
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.28e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 0.000741


ADV1:  0.0012805624097023407 0.006791445582983237 0.04454406846327469 -0.048298506734630986
ADV2:  6.442283873164769e-05 0.8691309243960467 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.9161   1.4816   7.0407  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0010   0.0034   8.0871   2.2896   

***** Episode 89452, Mean R = -16.0  Std R = 6.0  Min R = -31.8
PolicyLoss: 0.00626
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.000618
Policy_SD: 0.532
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.29e+07
VF_0_ExplainedVarNew: 0.995
VF_0_ExplainedVarOld: 0.993
VF_0_Loss : 0.00137


ADV1:  -0.0012603192280944888 0.009106238972371275 0.045614364417750575 -0.06033157376584337
ADV2:  0.03451731168842646 0.8534713129464534 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2678   1.1633   4.6658  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0025   0.0013   0.0043   8.0871   2.2896   2.8947
***** Episode 89483, Mean R = -17.4  Std R = 5.4  Min R = -31.1
PolicyLoss: -0.0291
Policy_Beta: 0.1
Policy_Entropy: 0.164
Policy_KL: 0.00117
Policy_SD: 0.539
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.29e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.0013


ADV1:  0.0007057223889251975 0.0073006366687653835 0.0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6703   0.8079   3.9114  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0047   0.0025   0.0088   8.0871   2.2896   2.8947
***** Episode 89731, Mean R = -17.8  Std R = 5.5  Min R = -32.2
PolicyLoss: -0.0353
Policy_Beta: 0.1
Policy_Entropy: 0.163
Policy_KL: 0.000672
Policy_SD: 0.544
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 3.3e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.00126


ADV1:  -0.0019963783670340083 0.011660067028857829 0.05401403882445288 -0.1927146515311351
ADV2:  0.04157802686204388 0.7203514018541797 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1293   0.6745   3.7118  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0015   0.0054   8.0871   2.2896   2.8947
***** Episode 89762, Mean R = -16.9  Std R = 6.9  Min R = -40.0
PolicyLoss: -0.0328
Policy_Beta: 0.1
Policy_Entropy: 0.164
Policy_KL: 0.000698
Poli

ADV1:  -0.002198556797226235 0.006564466731790688 0.044502654171104994 -0.09732227519178871
ADV2:  0.03262041977088495 0.8533726991904639 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.1373   1.5581   7.7665  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0024   0.0014   0.0057   8.0871   2.2896   2.8947
***** Episode 90010, Mean R = -17.1  Std R = 4.7  Min R = -30.3
PolicyLoss: -0.0135
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.00109
Policy_SD: 0.531
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.31e+07
VF_0_ExplainedVarNew: 0.993
VF_0_ExplainedVarOld: 0.991
VF_0_Loss : 0.00136


ADV1:  6.720941999864014e-05 0.007510030897900339 0.07753106962560619 -0.08228753321713056
ADV2:  0.023121151091580118 0.8061479585000609 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9464   0.8670   4.2191  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0020   8.0871   2.2896   2.894

ADV1:  0.0011455439073516198 0.00917081084733044 0.06977632703824233 -0.05584899976962693
ADV2:  0.00675335713000396 0.8509113504427993 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5294   1.3509   6.8513  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0031   8.0871   2.2896   2.8947
***** Episode 90289, Mean R = -17.2  Std R = 4.6  Min R = -30.3
PolicyLoss: -0.021
Policy_Beta: 0.1
Policy_Entropy: 0.164
Policy_KL: 0.000912
Policy_SD: 0.532
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.32e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.00137


ADV1:  0.00017248420291686732 0.006823646455467895 0.04195035118157148 -0.11024239044140083
ADV2:  0.01660577191879968 0.8167903404632919 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8024   0.9763   4.1952  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0008   8.0871   2.2896   2.8947


optical_flow | -0.0001 -0.0001 |  0.0231  0.0256 | -1.2987 -1.1863 |  0.9095  1.1748
v_err    | -0.0094 |  0.0562 | -0.4552 |  0.1283
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -22.65 |    4.53 |  -41.05 |  -14.83
steps    |     378 |      21 |     335 |     418
***** Episode 90568, Mean R = -17.3  Std R = 6.2  Min R = -35.1
PolicyLoss: -0.0243
Policy_Beta: 0.1
Policy_Entropy: 0.166
Policy_KL: 0.000652
Policy_SD: 0.529
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.33e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.00173


ADV1:  0.0009033123948203055 0.00747896264109326 0.03876446241904913 -0.05501103495027593
ADV2:  0.014021720032242379 0.8484506769226234 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8352   0.7535   3.5480  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0006   0.0024   8.0871   2.2896   2.8947


w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |    0.05    0.04 |    0.65    1.78 |   -1.48   -3.14 |    1.52    3.03
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.10   -0.02   -0.02 |    0.02    0.03    0.03
w_rewards |   -0.34 |    0.28 |   -2.79 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.93
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.98   -0.99 |    0.98    1.00
cs_angles |  0.0027  0.0038 |  0.0833  0.0858 | -0.9787 -0.9947 |  0.9785  0.9981
optical_flow | -0.0000  0.0001 |  0.0230  0.0255 | -1.1871 -0.8775 |  1.0996  1.1666
v_err    | -0.0097 |  0.0561 | -0.4526 |  0.1136
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |    2.95 |   52.28 |   -0.06 |  921.98
tracking_rewards |  -22.59 |    4.66 |  -37.72 |  -12.90
steps    |     377 |  

rewards  |  -17.78 |    6.19 |  -60.19 |   -6.43
fuel_rewards |   -4.42 |    0.57 |   -6.36 |   -2.97
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.98 |   13.11 |    0.01 |  839.18
norm_af  |    1.67 |    0.91 |    0.07 |    3.32
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.04    0.01    0.01 |    1.16    0.68    1.78 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.07    0.07    0.05
a_f      |    0.00   -0.07 |    0.68    1.77 |   -1.56   -3.14 |    1.54    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.02    0.02    0.02
w_rewards |   -0.33 |    0.24 |   -1.71 |    0.00
w_pena

Update Cnt = 2950    ET =   1073.7   Stats:  Mean, Std, Min, Max
r_f      |    6.56   -0.68   -9.83 |  189.42  158.51  206.38 | -389.67 -348.41 -386.97 |  397.55  381.19  387.12
v_f      |   -0.00   -0.00    0.00 |    0.04    0.04    0.05 |   -0.09   -0.11   -0.11 |    0.10    0.08    0.10
r_i      |   -1.21    3.58  -35.58 |  675.69  623.15  803.68 |-1355.73-1268.77-1307.62 | 1348.62 1367.92 1290.98
v_i      |    0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.10    0.10    0.10
norm_rf  |    0.19 |    0.08 |    0.01 |    0.48
norm_vf  |    0.07 |    0.01 |    0.04 |    0.12
gs_f     |    1.39 |    1.82 |    0.01 |   20.40
thrust   |   -0.00    0.00   -0.00 |    0.67    0.70    0.68 |   -3.45   -3.46   -3.42 |    3.45    3.45    3.44
norm_thrust |    0.91 |    0.76 |    0.00 |    3.46
fuel     |    1.55 |    0.18 |    1.07 |    2.10
rewards  |  -17.56 |    5.27 |  -34.01 |   -7.97
fuel_rewards |   -4.45 |    0.51 |   -6.02 |   -3.07
glideslope_rewards |

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6125   0.6090   3.2027  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0004   0.0018   8.0871   2.2896   2.8947
***** Episode 91777, Mean R = -17.0  Std R = 5.9  Min R = -31.3
PolicyLoss: 0.00364
Policy_Beta: 0.1
Policy_Entropy: 0.164
Policy_KL: 0.0011
Policy_SD: 0.536
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.38e+07
VF_0_ExplainedVarNew: 0.988
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.00104


ADV1:  0.000645673123803695 0.008238479248735418 0.18401595621800493 -0.13357175096939422
ADV2:  -0.010008719954828337 0.7395518073141863 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6159   0.7767   3.7424  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0018   8.0871   2.2896   2.8947
Update Cnt = 2960    ET =   1059.3   Stats:  Mean, Std, Min, Max
r_f      |  -16.94    1.57    5.13 |  184.90  175.74  203.04 | -398.32 -382.22 -3

ADV1:  -0.0004138466900242396 0.00980721638638577 0.13538302881067799 -0.15083486668888224
ADV2:  0.020537214586991093 0.7612730106908261 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1414   0.7262   3.8353  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0003   0.0011   8.0871   2.2896   2.8947
***** Episode 92056, Mean R = -18.2  Std R = 5.0  Min R = -26.9
PolicyLoss: -0.0216
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.000949
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.39e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.000672


ADV1:  -0.00103677290423214 0.009788244785949867 0.058367751058556516 -0.0743462863439383
ADV2:  0.01971771940085432 0.8899624441383566 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4845   1.2248   5.4552  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0032   8.0871   2.2896   2.8947

***** Episode 92304, Mean R = -16.9  Std R = 3.9  Min R = -27.7
PolicyLoss: -0.00844
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.000809
Policy_SD: 0.537
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.4e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.00184


ADV1:  0.0022014369746928813 0.007055151147681705 0.1250047750923845 -0.06718879127354233
ADV2:  -0.023733045152308768 0.8168199695515407 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.0571   2.0975  10.4410  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0016   0.0058   8.0871   2.2896   2.8947
***** Episode 92335, Mean R = -16.2  Std R = 4.3  Min R = -25.4
PolicyLoss: -0.00133
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.00095
Policy_SD: 0.529
Policy_lr_mult: 0.198
Steps: 1.19e+04
TotalSteps: 3.4e+07
VF_0_ExplainedVarNew: 0.992
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 0.00189


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0207   0.4087   1.6131  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0003   0.0013   8.0871   2.2896   2.8947
***** Episode 92583, Mean R = -18.6  Std R = 5.9  Min R = -33.0
PolicyLoss: 0.0076
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.00103
Policy_SD: 0.545
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.41e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.00103


ADV1:  -0.0012365577516819171 0.008450501170228789 0.03995718201001489 -0.1036601460212837
ADV2:  0.03850024258492049 0.8272517822359228 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.1781   2.0530   9.2544  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0010   0.0041   8.0871   2.2896   2.8947
***** Episode 92614, Mean R = -18.6  Std R = 4.4  Min R = -28.1
PolicyLoss: -0.0331
Policy_Beta: 0.1
Policy_Entropy: 0.166
Policy_KL: 0.00126
Polic

ADV1:  0.0007266835249269498 0.008593495424042965 0.08712966651666221 -0.04891672127724912
ADV2:  0.008956117306628458 0.8515045077015213 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2405   0.4958   2.9977  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0004   0.0019   8.0871   2.2896   2.8947
***** Episode 92862, Mean R = -19.0  Std R = 6.4  Min R = -34.9
PolicyLoss: -0.0191
Policy_Beta: 0.1
Policy_Entropy: 0.166
Policy_KL: 0.00104
Policy_SD: 0.539
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.42e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.0024


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.0005573493801763051 0.008065789297723416 0.05918837322713766 -0.05667166630358078
ADV2:  0.0050321267454278085 0.8751000939830186 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2987   0.6147   3.5313  29.5271  18.5111  12.4602
ValFun  G

***** Episode 93110, Mean R = -16.0  Std R = 3.7  Min R = -24.0
PolicyLoss: 0.00132
Policy_Beta: 0.0667
Policy_Entropy: 0.166
Policy_KL: 0.00497
Policy_SD: 0.528
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.43e+07
VF_0_ExplainedVarNew: 0.993
VF_0_ExplainedVarOld: 0.992
VF_0_Loss : 0.00256


ADV1:  6.571135854654863e-05 0.007348236915185281 0.03985398666918116 -0.09836450912396788
ADV2:  0.02334083653170252 0.7674591747957069 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   8.6863   6.8519  19.8375  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0007   8.0871   2.2896   2.8947
***** Episode 93141, Mean R = -16.6  Std R = 5.5  Min R = -29.3
PolicyLoss: -0.0271
Policy_Beta: 0.0667
Policy_Entropy: 0.165
Policy_KL: 0.0012
Policy_SD: 0.533
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.43e+07
VF_0_ExplainedVarNew: 0.992
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 0.00266


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.2359   0.1300   0.5825  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0120   0.0067   0.0256   8.0871   2.2896   2.8947
***** Episode 93389, Mean R = -20.4  Std R = 18.1  Min R = -116.3
PolicyLoss: -0.0335
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.000583
Policy_SD: 0.531
Policy_lr_mult: 0.198
Steps: 1.13e+04
TotalSteps: 3.44e+07
VF_0_ExplainedVarNew: 0.7
VF_0_ExplainedVarOld: 0.413
VF_0_Loss : 0.0107


ADV1:  0.0002616058992261251 0.017703892848827795 0.36818380401281114 -0.20213462849977826
ADV2:  -0.01922197534873693 0.72645358827448 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3304   0.5335   2.8709  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0010   0.0041   8.0871   2.2896   2.8947
***** Episode 93420, Mean R = -18.6  Std R = 5.2  Min R = -28.9
PolicyLoss: 0.0164
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.000801
Polic

cs_angles | -0.0021  0.0004 |  0.0799  0.0853 | -0.9937 -0.9992 |  0.9993  0.9810
optical_flow | -0.0000  0.0000 |  0.0211  0.0255 | -1.1129 -0.9800 |  1.0153  1.2003
v_err    | -0.0094 |  0.0565 | -0.4530 |  0.1079
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |    2.69 |   47.68 |   -0.07 |  840.90
tracking_rewards |  -22.46 |    4.72 |  -46.84 |  -13.26
steps    |     376 |      29 |      17 |     419
***** Episode 93668, Mean R = -17.6  Std R = 5.9  Min R = -35.0
PolicyLoss: -0.0227
Policy_Beta: 0.1
Policy_Entropy: 0.167
Policy_KL: 0.0011
Policy_SD: 0.535
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.45e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.00394


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.0010534160675060547 0.007676793179544425 0.10743296936550362 -0.10252936861631179
ADV2:  -0.003524635823263445 0.7768519209047541 3.0 -3.0
Policy  Gradients: u/sd/Max/C Ma

attitude |    0.05   -0.02    0.08 |    1.16    0.65    1.83 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.07    0.07    0.05
a_f      |   -0.00    0.05 |    0.64    1.83 |   -1.44   -3.12 |    1.50    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.30 |    0.22 |   -1.18 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    3.13
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.99   -0.98 |    0.98    0.95
cs_angles | -0.0004  0.0019 |  0.0829  0.0810 | -0.9928 -0.9797 |  0.9764  0.9500
optical_flow | -0.0001 -0.0000 |  0.0228  0.0238 | -1.1601 -0.9684 |  1.1643  0.9832
v_err    | -0.0091 |  0.0558 | -0.4516 |  0.1020
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.08    0.02    0.21 |    1.20    0.66    1.83 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.10    0.07    0.05
a_f      |    0.02    0.22 |    0.66    1.83 |   -1.51   -3.13 |    1.48    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.10    0.03    0.03
w_rewards |   -0.36 |    0.60 |   -9.87 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.27 |    0.31 |    0.00 |    3.10
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.99   -1.00 |    0.99    1.00
cs_angles |  0.0012  0.0036 |  0.0817  0.0858 | -0.9890 -0.9969 |  0.9863  0.9995
optical_flow | -0.0001 -0.0001 |  0.0221  0.0252 | -1.0611 -1.2998 |  1.1270  0.9961
v_err    | -0.0096 |  0.0573 | -0.6529 |  0.1087
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |    2

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.09    0.07    0.07
a_f      |    0.04    0.07 |    0.66    1.94 |   -1.52   -3.13 |    1.42    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.32 |    0.28 |   -1.96 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    3.08
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.98   -0.98 |    0.98    0.95
cs_angles |  0.0009  0.0013 |  0.0842  0.0890 | -0.9801 -0.9826 |  0.9804  0.9517
optical_flow |  0.0001  0.0001 |  0.0225  0.0259 | -1.1717 -1.3031 |  1.1311  1.1405
v_err    | -0.0091 |  0.0556 | -0.4534 |  0.1230
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.07 |    0.02
tracking_rewards |  -22.74 |    5.96 |  -70.34 |  -14.42
steps    |     375 |  

norm_thrust |    0.90 |    0.76 |    0.00 |    3.46
fuel     |    1.52 |    0.18 |    1.12 |    2.08
rewards  |  -17.28 |    5.68 |  -40.59 |   -6.36
fuel_rewards |   -4.36 |    0.52 |   -5.95 |   -3.19
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.90 |   12.76 |    0.01 |  323.41
norm_af  |    1.83 |    0.93 |    0.07 |    3.44
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.04    0.03   -0.07 |    1.30    0.70    1.90 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |    0.02   -0.04 |    0.70    1.93 |   -1.49   -3.12 |    1.50    3.12
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.

ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0029   8.0871   2.2896   2.8947
Update Cnt = 3070    ET =    978.1   Stats:  Mean, Std, Min, Max
r_f      |    7.28    0.98  -13.74 |  194.77  164.36  204.35 | -383.57 -364.32 -373.93 |  393.11  393.81  388.73
v_f      |   -0.00    0.00    0.00 |    0.04    0.04    0.05 |   -0.10   -0.11   -0.10 |    0.09    0.12    0.09
r_i      |   29.06    8.59  -38.65 |  714.78  623.10  765.92 |-1329.92-1360.01-1273.57 | 1378.68 1316.04 1297.35
v_i      |   -0.00   -0.00    0.00 |    0.05    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.10    0.09    0.09
norm_rf  |    0.19 |    0.07 |    0.02 |    0.42
norm_vf  |    0.08 |    0.01 |    0.04 |    0.14
gs_f     |    1.28 |    2.27 |    0.02 |   24.06
thrust   |   -0.00    0.00    0.00 |    0.70    0.69    0.69 |   -3.37   -3.46   -3.44 |    3.46    3.46    3.46
norm_thrust |    0.92 |    0.76 |    0.00 |    3.46
fuel     |    1.55 |    0.19 |    1.09 |    2.19
rewards  |  -18.28 

ADV1:  -0.0011233401372751836 0.008792879074361423 0.04791661358815241 -0.06181889086891251
ADV2:  0.03324539132502892 0.8358111620319812 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4456   0.9332   4.6612  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0029   8.0871   2.2896   2.8947
***** Episode 95497, Mean R = -18.4  Std R = 5.6  Min R = -33.3
PolicyLoss: -0.0286
Policy_Beta: 0.1
Policy_Entropy: 0.164
Policy_KL: 0.00074
Policy_SD: 0.548
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.52e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.00415


ADV1:  -0.001390845860552003 0.009580319927365003 0.04419414646192055 -0.06362323012723423
ADV2:  0.03349131714958679 0.8517769649234868 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6861   0.8627   4.6755  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0010   0.0038   8.0871   2.2896   2.8947

ADV1:  0.0018404580281179113 0.007391065128900017 0.0454407015402577 -0.12201680331218379
ADV2:  0.0070873216204124 0.735756842286488 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.8975   1.3898   7.2113  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0012   0.0048   8.0871   2.2896   2.8947
***** Episode 95776, Mean R = -16.2  Std R = 5.0  Min R = -26.4
PolicyLoss: -0.0288
Policy_Beta: 0.1
Policy_Entropy: 0.166
Policy_KL: 0.000893
Policy_SD: 0.53
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.53e+07
VF_0_ExplainedVarNew: 0.992
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 0.00442


ADV1:  -0.0021761393516061592 0.008406376895482454 0.055938171748447896 -0.07835072409797872
ADV2:  0.035891785805492384 0.8390736982421507 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6745   0.8227   3.9811  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0026   0.0016   0.0057   8.0871   2.2896   2.8947


ADV1:  8.711733015047846e-05 0.01094398970845285 0.20223933452142961 -0.17658787193970815
ADV2:  -0.008091568665201814 0.6801029747504861 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8049   0.8222   4.5524  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0012   8.0871   2.2896   2.8947
***** Episode 96055, Mean R = -17.4  Std R = 6.0  Min R = -36.6
PolicyLoss: 0.00533
Policy_Beta: 0.1
Policy_Entropy: 0.162
Policy_KL: 0.000897
Policy_SD: 0.543
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 3.54e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 0.00372


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0018434629382280655 0.009914119130149328 0.17048444038147087 -0.07479095302977434
ADV2:  0.014370594143422965 0.7625558443313144 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7726   0.9040   4.4065  29.5271  18.5111  12.4602
ValFun 

ADV1:  0.0009046882049393502 0.009311757196387457 0.0676486664693583 -0.07357912758026797
ADV2:  -0.003048722922627396 0.8519045085515501 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1389   1.1145   5.4821  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0011   0.0006   0.0024   8.0871   2.2896   2.8947
***** Episode 96334, Mean R = -15.9  Std R = 5.4  Min R = -36.6
PolicyLoss: -0.00737
Policy_Beta: 0.1
Policy_Entropy: 0.167
Policy_KL: 0.00117
Policy_SD: 0.528
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.55e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.00306


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.00023522810447640323 0.0108217807389904 0.14633171114210664 -0.08904956541273062
ADV2:  0.007999336680647616 0.8405402512355877 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6985   0.8237   4.4041  29.5271  18.5111  12.4602
ValFun  G

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -5.546889846160907e-05 0.008186919546083362 0.10099717678856135 -0.10653071463932928
ADV2:  0.00761646532504745 0.7856388380638922 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7870   0.6316   3.3416  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0020   8.0871   2.2896   2.8947
***** Episode 96613, Mean R = -18.6  Std R = 4.6  Min R = -30.4
PolicyLoss: -0.0107
Policy_Beta: 0.1
Policy_Entropy: 0.163
Policy_KL: 0.000873
Policy_SD: 0.563
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.56e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.00344


ADV1:  0.0004510239976123787 0.008334264974968728 0.07200951310702947 -0.10648199693684524
ADV2:  0.01663362615744222 0.8258076364088388 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.6440   1.3450   7.5960  29.5271  18.5111  12.4602
ValFun  G

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.001282778610248483 0.008673973500012613 0.04363822311360188 -0.10678213695685065
ADV2:  0.012853343578069758 0.8328195587531091 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6450   0.6872   3.8393  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0010   0.0035   8.0871   2.2896   2.8947
***** Episode 96892, Mean R = -18.0  Std R = 5.5  Min R = -30.1
PolicyLoss: -0.0295
Policy_Beta: 0.1
Policy_Entropy: 0.166
Policy_KL: 0.00109
Policy_SD: 0.556
Policy_lr_mult: 0.198
Steps: 1.14e+04
TotalSteps: 3.57e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.00334


ADV1:  0.00027385314495845703 0.006761807839934036 0.0466274692569133 -0.10478167971312036
ADV2:  0.006253637213213072 0.7933796131248001 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8770   0.7599   3.8834  29.5271  18.5111  12.4602
ValFun  Gr

***** Episode 97140, Mean R = -15.4  Std R = 4.2  Min R = -23.5
PolicyLoss: -0.0305
Policy_Beta: 0.1
Policy_Entropy: 0.167
Policy_KL: 0.000832
Policy_SD: 0.525
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.58e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.003


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.0010509738736119523 0.010347035751490522 0.13018955511638847 -0.2655650494280569
ADV2:  0.012575422096691848 0.5846523846756454 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.7118   0.2691   1.6448  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0006   0.0028   8.0871   2.2896   2.8947
***** Episode 97171, Mean R = -16.7  Std R = 6.4  Min R = -47.5
PolicyLoss: -0.022
Policy_Beta: 0.1
Policy_Entropy: 0.166
Policy_KL: 0.00105
Policy_SD: 0.544
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.58e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVa

ADV1:  -0.0008794931881036624 0.007706886624832015 0.16615592170903087 -0.07542690494075871
ADV2:  0.012645941621090813 0.777185526833562 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.8534   2.2663  10.7631  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0010   0.0006   0.0024   8.0871   2.2896   2.8947
***** Episode 97419, Mean R = -16.5  Std R = 4.7  Min R = -32.6
PolicyLoss: -0.00731
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.00104
Policy_SD: 0.544
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.59e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.00323


ADV1:  -0.0007619450297663914 0.008420726278082815 0.0680347192825077 -0.16906017327617906
ADV2:  0.0314367838466928 0.7961122258942784 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4859   1.5097   6.0919  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0007   0.0027   8.0871   2.2896   2.8947


seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.99 |    0.99    0.99
cs_angles |  0.0021  0.0006 |  0.0844  0.0845 | -0.9881 -0.9936 |  0.9932  0.9937
optical_flow | -0.0000 -0.0001 |  0.0214  0.0248 | -0.9832 -1.1614 |  0.9426  1.1994
v_err    | -0.0088 |  0.0558 | -0.4521 |  0.1153
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.04
tracking_rewards |  -22.36 |    5.16 |  -42.28 |  -14.45
steps    |     375 |      20 |     335 |     419
***** Episode 97698, Mean R = -16.7  Std R = 5.4  Min R = -34.6
PolicyLoss: -0.016
Policy_Beta: 0.1
Policy_Entropy: 0.164
Policy_KL: 0.00118
Policy_SD: 0.537
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.6e+07
VF_0_ExplainedVarNew: 0.993
VF_0_ExplainedVarOld: 0.991
VF_0_Loss : 0.0014


ADV1:  0.000582810005702333 0.009024674498923727 0.10157552362136502 -0.23539972734394032
ADV2:  0.020057470662710332 0.6686430573952294 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Ma

attitude |    0.10   -0.01   -0.08 |    1.20    0.64    1.83 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |   -0.02   -0.03 |    0.64    1.84 |   -1.39   -3.13 |    1.47    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.02    0.02
w_rewards |   -0.31 |    0.25 |   -1.51 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    3.13
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.95   -0.99 |    0.99    0.98
cs_angles | -0.0001  0.0003 |  0.0806  0.0839 | -0.9532 -0.9890 |  0.9916  0.9820
optical_flow | -0.0000 -0.0001 |  0.0211  0.0237 | -1.0204 -1.0278 |  1.1455  1.1042
v_err    | -0.0086 |  0.0559 | -0.4551 |  0.1162
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00    0.00    0.00 |    0.68    0.69    0.68 |   -3.45   -3.46   -3.44 |    3.46    3.37    3.40
norm_thrust |    0.90 |    0.76 |    0.00 |    3.46
fuel     |    1.57 |    0.19 |    1.07 |    2.42
rewards  |  -17.14 |    6.13 |  -65.33 |   -7.90
fuel_rewards |   -4.49 |    0.54 |   -6.92 |   -3.10
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.90 |   15.11 |    0.01 | 2247.43
norm_af  |    1.79 |    0.90 |    0.09 |    3.25
norm_wf  |    0.01 |    0.01 |    0.00 |    0.04
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.00   -0.01    0.03 |    1.25    0.66    1.90 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |   -0.01    0.04 |    0.66

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2314   1.3063   5.7021  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0003   0.0018   8.0871   2.2896   2.8947
Update Cnt = 3180    ET =    941.5   Stats:  Mean, Std, Min, Max
r_f      |    3.71    8.02   15.95 |  196.92  173.68  197.69 | -395.65 -373.15 -396.72 |  399.70  396.44  385.06
v_f      |   -0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.09 |    0.11    0.10    0.09
r_i      |    2.62    8.58   18.34 |  718.01  652.23  744.54 |-1315.68-1261.44-1268.12 | 1289.54 1331.59 1251.72
v_i      |    0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.09    0.10
norm_rf  |    0.18 |    0.07 |    0.03 |    0.45
norm_vf  |    0.07 |    0.01 |    0.03 |    0.13
gs_f     |    1.16 |    1.57 |    0.01 |   11.59
thrust   |   -0.00    0.00   -0.00 |    0.68    0.68    0.69 |   -3.43   -3.37   -3.46 |    3.41    3.40    3.44
norm_thrust |    

ADV1:  -0.0018570743976509423 0.008480906195094829 0.06343796004987617 -0.060178404366308336
ADV2:  0.03975679616745128 0.8416673206333989 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.6076   2.0912  10.3817  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0010   0.0049   8.0871   2.2896   2.8947
***** Episode 98907, Mean R = -17.4  Std R = 4.9  Min R = -28.7
PolicyLoss: -0.0277
Policy_Beta: 0.1
Policy_Entropy: 0.164
Policy_KL: 0.00112
Policy_SD: 0.555
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.65e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.00313


ADV1:  0.0006548649685877439 0.007198059484999794 0.04329640371319815 -0.055243125236767276
ADV2:  0.01326532984517343 0.8500388843471121 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7936   1.1428   6.1242  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0004   0.0022   8.0871   2.2896   2.89

ADV1:  -0.001778028783967858 0.008413315991674086 0.0334412935303775 -0.06436118675046765
ADV2:  0.04652740266091245 0.8055718799532986 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.9577   1.4221   7.5497  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0030   0.0015   0.0050   8.0871   2.2896   2.8947
***** Episode 99186, Mean R = -17.8  Std R = 4.9  Min R = -31.8
PolicyLoss: -0.0366
Policy_Beta: 0.1
Policy_Entropy: 0.166
Policy_KL: 0.00122
Policy_SD: 0.546
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.66e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.00333


ADV1:  -0.0009358271651892084 0.008211707063454287 0.04404318691079345 -0.05370290001700531
ADV2:  0.0312702630001258 0.8587309303701609 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.5781   1.7294   7.0026  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0007   0.0025   8.0871   2.2896   2.8947
*

ADV1:  0.0012583983336502996 0.007569942328384053 0.042964439117947395 -0.05873294984397279
ADV2:  0.0048191101876017065 0.8521089686236574 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2056   1.8761   7.6282  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0013   0.0040   8.0871   2.2896   2.8947
***** Episode 99465, Mean R = -18.0  Std R = 6.4  Min R = -32.8
PolicyLoss: -0.0255
Policy_Beta: 0.1
Policy_Entropy: 0.165
Policy_KL: 0.000742
Policy_SD: 0.557
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.67e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 0.00381


ADV1:  7.558404443731863e-05 0.007220409851865265 0.047432010863037 -0.11573082680250601
ADV2:  0.023860932745953082 0.7282362066799801 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.1465   0.6487   2.7212  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0018   8.0871   2.2896   2.89

ADV1:  -0.0012289882169713151 0.008158746011364128 0.03876473928838958 -0.0647204045322432
ADV2:  0.03900827352590818 0.8201420576817706 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4584   0.8149   4.0338  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0008   0.0032   8.0871   2.2896   2.8947
***** Episode 99744, Mean R = -16.2  Std R = 4.4  Min R = -24.2
PolicyLoss: -0.0337
Policy_Beta: 0.1
Policy_Entropy: 0.169
Policy_KL: 0.000874
Policy_SD: 0.529
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 3.68e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.00279


ADV1:  0.0002036834063038772 0.005487989661681549 0.05338385294954792 -0.04433159148941912
ADV2:  -0.002464394168951136 0.9083928889059132 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   5.2294   2.8436  12.0526  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0012   8.0871   2.2896   2.89

ADV1:  -0.0001230704017068542 0.007467649464324648 0.052356787217941514 -0.047911833877168734
ADV2:  0.016888553674090662 0.8380327257197113 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6306   0.7331   4.2398  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0008   8.0871   2.2896   2.8947
***** Episode 100023, Mean R = -17.1  Std R = 6.0  Min R = -30.5
PolicyLoss: -0.02
Policy_Beta: 0.1
Policy_Entropy: 0.169
Policy_KL: 0.00101
Policy_SD: 0.54
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.69e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.00375


ADV1:  0.000549579724408239 0.005722575228060524 0.03372801979382837 -0.041007753766385935
ADV2:  -0.008431401355626249 0.9078429481358326 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   6.2319   4.1838  14.8671  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0004   0.0015   8.0871   2.2896   2.8

ADV1:  -0.0012644801103514746 0.010886882489644334 0.05099313728670268 -0.0900939470783722
ADV2:  0.0249436096247785 0.8894118117887677 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.5194   2.9487  10.4799  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0010   0.0035   8.0871   2.2896   2.8947
***** Episode 100302, Mean R = -18.7  Std R = 6.8  Min R = -34.7
PolicyLoss: -0.0204
Policy_Beta: 0.1
Policy_Entropy: 0.169
Policy_KL: 0.000979
Policy_SD: 0.535
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.7e+07
VF_0_ExplainedVarNew: 0.98
VF_0_ExplainedVarOld: 0.978
VF_0_Loss : 0.00326


ADV1:  -0.0011276870118765196 0.010396502820705478 0.0716937685681035 -0.0687324133344806
ADV2:  0.020861080814158987 0.9062941925539114 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.7232   3.4953  13.0104  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0007   0.0038   8.0871   2.2896   2.8947
*

ADV1:  0.0011223756515250799 0.006955461767682679 0.0874391087732691 -0.043841824092227366
ADV2:  -0.0029242340985552963 0.8389122214466836 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4839   0.7199   3.2721  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0011   0.0038   8.0871   2.2896   2.8947
***** Episode 100581, Mean R = -16.4  Std R = 4.2  Min R = -28.7
PolicyLoss: -0.0145
Policy_Beta: 0.1
Policy_Entropy: 0.17
Policy_KL: 0.00104
Policy_SD: 0.533
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.71e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 0.00324


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0004036626241517286 0.009240852918319584 0.05692735231756407 -0.08483481045688679
ADV2:  0.031858704231588916 0.8201586296862563 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0996   0.8189   4.4966  29.5271  18.5111  12.4602
ValFun

ADV1:  -0.0008001779914726247 0.00878300978375564 0.06652803358950854 -0.06067677038267467
ADV2:  0.024312466773165207 0.8362517135036338 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   7.9853   4.7555  15.6057  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0008   0.0028   8.0871   2.2896   2.8947
***** Episode 100860, Mean R = -17.0  Std R = 6.1  Min R = -35.6
PolicyLoss: -0.0205
Policy_Beta: 0.0667
Policy_Entropy: 0.17
Policy_KL: 0.000616
Policy_SD: 0.534
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.72e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00324


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.002410938761954535 0.0077132501694839916 0.0535265987430012 -0.06050204643806639
ADV2:  0.038816931061757355 0.87386780692613 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   8.1241   6.0752  18.5497  29.5271  18.5111  12.4602
ValFun 

***** Episode 101108, Mean R = -15.3  Std R = 3.1  Min R = -21.4
PolicyLoss: 0.00109
Policy_Beta: 0.0667
Policy_Entropy: 0.171
Policy_KL: 0.000574
Policy_SD: 0.522
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.73e+07
VF_0_ExplainedVarNew: 0.994
VF_0_ExplainedVarOld: 0.994
VF_0_Loss : 0.00355


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0010267697468316003 0.007159592214702046 0.04011029948345135 -0.06664054183725987
ADV2:  0.032287650738165787 0.8355839369818416 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7435   1.6288   7.8195  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0019   0.0006   0.0033   8.0871   2.2896   2.8947
***** Episode 101139, Mean R = -17.9  Std R = 5.5  Min R = -29.3
PolicyLoss: -0.0251
Policy_Beta: 0.0667
Policy_Entropy: 0.17
Policy_KL: 0.000523
Policy_SD: 0.538
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.73e+07
VF_0_ExplainedVarNew: 0.991
VF_

seeker_angles |    0.00    0.01 |    0.08    0.08 |   -0.97   -1.00 |    0.92    1.00
cs_angles |  0.0014  0.0067 |  0.0845  0.0843 | -0.9659 -0.9979 |  0.9223  0.9978
optical_flow | -0.0001  0.0001 |  0.0213  0.0242 | -1.0263 -1.1838 |  0.9029  1.0557
v_err    | -0.0090 |  0.0558 | -0.4520 |  0.1102
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.07 |    0.01
tracking_rewards |  -22.46 |    4.65 |  -42.84 |  -14.39
steps    |     378 |      21 |     328 |     419
***** Episode 101418, Mean R = -17.1  Std R = 4.2  Min R = -26.1
PolicyLoss: -0.00392
Policy_Beta: 0.1
Policy_Entropy: 0.168
Policy_KL: 0.000712
Policy_SD: 0.53
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.74e+07
VF_0_ExplainedVarNew: 0.995
VF_0_ExplainedVarOld: 0.993
VF_0_Loss : 0.00285


ADV1:  0.00026517568374006124 0.008324324285585246 0.06389752389310088 -0.07159352854086198
ADV2:  0.019189696512532693 0.8317341702536174 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/M

attitude |    0.08    0.05   -0.09 |    1.18    0.65    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.07    0.07    0.05
a_f      |    0.05   -0.09 |    0.65    1.85 |   -1.56   -3.14 |    1.43    3.13
w_f      |    0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.03    0.01
w_rewards |   -0.31 |    0.30 |   -2.99 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    3.02
seeker_angles |    0.00    0.00 |    0.09    0.08 |   -1.00   -0.97 |    1.00    1.00
cs_angles |  0.0018  0.0026 |  0.0855  0.0836 | -0.9999 -0.9675 |  0.9972  0.9991
optical_flow | -0.0001 -0.0000 |  0.0225  0.0251 | -1.1219 -1.0853 |  1.3653  1.0319
v_err    | -0.0090 |  0.0560 | -0.4525 |  0.1818
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.06   -0.05   -0.04 |    1.26    0.66    1.88 |   -3.14   -1.57   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |   -0.06   -0.03 |    0.66    1.87 |   -1.50   -3.14 |    1.34    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.29 |    0.22 |   -1.80 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.96
seeker_angles |   -0.00    0.00 |    0.09    0.08 |   -0.98   -0.95 |    0.97    0.98
cs_angles | -0.0006  0.0009 |  0.0859  0.0829 | -0.9754 -0.9503 |  0.9723  0.9838
optical_flow | -0.0001  0.0001 |  0.0212  0.0238 | -0.9047 -1.0112 |  0.9048  1.0965
v_err    | -0.0090 |  0.0561 | -0.4534 |  0.1043
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.01   -0.00    0.01 |    0.69    0.68    0.68 |   -3.46   -3.43   -3.44 |    3.44    3.43    3.45
norm_thrust |    0.91 |    0.76 |    0.00 |    3.46
fuel     |    1.55 |    0.20 |    1.08 |    2.49
rewards  |  -18.38 |    7.29 |  -69.42 |   -6.68
fuel_rewards |   -4.45 |    0.59 |   -7.13 |   -3.10
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.83 |   12.55 |    0.00 |  346.67
norm_af  |    1.73 |    0.93 |    0.05 |    3.31
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.05    0.03   -0.06 |    1.18    0.63    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.08    0.07    0.06
a_f      |    0.03   -0.04 |    0.62

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8613   0.9087   4.1956  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0020   0.0006   0.0032   8.0871   2.2896   2.8947
Update Cnt = 3310    ET =   1006.1   Stats:  Mean, Std, Min, Max
r_f      |  -13.64   -6.23   -2.33 |  185.99  172.71  200.39 | -398.44 -397.03 -397.86 |  395.86  376.48  378.36
v_f      |    0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.09 |    0.09    0.09    0.09
r_i      |  -55.44   -4.89   36.25 |  702.77  646.03  755.10 |-1331.03-1322.02-1315.00 | 1360.13 1353.78 1305.21
v_i      |    0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.09   -0.09 |    0.10    0.09    0.10
norm_rf  |    0.18 |    0.07 |    0.05 |    0.40
norm_vf  |    0.07 |    0.01 |    0.04 |    0.11
gs_f     |    1.19 |    1.48 |    0.01 |   10.12
thrust   |    0.00    0.00   -0.00 |    0.67    0.68    0.67 |   -3.34   -3.33   -3.46 |    3.45    3.44    3.46
norm_thrust |    

ADV1:  0.0014618753345971387 0.007395366982567695 0.06799342575403294 -0.056078709216883016
ADV2:  -0.005786269475153334 0.8259456680722098 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7350   1.6748   7.9430  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0027   0.0014   0.0047   8.0871   2.2896   2.8947
***** Episode 102937, Mean R = -15.7  Std R = 3.5  Min R = -22.5
PolicyLoss: -0.0129
Policy_Beta: 0.1
Policy_Entropy: 0.17
Policy_KL: 0.00105
Policy_SD: 0.527
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.8e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.00339


ADV1:  -0.0004560373913624163 0.009294473731696958 0.032739187338757914 -0.062135335613014174
ADV2:  0.024872478288931767 0.8706289052978202 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.8657   1.9322   8.7937  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0009   0.0045   8.0871   2.2896   2

ADV1:  -0.000243643333837197 0.005360187749032758 0.033652045271420794 -0.043771532191887175
ADV2:  0.012557875537303398 0.8811916379631992 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.1635   1.9693  10.3244  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0003   0.0002   0.0006   8.0871   2.2896   2.8947
***** Episode 103216, Mean R = -16.6  Std R = 4.1  Min R = -28.4
PolicyLoss: -0.0137
Policy_Beta: 0.1
Policy_Entropy: 0.169
Policy_KL: 0.000905
Policy_SD: 0.542
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.81e+07
VF_0_ExplainedVarNew: 0.995
VF_0_ExplainedVarOld: 0.994
VF_0_Loss : 0.00355


ADV1:  0.0004165575753394675 0.005235117345114172 0.04208274783386007 -0.05572718298046797
ADV2:  -0.007889665003798434 0.8774623726192716 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.4175   2.2435  10.1624  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0003   0.0014   8.0871   2.2896   

ADV1:  -0.0014857477885003075 0.00969025513303911 0.047207044526274555 -0.07392219977836478
ADV2:  0.039444527267929824 0.8226524082825741 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9891   1.3129   5.4467  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0010   0.0039   8.0871   2.2896   2.8947
***** Episode 103495, Mean R = -18.3  Std R = 6.0  Min R = -33.5
PolicyLoss: -0.0328
Policy_Beta: 0.1
Policy_Entropy: 0.167
Policy_KL: 0.000927
Policy_SD: 0.545
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.82e+07
VF_0_ExplainedVarNew: 0.984
VF_0_ExplainedVarOld: 0.983
VF_0_Loss : 0.00363


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  3.094176512922276e-05 0.008597358743245192 0.047969115858376765 -0.13692726984789838
ADV2:  0.02528370336028244 0.7743184273941988 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8306   1.0526   4.4017  29.5271  18.5111  12.4602
ValFun

***** Episode 103743, Mean R = -17.3  Std R = 6.8  Min R = -38.3
PolicyLoss: -0.029
Policy_Beta: 0.1
Policy_Entropy: 0.17
Policy_KL: 0.000965
Policy_SD: 0.532
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.83e+07
VF_0_ExplainedVarNew: 0.992
VF_0_ExplainedVarOld: 0.992
VF_0_Loss : 0.00213


ADV1:  -0.0020290535858493875 0.010457206452835838 0.03688296790761991 -0.0831212345374751
ADV2:  0.028875475112695212 0.9098035559744335 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   8.8144   3.2943  14.4787  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0031   0.0020   0.0061   8.0871   2.2896   2.8947
***** Episode 103774, Mean R = -17.4  Std R = 5.7  Min R = -28.8
PolicyLoss: -0.0171
Policy_Beta: 0.1
Policy_Entropy: 0.17
Policy_KL: 0.00109
Policy_SD: 0.523
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.83e+07
VF_0_ExplainedVarNew: 0.979
VF_0_ExplainedVarOld: 0.977
VF_0_Loss : 0.00275


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.00180

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7761   0.8489   4.7440  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0013   0.0004   0.0020   8.0871   2.2896   2.8947
***** Episode 104022, Mean R = -17.4  Std R = 3.8  Min R = -29.0
PolicyLoss: -0.0168
Policy_Beta: 0.1
Policy_Entropy: 0.168
Policy_KL: 0.00108
Policy_SD: 0.537
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.84e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 0.00313


ADV1:  0.0003825665213309573 0.006850364018533154 0.1228480649432841 -0.04579033060998322
ADV2:  0.007995996556857878 0.8178656564860995 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2784   1.3745   7.0967  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0016   8.0871   2.2896   2.8947
***** Episode 104053, Mean R = -19.0  Std R = 4.5  Min R = -28.1
PolicyLoss: -0.0154
Policy_Beta: 0.1
Policy_Entropy: 0.169
Policy_KL: 0.00102
Pol

ADV1:  -0.001831867015365972 0.008794007233058477 0.038222098076360456 -0.05227550880932669
ADV2:  0.037629940112988335 0.8719757333697229 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.4229   0.6334   3.6491  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0029   0.0010   0.0048   8.0871   2.2896   2.8947
***** Episode 104301, Mean R = -15.4  Std R = 4.5  Min R = -25.9
PolicyLoss: -0.0277
Policy_Beta: 0.1
Policy_Entropy: 0.171
Policy_KL: 0.000809
Policy_SD: 0.519
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.85e+07
VF_0_ExplainedVarNew: 0.982
VF_0_ExplainedVarOld: 0.98
VF_0_Loss : 0.00285


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0008681012707524129 0.009173738112073442 0.04971637015605762 -0.16555877709930156
ADV2:  0.031523722968855264 0.7676893369711053 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4539   1.0729   5.2820  29.5271  18.5111  12.4602
ValFun

ADV1:  0.001685369413273807 0.005739769417316506 0.038203461848412716 -0.0613690054560303
ADV2:  -0.006020910190381265 0.8827911889414243 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2016   1.2677   6.7176  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0022   0.0013   0.0044   8.0871   2.2896   2.8947
***** Episode 104580, Mean R = -16.4  Std R = 5.3  Min R = -31.3
PolicyLoss: -0.0162
Policy_Beta: 0.1
Policy_Entropy: 0.171
Policy_KL: 0.000725
Policy_SD: 0.522
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 3.86e+07
VF_0_ExplainedVarNew: 0.994
VF_0_ExplainedVarOld: 0.993
VF_0_Loss : 0.00267


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0022289947069474535 0.008099447187669449 0.03421020450928593 -0.10915127546877057
ADV2:  0.053518906484004286 0.7641659163512897 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.7288   1.0607   5.3997  29.5271  18.5111  12.4602
ValFun

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0008758024353299 0.008264416449598178 0.0322662327011616 -0.08209711889466187
ADV2:  0.04074582118390152 0.7948322918070473 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1150   0.7755   3.2412  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0004   0.0023   8.0871   2.2896   2.8947
***** Episode 104859, Mean R = -17.1  Std R = 4.6  Min R = -27.0
PolicyLoss: -0.039
Policy_Beta: 0.1
Policy_Entropy: 0.169
Policy_KL: 0.00124
Policy_SD: 0.539
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 3.87e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.00318


ADV1:  -0.0012633988642859883 0.007762977187616495 0.03511302749601097 -0.05794787908448795
ADV2:  0.031187370703870426 0.8757165896486669 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.2485   1.4885   8.1517  29.5271  18.5111  12.4602
ValFun  Grad

seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -1.00   -0.97 |    0.96    0.98
cs_angles | -0.0005  0.0023 |  0.0776  0.0816 | -0.9976 -0.9700 |  0.9551  0.9812
optical_flow | -0.0001 -0.0002 |  0.0201  0.0236 | -0.9832 -1.2149 |  1.1126  0.9584
v_err    | -0.0092 |  0.0562 | -0.4520 |  0.1172
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |    2.75 |   48.67 |   -0.06 |  858.21
tracking_rewards |  -21.45 |    4.32 |  -38.92 |  -12.42
steps    |     375 |      29 |      20 |     419
***** Episode 105138, Mean R = -17.9  Std R = 5.6  Min R = -31.5
PolicyLoss: -0.0145
Policy_Beta: 0.1
Policy_Entropy: 0.17
Policy_KL: 0.00107
Policy_SD: 0.525
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 3.88e+07
VF_0_ExplainedVarNew: 0.975
VF_0_ExplainedVarOld: 0.971
VF_0_Loss : 0.00301


ADV1:  -0.0010767525416025966 0.009981637911372162 0.05027429863536209 -0.06884509150599455
ADV2:  0.026516023573088274 0.8665441113201005 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.07    0.07    0.05
a_f      |    0.01    0.05 |    0.68    1.80 |   -1.46   -3.11 |    1.54    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.29 |    0.29 |   -3.53 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.32 |    0.00 |    3.11
seeker_angles |   -0.00    0.00 |    0.08    0.09 |   -0.98   -1.00 |    0.97    0.99
cs_angles | -0.0013  0.0019 |  0.0844  0.0865 | -0.9803 -0.9988 |  0.9701  0.9943
optical_flow | -0.0000  0.0000 |  0.0215  0.0251 | -1.0464 -1.2516 |  0.9689  1.1522
v_err    | -0.0094 |  0.0567 | -0.4531 |  0.1121
landing_rewards |    9.45 |    2.28 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -22.65 |    5.10 |  -49.17 |  -13.68
steps    |     376 |  

attitude |    0.03   -0.02    0.08 |    1.20    0.66    1.86 |   -3.14   -1.55   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.07    0.07    0.05
a_f      |   -0.02    0.14 |    0.67    1.86 |   -1.50   -3.14 |    1.48    3.11
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.28 |    0.23 |   -1.21 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    3.04
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.99   -0.98 |    0.93    0.98
cs_angles | -0.0002  0.0008 |  0.0830  0.0796 | -0.9913 -0.9840 |  0.9291  0.9845
optical_flow | -0.0002  0.0000 |  0.0212  0.0238 | -1.0975 -1.2544 |  1.1133  1.1380
v_err    | -0.0092 |  0.0558 | -0.4512 |  0.1116
landing_rewards |    9.52 |    2.15 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.03    0.01    0.05 |    1.20    0.66    1.81 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.07    0.07    0.07
a_f      |    0.01    0.07 |    0.67    1.81 |   -1.55   -3.11 |    1.43    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.30 |    0.25 |   -1.67 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.31 |    0.00 |    3.10
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.97 |    0.98    0.99
cs_angles |  0.0017  0.0027 |  0.0791  0.0823 | -0.9954 -0.9723 |  0.9816  0.9894
optical_flow | -0.0001  0.0000 |  0.0223  0.0245 | -1.0630 -1.1816 |  1.1751  1.0376
v_err    | -0.0094 |  0.0561 | -0.4519 |  0.1101
landing_rewards |    9.55 |    2.08 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.13   -0.02   -0.12 |    1.23    0.67    1.87 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.10    0.08    0.06
a_f      |   -0.02   -0.02 |    0.66    1.88 |   -1.37   -3.13 |    1.45    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.10    0.03    0.02
w_rewards |   -0.41 |    2.41 |  -42.48 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.32 |    0.00 |    3.12
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -1.00 |    0.95    0.99
cs_angles |  0.0002  0.0029 |  0.0791  0.0824 | -0.9776 -0.9991 |  0.9489  0.9938
optical_flow | -0.0001 -0.0000 |  0.0214  0.0260 | -0.9773 -1.2269 |  1.0633  1.4510
v_err    | -0.0103 |  0.0607 | -0.7249 |  0.1205
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |    3

attitude |   -0.00   -0.00    0.04 |    1.31    0.66    1.91 |   -3.14   -1.55   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |   -0.01    0.07 |    0.67    1.92 |   -1.51   -3.13 |    1.45    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.27 |    0.25 |   -2.32 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.98
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    1.00    0.97
cs_angles |  0.0010  0.0023 |  0.0797  0.0843 | -0.9871 -0.9975 |  0.9951  0.9722
optical_flow | -0.0001  0.0001 |  0.0214  0.0251 | -1.1871 -1.0595 |  1.1882  1.1840
v_err    | -0.0095 |  0.0563 | -0.4517 |  0.1092
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.02   -0.00    0.23 |    1.20    0.64    1.87 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.07 |    0.07    0.07    0.05
a_f      |   -0.00    0.12 |    0.64    1.87 |   -1.47   -3.14 |    1.49    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.27 |    0.21 |   -1.12 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.31 |    0.00 |    3.02
seeker_angles |   -0.00    0.01 |    0.08    0.08 |   -0.98   -0.98 |    0.99    0.99
cs_angles | -0.0001  0.0075 |  0.0833  0.0813 | -0.9822 -0.9828 |  0.9877  0.9918
optical_flow | -0.0001 -0.0001 |  0.0212  0.0226 | -1.0970 -1.1073 |  1.0791  1.0653
v_err    | -0.0097 |  0.0560 | -0.4515 |  0.1987
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |   -0.01    0.15 |    0.64    1.85 |   -1.39   -3.14 |    1.46    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.29 |    0.23 |   -1.31 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.31 |    0.00 |    2.98
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    0.98    0.99
cs_angles | -0.0010  0.0020 |  0.0816  0.0841 | -0.9975 -0.9911 |  0.9794  0.9928
optical_flow |  0.0000 -0.0000 |  0.0210  0.0240 | -0.9775 -1.0041 |  0.9330  0.8993
v_err    | -0.0098 |  0.0567 | -0.4527 |  0.1369
landing_rewards |    9.81 |    1.38 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.05
tracking_rewards |  -22.23 |    4.77 |  -39.22 |  -12.92
steps    |     378 |  

attitude |   -0.02    0.03    0.00 |    1.17    0.66    1.81 |   -3.14   -1.56   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |    0.04   -0.01 |    0.66    1.80 |   -1.49   -3.11 |    1.48    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.03    0.04    0.02
w_rewards |   -0.27 |    0.23 |   -1.41 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.31 |    0.00 |    2.97
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.95   -1.00 |    0.99    0.97
cs_angles |  0.0008  0.0043 |  0.0822  0.0785 | -0.9504 -0.9987 |  0.9930  0.9689
optical_flow | -0.0000  0.0001 |  0.0217  0.0235 | -0.8897 -1.2428 |  1.1414  0.8914
v_err    | -0.0097 |  0.0560 | -0.4532 |  0.1128
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0

thrust   |   -0.00    0.01    0.00 |    0.68    0.67    0.67 |   -3.39   -3.43   -3.44 |    3.42    3.41    3.42
norm_thrust |    0.89 |    0.75 |    0.00 |    3.46
fuel     |    1.51 |    0.19 |    1.15 |    2.43
rewards  |  -16.95 |    5.46 |  -51.75 |   -7.65
fuel_rewards |   -4.31 |    0.53 |   -6.95 |   -3.31
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    2.73 |   12.57 |    0.00 |  180.92
norm_af  |    1.76 |    0.89 |    0.12 |    3.40
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |    0.00   -0.08    0.11 |    1.23    0.68    1.86 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.07    0.07    0.05
a_f      |   -0.07    0.10 |    0.68

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5176   1.0075   4.3755  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0012   0.0006   0.0025   8.0871   2.2896   2.8947
Update Cnt = 3490    ET =   1120.2   Stats:  Mean, Std, Min, Max
r_f      |   14.70  -20.41    5.70 |  185.72  169.34  202.74 | -385.59 -384.37 -393.09 |  368.34  370.29  378.84
v_f      |   -0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.10   -0.08   -0.11 |    0.09    0.09    0.10
r_i      |   44.46  -79.41   30.59 |  669.85  668.28  765.80 |-1318.21-1342.91-1341.84 | 1242.81 1345.14 1290.53
v_i      |   -0.00    0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.09   -0.10 |    0.09    0.10    0.09
norm_rf  |    0.18 |    0.07 |    0.02 |    0.45
norm_vf  |    0.08 |    0.01 |    0.04 |    0.12
gs_f     |    1.47 |    3.13 |    0.01 |   43.00
thrust   |   -0.01    0.00    0.00 |    0.67    0.69    0.67 |   -3.46   -3.45   -3.43 |    3.45    3.38    3.46
norm_thrust |    

ADV1:  6.758761883354638e-05 0.007572393031548479 0.05581260433642987 -0.0575288460550456
ADV2:  0.02130722665027057 0.8499645793214039 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.9848   2.1259   7.9871  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0002   0.0011   8.0871   2.2896   2.8947
***** Episode 108517, Mean R = -18.6  Std R = 7.4  Min R = -37.3
PolicyLoss: -0.0271
Policy_Beta: 0.1
Policy_Entropy: 0.171
Policy_KL: 0.00119
Policy_SD: 0.543
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 4.01e+07
VF_0_ExplainedVarNew: 0.992
VF_0_ExplainedVarOld: 0.99
VF_0_Loss : 0.0028


ADV1:  0.0005568495115635825 0.008355234952126742 0.061753513423959516 -0.06869828638198217
ADV2:  0.016915507934475705 0.837446250144639 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3436   0.9039   4.7587  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0017   8.0871   2.2896   2.8947
U

ADV1:  -0.0001272300887321463 0.007579321956789523 0.06417141518873293 -0.12447264397507374
ADV2:  0.008619856477755917 0.7433099752128726 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9387   0.9740   4.1720  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0005   8.0871   2.2896   2.8947
***** Episode 108796, Mean R = -15.5  Std R = 4.6  Min R = -29.5
PolicyLoss: -0.0109
Policy_Beta: 0.1
Policy_Entropy: 0.171
Policy_KL: 0.000979
Policy_SD: 0.531
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 4.02e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.987
VF_0_Loss : 0.00224


ADV1:  -0.001089023058671578 0.007958032433535933 0.04246773782145785 -0.07761327838825877
ADV2:  0.02807728204735928 0.8493397799407207 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0055   0.9987   5.3042  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0032   8.0871   2.2896   2.89

ADV1:  -0.0018236024359013128 0.0076905203834597875 0.06342938683006949 -0.06928133523353552
ADV2:  0.03250338935259809 0.8436314605922156 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0420   1.1349   4.9664  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0021   0.0012   0.0047   8.0871   2.2896   2.8947
***** Episode 109075, Mean R = -17.1  Std R = 6.9  Min R = -31.2
PolicyLoss: -0.0223
Policy_Beta: 0.1
Policy_Entropy: 0.173
Policy_KL: 0.00123
Policy_SD: 0.528
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 4.03e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.988
VF_0_Loss : 0.00172


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.0007547334662963426 0.007371241672944743 0.07256726856384504 -0.11724794292390006
ADV2:  -0.016729247225489963 0.80799107020667 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4887   1.4589   7.4544  29.5271  18.5111  12.4602
ValFun  

ADV1:  -0.0008052118013055794 0.005621581925505161 0.04526979749212179 -0.05571920166209432
ADV2:  0.013967245637041907 0.8679927102296111 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0289   0.7506   3.2850  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0021   8.0871   2.2896   2.8947
***** Episode 109354, Mean R = -15.4  Std R = 3.4  Min R = -23.5
PolicyLoss: -0.00844
Policy_Beta: 0.1
Policy_Entropy: 0.171
Policy_KL: 0.000847
Policy_SD: 0.538
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 4.04e+07
VF_0_ExplainedVarNew: 0.994
VF_0_ExplainedVarOld: 0.993
VF_0_Loss : 0.00234


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.00012104497125809732 0.0069663178008500925 0.049436441863321134 -0.047249913990814095
ADV2:  0.019861584921196197 0.8223259155882519 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.5195   0.6369   3.5185  29.5271  18.5111  12.4602


***** Episode 109602, Mean R = -17.4  Std R = 4.9  Min R = -26.6
PolicyLoss: -0.0115
Policy_Beta: 0.1
Policy_Entropy: 0.171
Policy_KL: 0.00108
Policy_SD: 0.546
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 4.05e+07
VF_0_ExplainedVarNew: 0.994
VF_0_ExplainedVarOld: 0.992
VF_0_Loss : 0.00239


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.00041910130035581743 0.0071841576327170385 0.044971066444999486 -0.06659174402925921
ADV2:  0.02170929145034724 0.8106393544128171 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.9945   0.9391   4.0070  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0011   8.0871   2.2896   2.8947
***** Episode 109633, Mean R = -17.6  Std R = 5.6  Min R = -34.9
PolicyLoss: -0.0223
Policy_Beta: 0.1
Policy_Entropy: 0.171
Policy_KL: 0.00106
Policy_SD: 0.548
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 4.05e+07
VF_0_ExplainedVarNew: 0.99
VF_0_Expl

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.2558   0.4817   2.3223  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0053   0.0029   0.0128   8.0871   2.2896   2.8947
***** Episode 109881, Mean R = -15.6  Std R = 5.6  Min R = -30.0
PolicyLoss: 0.0363
Policy_Beta: 0.1
Policy_Entropy: 0.172
Policy_KL: 0.000716
Policy_SD: 0.531
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 4.06e+07
VF_0_ExplainedVarNew: 0.967
VF_0_ExplainedVarOld: 0.92
VF_0_Loss : 0.00658


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.0034029522691859247 0.012081084064913898 0.11098115453443086 -0.109780977659511
ADV2:  -0.002849000051948951 0.8406370185416615 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4089   1.1017   6.3885  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0056   0.0030   0.0116   8.0871   2.2896   2.8947
***** Episode 109912, Mean R = -15.2  Std R = 3.5  Min

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.0003686846816870038 0.008269710746315955 0.07689212427860448 -0.12470559591929026
ADV2:  0.008730648373631114 0.8051820719044315 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0424   1.3477   6.9255  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0011   8.0871   2.2896   2.8947
***** Episode 110160, Mean R = -16.9  Std R = 5.7  Min R = -33.4
PolicyLoss: -0.0164
Policy_Beta: 0.1
Policy_Entropy: 0.171
Policy_KL: 0.000946
Policy_SD: 0.537
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 4.07e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.0032


ADV1:  -0.0013207217738391717 0.010473046863499407 0.09683033625414161 -0.1608192212687215
ADV2:  0.020696414053742156 0.7994652565705521 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.8842   0.7385   3.9421  29.5271  18.5111  12.4602
ValFun  

Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  0.002515045358277254 0.009132201500372465 0.08313822993585623 -0.2066205530261831
ADV2:  0.004344715247334772 0.7705608437763278 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0560   1.5391   5.7676  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0033   0.0019   0.0070   8.0871   2.2896   2.8947
***** Episode 110439, Mean R = -16.6  Std R = 7.4  Min R = -44.1
PolicyLoss: -0.0294
Policy_Beta: 0.1
Policy_Entropy: 0.172
Policy_KL: 0.00093
Policy_SD: 0.533
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 4.08e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00323


ADV1:  -0.002506098899302676 0.012644357882502889 0.09422678749555313 -0.2840691403150468
ADV2:  0.0449312851040319 0.5909642799886042 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3139   0.7036   3.6478  29.5271  18.5111  12.4602
ValFun  Gradi

optical_flow | -0.0000  0.0000 |  0.0215  0.0240 | -0.8376 -1.1103 |  0.9543  1.0457
v_err    | -0.0101 |  0.0587 | -0.9453 |  0.1020
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |    2.83 |   50.16 |   -0.06 |  884.61
tracking_rewards |  -22.39 |    6.58 |  -95.22 |  -12.22
steps    |     375 |      26 |      87 |     415
***** Episode 110718, Mean R = -16.8  Std R = 4.8  Min R = -29.8
PolicyLoss: -0.022
Policy_Beta: 0.1
Policy_Entropy: 0.17
Policy_KL: 0.000926
Policy_SD: 0.547
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 4.09e+07
VF_0_ExplainedVarNew: 0.986
VF_0_ExplainedVarOld: 0.982
VF_0_Loss : 0.00499


ADV1:  0.0003164860093329716 0.00863406148635327 0.10906288289301208 -0.09052943334485641
ADV2:  -0.004679061450851803 0.8184451067360045 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1162   0.6666   3.3369  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0006   0.0003   0.0012   8.0871   2.2896   2.8947


attitude |   -0.01   -0.01    0.06 |    1.20    0.68    1.82 |   -3.14   -1.56   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |   -0.01    0.03 |    0.68    1.83 |   -1.47   -3.14 |    1.45    3.12
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.29 |    0.23 |   -1.65 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    3.04
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.97   -1.00 |    0.97    0.99
cs_angles |  0.0000  0.0036 |  0.0811  0.0869 | -0.9697 -0.9989 |  0.9736  0.9874
optical_flow |  0.0000 -0.0000 |  0.0212  0.0251 | -1.3119 -1.2595 |  1.0802  0.9874
v_err    | -0.0098 |  0.0562 | -0.4514 |  0.0995
landing_rewards |    9.61 |    1.93 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.03   -0.06   -0.06 |    1.15    0.64    1.88 |   -3.14   -1.54   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.09    0.07    0.06
a_f      |   -0.06   -0.08 |    0.64    1.90 |   -1.52   -3.14 |    1.49    3.12
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.29 |    0.28 |   -2.16 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.93
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.96   -0.98 |    0.97    1.00
cs_angles | -0.0011  0.0027 |  0.0836  0.0808 | -0.9607 -0.9792 |  0.9665  0.9951
optical_flow | -0.0000 -0.0000 |  0.0217  0.0238 | -1.1205 -1.0829 |  1.0260  0.9513
v_err    | -0.0098 |  0.0564 | -0.4585 |  0.1302
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.06   -0.00   -0.03 |    1.04    0.62    1.77 |   -3.14   -1.55   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.07    0.07    0.06
a_f      |   -0.00   -0.03 |    0.62    1.78 |   -1.53   -3.13 |    1.40    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.28 |    0.21 |   -1.47 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.31 |    0.00 |    3.02
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -1.00   -0.99 |    0.98    0.97
cs_angles |  0.0022  0.0028 |  0.0811  0.0808 | -0.9995 -0.9891 |  0.9787  0.9687
optical_flow | -0.0001  0.0001 |  0.0228  0.0239 | -1.1720 -1.1546 |  1.1679  1.2710
v_err    | -0.0097 |  0.0560 | -0.4535 |  0.2351
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.04    0.02   -0.13 |    1.23    0.64    1.86 |   -3.14   -1.55   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.06   -0.08 |    0.09    0.07    0.05
a_f      |    0.02   -0.16 |    0.64    1.86 |   -1.38   -3.13 |    1.53    3.08
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.02    0.02
w_rewards |   -0.33 |    0.38 |   -3.65 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.32 |    0.00 |    3.08
seeker_angles |    0.00    0.01 |    0.08    0.09 |   -0.98   -0.94 |    0.98    1.00
cs_angles |  0.0006  0.0079 |  0.0821  0.0860 | -0.9834 -0.9432 |  0.9782  0.9973
optical_flow | -0.0001 -0.0001 |  0.0208  0.0240 | -0.8832 -1.2589 |  1.0202  1.1917
v_err    | -0.0098 |  0.0575 | -0.5498 |  0.1194
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.01   -0.03   -0.16 |    1.22    0.69    1.83 |   -3.14   -1.56   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.06   -0.07 |    0.09    0.07    0.07
a_f      |   -0.03   -0.06 |    0.68    1.85 |   -1.48   -3.10 |    1.47    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.06   -0.02 |    0.08    0.03    0.06
w_rewards |   -0.31 |    0.56 |   -9.14 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |   -0.16 |    2.84 |  -50.00 |    0.00
theta_cv |    0.26 |    0.31 |    0.00 |    2.99
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.97   -0.97 |    1.00    1.00
cs_angles |  0.0002  0.0038 |  0.0788  0.0826 | -0.9700 -0.9664 |  0.9979  0.9986
optical_flow | -0.0002  0.0001 |  0.0226  0.0250 | -0.8659 -1.1754 |  1.2379  1.3521
v_err    | -0.0098 |  0.0580 | -0.7383 |  0.1105
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |    2

attitude |   -0.06    0.03   -0.13 |    1.25    0.66    1.88 |   -3.14   -1.54   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |    0.02   -0.11 |    0.66    1.89 |   -1.49   -3.14 |    1.47    3.12
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.29 |    0.23 |   -1.39 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.31 |    0.00 |    3.03
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.97   -0.98 |    0.99    0.99
cs_angles | -0.0005  0.0015 |  0.0788  0.0812 | -0.9665 -0.9817 |  0.9934  0.9923
optical_flow |  0.0002 -0.0000 |  0.0225  0.0232 | -1.2500 -1.1287 |  1.1133  1.0354
v_err    | -0.0094 |  0.0563 | -0.4528 |  0.1156
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |   -0.01    0.06 |    0.70    1.81 |   -1.51   -3.14 |    1.51    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.27 |    0.23 |   -1.67 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.32 |    0.00 |    3.06
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.98   -0.98 |    0.98    0.98
cs_angles |  0.0020  0.0029 |  0.0825  0.0833 | -0.9829 -0.9819 |  0.9773  0.9815
optical_flow | -0.0000  0.0001 |  0.0219  0.0249 | -1.0444 -1.1129 |  1.0226  1.0512
v_err    | -0.0089 |  0.0556 | -0.4520 |  0.1116
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.05 |    0.02
tracking_rewards |  -21.81 |    4.93 |  -41.58 |  -13.53
steps    |     376 |  

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.05   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |    0.05   -0.09 |    0.61    1.85 |   -1.44   -3.10 |    1.47    3.12
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.29 |    0.21 |   -1.18 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.31 |    0.00 |    3.01
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.97   -0.98 |    0.98    0.99
cs_angles | -0.0009  0.0038 |  0.0819  0.0809 | -0.9652 -0.9818 |  0.9753  0.9899
optical_flow | -0.0001  0.0001 |  0.0220  0.0245 | -1.2546 -1.0131 |  1.0664  1.0638
v_err    | -0.0088 |  0.0557 | -0.4537 |  0.1519
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -21.50 |    4.49 |  -37.57 |  -12.34
steps    |     375 |  

thrust   |    0.00    0.01    0.00 |    0.67    0.67    0.68 |   -3.45   -3.42   -3.44 |    3.46    3.43    3.46
norm_thrust |    0.89 |    0.76 |    0.00 |    3.46
fuel     |    1.53 |    0.18 |    1.10 |    2.21
rewards  |  -16.28 |    5.37 |  -37.57 |   -7.57
fuel_rewards |   -4.40 |    0.52 |   -6.34 |   -3.15
glideslope_rewards |    0.00 |    0.00 |    0.00 |    0.00
glideslope_penalty |    0.00 |    0.00 |    0.00 |    0.00
glideslope |    3.11 |   13.29 |    0.00 |  557.27
norm_af  |    1.77 |    0.93 |    0.02 |    3.25
norm_wf  |    0.01 |    0.01 |    0.00 |    0.03
rh_penalty |    0.00 |    0.00 |    0.00 |    0.00
att_rewards |    0.00 |    0.00 |    0.00 |    0.00
att_penalty |    0.00 |    0.00 |    0.00 |    0.00
attitude |   -0.07   -0.01   -0.13 |    1.29    0.67    1.88 |   -3.14   -1.57   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |   -0.00   -0.13 |    0.67

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3055   1.2536   4.7191  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0014   0.0009   0.0032   8.0871   2.2896   2.8947
Update Cnt = 3670    ET =   1037.1   Stats:  Mean, Std, Min, Max
r_f      |   18.18    1.31    7.92 |  191.51  173.86  193.91 | -383.64 -389.45 -391.24 |  392.71  376.05  384.49
v_f      |   -0.00   -0.00   -0.00 |    0.05    0.04    0.05 |   -0.10   -0.13   -0.10 |    0.09    0.09    0.10
r_i      |   61.63   15.43   33.62 |  693.38  678.08  739.84 |-1345.53-1267.10-1318.92 | 1317.66 1353.64 1300.97
v_i      |   -0.00   -0.00   -0.00 |    0.04    0.04    0.05 |   -0.09   -0.10   -0.09 |    0.09    0.09    0.09
norm_rf  |    0.17 |    0.06 |    0.03 |    0.39
norm_vf  |    0.08 |    0.01 |    0.04 |    0.14
gs_f     |    1.13 |    1.53 |    0.01 |   13.74
thrust   |   -0.01   -0.00   -0.00 |    0.67    0.69    0.69 |   -3.46   -3.46   -3.44 |    3.42    3.46    3.41
norm_thrust |    

ADV1:  -0.0016033958935971163 0.008550367989491112 0.048023551113089424 -0.0657696104767754
ADV2:  0.040119380402960626 0.8302427372439363 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3819   0.6991   3.6531  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0018   0.0010   0.0042   8.0871   2.2896   2.8947
***** Episode 114097, Mean R = -16.2  Std R = 6.7  Min R = -36.3
PolicyLoss: -0.0302
Policy_Beta: 0.1
Policy_Entropy: 0.175
Policy_KL: 0.000965
Policy_SD: 0.534
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 4.22e+07
VF_0_ExplainedVarNew: 0.985
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.0056


ADV1:  -5.802630814043321e-05 0.008112903226006472 0.15142229449316752 -0.13474077855824695
ADV2:  0.003518527205302707 0.763337354959309 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.0981   1.3160   6.2830  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0002   0.0001   0.0003   8.0871   2.2896   2.8

ADV1:  0.0008061296310393231 0.00692779662598071 0.042759823502933836 -0.05305912011186775
ADV2:  0.004141412376893667 0.882176177932359 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   4.0260   1.9734  10.4185  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0021   8.0871   2.2896   2.8947
***** Episode 114376, Mean R = -16.6  Std R = 4.9  Min R = -26.2
PolicyLoss: -0.0174
Policy_Beta: 0.1
Policy_Entropy: 0.171
Policy_KL: 0.00117
Policy_SD: 0.55
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 4.23e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.99
VF_0_Loss : 0.00592


ADV1:  -0.0007600480742620965 0.006939052012004054 0.07444403787697468 -0.051558441308103074
ADV2:  0.020392209443481964 0.842336902991549 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4149   1.5941   6.3757  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0008   0.0005   0.0020   8.0871   2.2896   2.8947

***** Episode 114624, Mean R = -15.6  Std R = 4.4  Min R = -25.0
PolicyLoss: -0.00552
Policy_Beta: 0.1
Policy_Entropy: 0.174
Policy_KL: 0.00093
Policy_SD: 0.524
Policy_lr_mult: 0.198
Steps: 1.18e+04
TotalSteps: 4.24e+07
VF_0_ExplainedVarNew: 0.995
VF_0_ExplainedVarOld: 0.994
VF_0_Loss : 0.0057


ADV1:  0.00042324234366521613 0.0070834453667136185 0.08081139671183701 -0.05510831018532625
ADV2:  0.014151866104910347 0.8269623118835502 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.3879   0.9498   3.7563  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0005   0.0003   0.0011   8.0871   2.2896   2.8947
***** Episode 114655, Mean R = -15.6  Std R = 4.9  Min R = -29.0
PolicyLoss: -0.0214
Policy_Beta: 0.1
Policy_Entropy: 0.174
Policy_KL: 0.00091
Policy_SD: 0.525
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 4.24e+07
VF_0_ExplainedVarNew: 0.99
VF_0_ExplainedVarOld: 0.989
VF_0_Loss : 0.00467


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.00

Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.3612   1.3249   5.4147  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0007   0.0003   0.0015   8.0871   2.2896   2.8947
***** Episode 114903, Mean R = -18.8  Std R = 5.9  Min R = -34.9
PolicyLoss: -0.0271
Policy_Beta: 0.1
Policy_Entropy: 0.172
Policy_KL: 0.00104
Policy_SD: 0.554
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 4.25e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.00819


ADV1:  -0.001173767220574873 0.009669926654313358 0.11463740525204624 -0.10216420751798644
ADV2:  0.02274477409013791 0.7796243535436141 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.6572   0.5413   3.0772  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0031   8.0871   2.2896   2.8947
***** Episode 114934, Mean R = -17.1  Std R = 4.5  Min R = -25.9
PolicyLoss: -0.0186
Policy_Beta: 0.1
Policy_Entropy: 0.172
Policy_KL: 0.00135
Po

ADV1:  0.000689514703864162 0.008853589537606213 0.07959770494814639 -0.08162346362276252
ADV2:  -0.007880373405149223 0.8176459987653731 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.1774   0.9444   4.4643  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0009   0.0005   0.0020   8.0871   2.2896   2.8947
***** Episode 115182, Mean R = -16.4  Std R = 5.3  Min R = -33.0
PolicyLoss: -0.0024
Policy_Beta: 0.1
Policy_Entropy: 0.173
Policy_KL: 0.00122
Policy_SD: 0.546
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 4.26e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.984
VF_0_Loss : 0.00989


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0030699940527524608 0.009493842359491897 0.045041227339221 -0.09296152284185655
ADV2:  0.04898774642389925 0.8652648363806597 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   3.2401   1.5708   8.9453  29.5271  18.5111  12.4602
ValFun  Gr

ADV1:  -0.0002208000697902353 0.006930344125111328 0.06786205170968712 -0.06903850197583583
ADV2:  0.011671311294339575 0.8606389300655714 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.7594   0.7158   3.1225  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0004   0.0002   0.0008   8.0871   2.2896   2.8947
***** Episode 115461, Mean R = -15.8  Std R = 5.6  Min R = -41.7
PolicyLoss: -0.0137
Policy_Beta: 0.1
Policy_Entropy: 0.174
Policy_KL: 0.000833
Policy_SD: 0.527
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 4.27e+07
VF_0_ExplainedVarNew: 0.991
VF_0_ExplainedVarOld: 0.99
VF_0_Loss : 0.00572


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.0021330583573576653 0.008275583882627462 0.051523307009079755 -0.05552551783335211
ADV2:  0.038940164586987985 0.8294850221606671 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4940   1.3224   7.1951  29.5271  18.5111  12.4602
ValFu

***** Episode 115709, Mean R = -15.8  Std R = 4.0  Min R = -27.0
PolicyLoss: 0.00309
Policy_Beta: 0.1
Policy_Entropy: 0.172
Policy_KL: 0.00106
Policy_SD: 0.541
Policy_lr_mult: 0.198
Steps: 1.15e+04
TotalSteps: 4.28e+07
VF_0_ExplainedVarNew: 0.993
VF_0_ExplainedVarOld: 0.991
VF_0_Loss : 0.00766


ADV1:  -0.0030451619260086784 0.00801596433110751 0.037488252291098756 -0.05055165267255812
ADV2:  0.043639181596696164 0.8803933842516537 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   2.4770   1.1200   5.1470  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0039   0.0022   0.0084   8.0871   2.2896   2.8947
***** Episode 115740, Mean R = -16.5  Std R = 5.3  Min R = -28.2
PolicyLoss: -0.0201
Policy_Beta: 0.1
Policy_Entropy: 0.174
Policy_KL: 0.00103
Policy_SD: 0.533
Policy_lr_mult: 0.198
Steps: 1.16e+04
TotalSteps: 4.28e+07
VF_0_ExplainedVarNew: 0.987
VF_0_ExplainedVarOld: 0.986
VF_0_Loss : 0.00674


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.00

v_err    | -0.0090 |  0.0561 | -0.4540 |  0.1228
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.06 |    0.01
tracking_rewards |  -21.85 |    4.83 |  -52.68 |  -12.51
steps    |     377 |      19 |     333 |     418
***** Episode 115988, Mean R = -16.8  Std R = 5.8  Min R = -31.0
PolicyLoss: -0.0258
Policy_Beta: 0.1
Policy_Entropy: 0.175
Policy_KL: 0.0011
Policy_SD: 0.533
Policy_lr_mult: 0.198
Steps: 1.17e+04
TotalSteps: 4.29e+07
VF_0_ExplainedVarNew: 0.989
VF_0_ExplainedVarOld: 0.985
VF_0_Loss : 0.00641


Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329
ADV1:  -0.001269566254146046 0.008510283598270049 0.0823894285517563 -0.06395093891564038
ADV2:  0.022014044628724087 0.8181341337029203 3.0 -3.0
Policy  Gradients: u/sd/Max/C Max/Max u/Max sd :   1.0591   0.6784   3.2431  29.5271  18.5111  12.4602
ValFun  Gradients: u/sd/Max/C Max/Max u/Max sd :   0.0015   0.0009   0.0034   8.0871   2.2896   2

attitude |   -0.04   -0.00    0.12 |    1.28    0.68    1.87 |   -3.14   -1.55   -3.14 |    3.14    1.53    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.09    0.07    0.05
a_f      |    0.01    0.16 |    0.69    1.86 |   -1.45   -3.13 |    1.45    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.03   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.25 |    0.33 |   -5.03 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.32 |    0.00 |    3.03
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.97   -1.00 |    0.99    0.99
cs_angles | -0.0016  0.0025 |  0.0819  0.0837 | -0.9667 -0.9950 |  0.9913  0.9917
optical_flow | -0.0000  0.0001 |  0.0209  0.0231 | -0.8737 -1.1615 |  0.9418  1.3666
v_err    | -0.0087 |  0.0560 | -0.4707 |  0.1337
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.02   -0.06   -0.17 |    1.09    0.61    1.81 |   -3.14   -1.57   -3.14 |    3.14    1.55    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.06   -0.07 |    0.07    0.07    0.05
a_f      |   -0.07   -0.16 |    0.61    1.81 |   -1.52   -3.13 |    1.44    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.02    0.02
w_rewards |   -0.28 |    0.22 |   -1.14 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.32 |    0.00 |    2.98
seeker_angles |    0.00   -0.00 |    0.08    0.09 |   -1.00   -1.00 |    0.98    1.00
cs_angles |  0.0010 -0.0023 |  0.0806  0.0857 | -0.9990 -0.9979 |  0.9838  0.9966
optical_flow |  0.0000  0.0001 |  0.0222  0.0257 | -1.2333 -1.2800 |  1.0670  1.2897
v_err    | -0.0093 |  0.0573 | -0.6020 |  0.1597
landing_rewards |    9.65 |    1.85 |    0.00 |   10.00
landing_margin |   -0

attitude |    0.05    0.06    0.03 |    1.25    0.70    1.83 |   -3.14   -1.55   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.08    0.07    0.06
a_f      |    0.06    0.08 |    0.70    1.83 |   -1.46   -3.13 |    1.50    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.25 |    0.26 |   -2.57 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.32 |    0.00 |    3.05
seeker_angles |    0.00    0.01 |    0.08    0.08 |   -0.98   -1.00 |    0.97    0.99
cs_angles |  0.0015  0.0078 |  0.0816  0.0847 | -0.9803 -0.9981 |  0.9661  0.9919
optical_flow | -0.0000 -0.0002 |  0.0216  0.0243 | -1.0647 -1.1854 |  1.1536  1.0087
v_err    | -0.0089 |  0.0557 | -0.4516 |  0.1237
landing_rewards |    9.48 |    2.21 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.07    0.07    0.07
a_f      |    0.08    0.12 |    0.66    1.90 |   -1.48   -3.14 |    1.44    3.14
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.27 |    0.22 |   -1.81 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.31 |    0.00 |    3.06
seeker_angles |    0.00    0.01 |    0.08    0.08 |   -0.94   -0.97 |    0.97    0.99
cs_angles |  0.0010  0.0065 |  0.0817  0.0804 | -0.9375 -0.9673 |  0.9717  0.9884
optical_flow |  0.0001 -0.0001 |  0.0213  0.0244 | -0.9787 -1.0517 |  1.0036  1.0569
v_err    | -0.0094 |  0.0550 | -0.4522 |  0.1211
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.05 |    0.05
tracking_rewards |  -21.80 |    4.45 |  -43.70 |  -13.23
steps    |     378 |  

attitude |   -0.00   -0.01   -0.13 |    1.15    0.68    1.86 |   -3.14   -1.57   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.07    0.07    0.05
a_f      |   -0.01   -0.16 |    0.68    1.87 |   -1.45   -3.13 |    1.50    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.26 |    0.22 |   -2.34 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.32 |    0.00 |    2.96
seeker_angles |    0.00   -0.00 |    0.08    0.09 |   -1.00   -1.00 |    1.00    0.93
cs_angles |  0.0034 -0.0007 |  0.0833  0.0864 | -0.9997 -0.9966 |  0.9973  0.9275
optical_flow |  0.0000 -0.0000 |  0.0222  0.0226 | -1.1544 -1.0334 |  1.0772  1.0426
v_err    | -0.0097 |  0.0563 | -0.4522 |  0.1370
landing_rewards |    9.52 |    2.15 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.04    0.01    0.18 |    1.17    0.63    1.79 |   -3.14   -1.55   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |    0.01    0.23 |    0.64    1.78 |   -1.48   -3.13 |    1.43    3.11
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.10   -0.02   -0.02 |    0.02    0.02    0.02
w_rewards |   -0.24 |    0.23 |   -2.40 |    0.00
w_penalty |   -0.32 |    5.67 | -100.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.32 |    0.00 |    3.11
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    0.94    1.00
cs_angles |  0.0030  0.0023 |  0.0839  0.0802 | -0.9873 -0.9999 |  0.9381  0.9967
optical_flow | -0.0001 -0.0001 |  0.0219  0.0222 | -0.8908 -1.2401 |  1.2605  1.2087
v_err    | -0.0094 |  0.0557 | -0.4530 |  0.2345
landing_rewards |    9.42 |    2.34 |    0.00 |   10.00
landing_margin |    3

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.06 |    0.08    0.07    0.05
a_f      |    0.01   -0.05 |    0.69    1.87 |   -1.44   -3.14 |    1.44    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.03   -0.03   -0.02 |    0.01    0.03    0.02
w_rewards |   -0.26 |    0.28 |   -2.62 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.32 |    0.00 |    2.97
seeker_angles |    0.00    0.00 |    0.08    0.09 |   -0.97   -0.97 |    1.00    1.00
cs_angles |  0.0033  0.0029 |  0.0793  0.0866 | -0.9710 -0.9681 |  0.9964  0.9975
optical_flow |  0.0000 -0.0000 |  0.0209  0.0237 | -0.9123 -1.1886 |  1.0041  1.0333
v_err    | -0.0093 |  0.0552 | -0.4535 |  0.0997
landing_rewards |    9.68 |    1.77 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.05 |    0.02
tracking_rewards |  -21.94 |    4.88 |  -50.70 |  -14.12
steps    |     378 |  

attitude |    0.05    0.02   -0.03 |    1.12    0.68    1.75 |   -3.14   -1.54   -3.14 |    3.14    1.54    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.09   -0.05   -0.07 |    0.09    0.07    0.07
a_f      |    0.02   -0.06 |    0.68    1.74 |   -1.47   -3.13 |    1.51    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.02    0.03    0.02
w_rewards |   -0.24 |    0.24 |   -2.17 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.32 |    0.00 |    2.91
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -0.98 |    0.98    0.98
cs_angles |  0.0040  0.0012 |  0.0800  0.0831 | -0.9910 -0.9814 |  0.9762  0.9791
optical_flow | -0.0001  0.0000 |  0.0220  0.0240 | -1.1385 -1.1740 |  1.1164  0.9702
v_err    | -0.0091 |  0.0555 | -0.4525 |  0.1194
landing_rewards |    9.71 |    1.68 |    0.00 |   10.00
landing_margin |   -0

attitude |   -0.10   -0.10    0.11 |    1.28    0.67    1.90 |   -3.14   -1.54   -3.14 |    3.14    1.57    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.06   -0.05   -0.07 |    0.07    0.07    0.05
a_f      |   -0.10    0.14 |    0.68    1.90 |   -1.51   -3.12 |    1.53    3.14
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.02    0.02
w_rewards |   -0.22 |    0.19 |   -1.35 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.32 |    0.00 |    3.06
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.99   -1.00 |    0.98    0.98
cs_angles |  0.0009  0.0024 |  0.0796  0.0792 | -0.9910 -0.9992 |  0.9849  0.9782
optical_flow |  0.0001  0.0001 |  0.0215  0.0236 | -0.9806 -0.9991 |  0.9273  1.3550
v_err    | -0.0088 |  0.0552 | -0.4533 |  0.1097
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.08   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |    0.01   -0.07 |    0.66    1.85 |   -1.40   -3.13 |    1.51    3.13
w_f      |   -0.00    0.00    0.00 |    0.01    0.01    0.01 |   -0.02   -0.02   -0.02 |    0.02    0.02    0.02
w_rewards |   -0.27 |    0.24 |   -1.94 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.32 |    0.00 |    3.00
seeker_angles |    0.00    0.00 |    0.08    0.08 |   -0.95   -0.99 |    0.99    0.99
cs_angles |  0.0021  0.0020 |  0.0825  0.0800 | -0.9506 -0.9892 |  0.9861  0.9934
optical_flow |  0.0001 -0.0000 |  0.0212  0.0242 | -1.0323 -1.3208 |  1.0891  1.1500
v_err    | -0.0089 |  0.0557 | -0.4525 |  0.1121
landing_rewards |    9.58 |    2.00 |    0.00 |   10.00
landing_margin |   -0.02 |    0.01 |   -0.05 |    0.02
tracking_rewards |  -21.64 |    4.58 |  -44.69 |  -13.43
steps    |     377 |  

attitude |    0.00   -0.04    0.05 |    1.21    0.66    1.85 |   -3.14   -1.56   -3.14 |    3.14    1.56    3.14
w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.07 |    0.08    0.07    0.05
a_f      |   -0.05    0.11 |    0.65    1.84 |   -1.46   -3.13 |    1.52    3.13
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.01 |    0.02    0.02    0.02
w_rewards |   -0.26 |    0.25 |   -2.51 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.26 |    0.32 |    0.00 |    3.00
seeker_angles |   -0.00    0.00 |    0.09    0.08 |   -0.99   -1.00 |    0.95    0.98
cs_angles | -0.0015  0.0036 |  0.0853  0.0818 | -0.9888 -0.9954 |  0.9502  0.9849
optical_flow | -0.0002 -0.0001 |  0.0224  0.0237 | -1.2922 -1.1123 |  1.0455  1.1418
v_err    | -0.0090 |  0.0555 | -0.4534 |  0.1079
landing_rewards |    9.77 |    1.49 |    0.00 |   10.00
landing_margin |   -0

w        |    0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.07   -0.05   -0.08 |    0.07    0.07    0.05
a_f      |    0.02   -0.30 |    0.63    1.82 |   -1.43   -3.14 |    1.45    3.12
w_f      |   -0.00    0.00   -0.00 |    0.01    0.01    0.01 |   -0.02   -0.03   -0.02 |    0.03    0.03    0.02
w_rewards |   -0.28 |    0.22 |   -1.09 |    0.00
w_penalty |    0.00 |    0.00 |    0.00 |    0.00
fov_penalty |    0.00 |    0.00 |    0.00 |    0.00
theta_cv |    0.25 |    0.31 |    0.00 |    3.00
seeker_angles |   -0.00    0.00 |    0.08    0.08 |   -0.99   -0.97 |    1.00    0.98
cs_angles | -0.0011  0.0023 |  0.0799  0.0791 | -0.9902 -0.9748 |  0.9973  0.9817
optical_flow |  0.0000 -0.0001 |  0.0233  0.0229 | -1.2577 -1.4266 |  0.9735  1.2344
v_err    | -0.0091 |  0.0550 | -0.4578 |  0.1425
landing_rewards |    9.74 |    1.59 |    0.00 |   10.00
landing_margin |   -0.03 |    0.01 |   -0.06 |    0.02
tracking_rewards |  -21.18 |    4.27 |  -38.49 |  -13.45
steps    |     378 |  

In [6]:
# Name under which the current policy parameters are saved.
# NOTE(review): how save_params turns this name into files on disk is defined
# in the Policy class, not in this notebook — confirm before relying on a path.
fname = "optimize_WATTVW_FOV-AR=5-RPT1"
policy.save_params(fname)


In [5]:
# Run a batch evaluation of the agent in test mode.
# NOTE(review): the recorded run of this cell ended in KeyboardInterrupt, and
# its execution count (5) precedes the save cell's (6) — re-run in order on a
# fresh kernel before trusting any results.
env.test_policy_batch(
    agent,
    5000,
    print_every=100,
    test_mode=True,
)

worked 1
Dynamics: Max Disturbance (m/s^2):  [0.00149461 0.0018056  0.00138071] 0.002720371623523329


KeyboardInterrupt: 