In [2]:
"""
- Rollouts
- Define networks
- GAE
- Utils : Normal distributions and log probability of an action
- train
- logging utilities

Experiment with shared network for both policy and value function
"""

using Flux, CuArrays
using OpenAIGym
import Reinforce.action
import Reinforce:run_episode
import Flux.params
using Flux.Tracker: grad, update!
using Flux: onehot
using Statistics
using Distributed
using Distributions
using LinearAlgebra
using Base.Iterators
using BSON:@save,@load
using JLD

"""
A few intricacies : 
The policy is a Normal distribution and the `policy_net` outputs the `μ` and `logσ`.
Each action is assumed to be independent of the others.
Thus our covariance matrix is a diagonal matrix with each element representing the variance of
taking a particular action.
"""

"""
Utilities
"""
# weight initialization
function _random_normal(shape...)
    return map(Float32,rand(Normal(0,0.1),shape...))
end

function constant_init(shape...)
    return map(Float32,ones(shape...) * 0.1)
end

function normal_log_prob(μ,log_std,a)
    """
    Returns the log probability of an action under a policy Gaussian policy π
    """
    σ = exp.(log_std)
    σ² = σ.^2
    -(((a .- μ).^2)./(2.0 * σ²)) .- 0.5*log.(sqrt(2 * π)) .- log.(σ)
end

function normal_entropy(log_std)
    0.5 + 0.5 * log(2 * π) .+ log_std
end

function normalise(arr)
    (arr .- mean(arr))./(sqrt(var(arr) + 1e-10))
end

# Logging #
"""
Create logging utility
"""
mutable struct Logger
    hist_dict
end

Logger() = Logger(Dict())

function register(l::Logger,name::String)
     l.hist_dict[name] = []
end

function add(l::Logger,name,value)
    """
    Add a variable for it's history to be logged
    """
    if !(name in l.hist_dict.keys)
        err("Error...")
    else
        push!(l.hist_dict[name],value)
    end
end

"""
HYPERPARAMETERS
"""
# Policy parameters #
η = 3e-4 # Learning rate
STD = 0.0 # Standard deviation
HIDDEN_SIZE = 256
# Environment Variables #
STATE_SIZE = 3
ACTION_SIZE = 1
MIN_RANGE = -2.0f0
MAX_RANGE = 2.0f0
EPISODE_LENGTH = 20
TEST_STEPS = 10000
# GAE parameters
γ = 0.99
λ = 0.95
# Optimization parameters
PPO_EPOCHS = 4
NUM_EPISODES = 2000
BATCH_SIZE = 5
c₀ = 1.0
c₁ = 0.5
c₂ = 0.001
# PPO parameters
ϵ = 0.2
# FREQUENCIES
SAVE_FREQUENCY = 50
VERBOSE_FREQUENCY = 50
global_step = 0
# policy_type = "gaussian"

reward_hist = []

mutable struct PendulumPolicy <: Reinforce.AbstractPolicy
  train::Bool

  function PendulumPolicy(train = true)
    new(train)
  end
end

"""
Define the networks
"""
# if policy_type == "gaussian"
policy_μ = Chain(Dense(STATE_SIZE,HIDDEN_SIZE,relu;initW = _random_normal,initb=constant_init),
                 Dense(HIDDEN_SIZE,ACTION_SIZE;initW = _random_normal,initb=constant_init),
                 x->tanh.(x),
                 x->param(2.0) .* x) 
policy_Σ = param(ones(ACTION_SIZE) * STD)

value = Chain(Dense(STATE_SIZE,HIDDEN_SIZE,relu),
                  Dense(HIDDEN_SIZE,1))

# elseif policy_type == "linear"
#     policy = Chain(Dense(STATE_SIZE,HIDDEN_SIZE,relu;initW = _random_normal,initb=constant_init),
#                      Dense(HIDDEN_SIZE,ACTION_SIZE;initW = _random_normal,initb=constant_init),
#                      x->tanh.(x))
    
#     value = Chain(Dense(STATE_SIZE,HIDDEN_SIZE,relu),
#                   Dense(HIDDEN_SIZE,1))
# end

# Optimizer
opt = ADAM(η)

function action(state)
    # Acccounting for the element type
    state = reshape(Array(state),length(state),1)
    
    a = nothing
    # Our policy outputs the parameters of a Normal distribution
#     if policy_type == "gaussian"
    μ = policy_μ(state)
    μ = reshape(μ,ACTION_SIZE)
    log_std = policy_Σ
    
    σ² = (exp.(log_std)).^2
    Σ = diagm(0=>σ².data)
    
    dis = MvNormal(μ.data,Σ)
    
    a = rand(dis,ACTION_SIZE)
    
#     elseif policy_type == "linear"
#         out = policy(state)
#     end
    a
end

function run_episode(env)
    experience = []
    
    s = reset!(env)
    for i in 1:EPISODE_LENGTH
        a = action(s)
        a = convert.(Float64,a)
        a = reshape(a,ACTION_SIZE)
        
        r,s_ = step!(env,a)
        push!(experience,(s,a,r,s_))
        s = s_
        if env.done
           break 
        end
    end
    experience
end


function test_run(env)
    ep_r = 0.0
    
    s = reset!(env)
    for i in 1:TEST_STEPS
        OpenAIGym.render(env)
        a = policy_μ(s).data
        a = convert.(Float64,a)
        a = reshape(a,ACTION_SIZE)
        println("Action : $a")
        
        r,s_ = step!(env,a)
        ep_r += r
        
        s = s_
        if env.done
           break 
        end
    end
    ep_r
end

test_run (generic function with 1 method)

In [3]:
"""
Rollout collection
"""
num_processes = 9
addprocs(num_processes) 

@everywhere function collect(env)
    run_episode(env)
end

@everywhere function rollout()
  env = GymEnv(:Pendulum,:v0)
  return collect(env)
end

function get_rollouts()
    g = []
    for  w in workers()
      push!(g, rollout())
    end

    rollouts = fetch.(g)
end

get_rollouts (generic function with 1 method)

In [4]:
function gae(states,actions,rewards,next_states)
    """
    Returns a Generalized Advantage Estimate for an episode
    """
    Â = []
    A = 0.0
    for i in reverse(1:length(states))
        δ = rewards[i] + γ*value(next_states[i]).data[1] - value(states[i]).data[1]
        A = δ + (γ*λ*A)
        push!(Â,A)
    end
    
    Â = reverse(Â)
    return Â
end

function disconunted_returns(rewards)
    r = 0.0
    returns = []
    for i in reverse(1:length(rewards))
        r = rewards[i] + γ*r
        push!(returns,r)
    end
    returns = reverse(returns)
    returns
end

function log_prob_from_actions(states,actions)
    """
    Returns log probabilities of the actions taken
    
    states,actions : episode vairbles in the form of a list
    """
    log_probs = []
    
    for i in 1:length(states)
        μ = reshape(policy_μ(states[i]),ACTION_SIZE).data
        logΣ = policy_Σ.data
        push!(log_probs,normal_log_prob(μ,logΣ,actions[i]))
    end
    
    log_probs
end

function process_rollouts(rollouts)
    """
    rollouts : variable returned by calling `get_rollouts`
    
    Returns : 
    states, actions, rewards for minibatch processing
    """
    # Process the variables
    states = []
    actions = []
    rewards = []
    next_states = []
    advantages = []
    returns = []
    log_probs = []
    
    # Logging statistics
    episode_mean_returns = []
    
    for ro in rollouts
        episode_states = []
        episode_actions = []
        episode_rewards = []
        episode_next_states = []
        
        for i in 1:length(ro)
             push!(episode_states,Array(ro[i][1]))
             push!(episode_actions,ro[i][2])
             push!(episode_rewards,ro[i][3])
             push!(episode_next_states,ro[i][4])
        end
        
#         println("Ep Max A : $(maximum(episode_actions))")
        
        episode_advantages = gae(episode_states,episode_actions,episode_rewards,episode_next_states)
        episode_returns = disconunted_returns(episode_rewards)
        
        push!(episode_mean_returns,mean(episode_returns))
        
        episode_advantages = normalise(episode_advantages)
        
        push!(states,episode_states)
        push!(actions,episode_actions)
        push!(rewards,episode_rewards)
        push!(advantages,episode_advantages)
        push!(returns,episode_returns)
        push!(log_probs,log_prob_from_actions(episode_states,episode_actions))
    end
    
    states = cat(states...,dims=1)
    actions = cat(actions...,dims=1)
    rewards = cat(rewards...,dims=1)
    advantages = cat(advantages...,dims=1)
    returns = cat(returns...,dims=1)
    log_probs = cat(log_probs...,dims=1)
    
    push!(reward_hist,mean(episode_mean_returns))
    
    if length(reward_hist) <= 100
        println("RETURNS : $(mean(episode_mean_returns))")
    else
        println("LAST 100 RETURNS : $(mean(reward_hist[end-100:end]))")
    end
    
    return hcat(states...),hcat(actions...),hcat(rewards...),hcat(advantages...),hcat(returns...),hcat(log_probs...)
end

process_rollouts (generic function with 1 method)

In [5]:
function print_losses(pl,vl,el) 
   println("------")
   println("Policy Loss : $pl")
   println("Value Loss : $vl")
   println("Entropy Loss : $el") 
   println("------")
end

function loss(states,actions,advantages,returns,old_log_probs)
#     println("---")
#     println(size(states))
#     println("States : $states")
#     println("---")
#     println("Actions : $actions")
#     println("---")
    global global_step
    global_step += 1
    
    μ = policy_μ(states)
    logΣ = policy_Σ
    
#     println("μ : $μ")
#     println("---")
#     println("logΣ : $logΣ")
#     println("---")
    
    new_log_probs = normal_log_prob(μ,logΣ,actions)
#     println("New Log Probs : $new_log_probs")
#     println("Old Log Probs : $old_log_probs")
    
    # Surrogate loss computation
    ratio = exp.(new_log_probs .- old_log_probs)
    surr1 = ratio .* advantages
    surr2 = clamp.(ratio,1.0 - ϵ,1.0 + ϵ)
    policy_loss = mean(min.(surr1,surr2))
    
#     println("Surr1 : $surr1")
#     println("Surr2 : $surr2")
#     println("Policy Loss : $policy_loss")
    
    value_predicted = value(states)
    value_loss = mean((value_predicted .- returns).^2)
#     println("Value Loss : $value_loss")
    
    entropy_loss = mean(normal_entropy(logΣ))
    
#     if global_step % VERBOSE_FREQUENCY == 0
#         print_losses(policy_loss.data,value_loss.data,entropy_loss.data)
#     end
    
    -c₀*policy_loss + c₁*value_loss # - c₂*entropy_loss
end

function ppo_update(states,actions,advantages,returns,old_log_probs)
    # Define model parameters
    model_params = params(params(policy_μ)...,params(policy_Σ)...,params(value)...)

    # Calculate gradients
    gs = Tracker.gradient(() -> loss(states,actions,advantages,returns,old_log_probs),model_params)
#     println("Gradient Done")
    
    g = gs[policy_μ.layers[1].W]
#     println("GRAD : $(mean(g))")
    # Take a step of optimisation
    update!(opt,model_params,gs)
#     println("Update Done")
end

function train_step()    
    routs = get_rollouts()
    states,actions,rewards,advantages,returns,log_probs = process_rollouts(routs)
    
    idxs = partition(1:size(states)[end],BATCH_SIZE)
    
    for epoch in 1:PPO_EPOCHS
#         println("Epoch : $epoch")
        for i in idxs
#             println(i)
            mb_states = states[:,i] 
            mb_actions = actions[:,i] 
            mb_advantages = advantages[:,i] 
            mb_returns = returns[:,i] 
            mb_log_probs = log_probs[:,i]
            
            ppo_update(mb_states,mb_actions,mb_advantages,mb_returns,mb_log_probs)
        end
    end
end

function train()
    for i in 1:NUM_EPISODES
        println("EP : $i")
        train_step()
        println("Ep done")
        
        if i%SAVE_FREQUENCY == 0
            @save "weights/policy_mu.bson" policy_μ
            @save "weights/policy_sigma.bson" policy_Σ
            @save "weights/value.bson" value
            
            save("stats.jld","rewards",reward_hist)
            println("\n\n\n----MAX REWRD SO FAR : $(maximum(reward_hist))---\n\n\n")
        end
    end
end

train (generic function with 1 method)

In [6]:
train()

EP : 1


│   caller = #GymEnv#1(::Type, ::Type, ::Symbol, ::Symbol) at OpenAIGym.jl:49
└ @ OpenAIGym /home/shreyas/.julia/packages/OpenAIGym/wZkkM/src/OpenAIGym.jl:49
│   caller = GymEnv(::Symbol, ::Symbol, ::PyCall.PyObject, ::Type) at OpenAIGym.jl:56
└ @ OpenAIGym /home/shreyas/.julia/packages/OpenAIGym/wZkkM/src/OpenAIGym.jl:56
│   caller = GymEnv{PyCall.PyArray{Float64,1}}(::Symbol, ::Symbol, ::PyCall.PyObject, ::PyCall.PyObject, ::PyCall.PyArray{Float64,1}) at OpenAIGym.jl:34
└ @ OpenAIGym /home/shreyas/.julia/packages/OpenAIGym/wZkkM/src/OpenAIGym.jl:34
│   caller = GymEnv{PyCall.PyArray{Float64,1}}(::Symbol, ::Symbol, ::PyCall.PyObject, ::PyCall.PyObject, ::PyCall.PyArray{Float64,1}) at OpenAIGym.jl:34
└ @ OpenAIGym /home/shreyas/.julia/packages/OpenAIGym/wZkkM/src/OpenAIGym.jl:34
│   caller = actions(::GymEnv{PyCall.PyArray{Float64,1}}, ::Nothing) at OpenAIGym.jl:117
└ @ OpenAIGym /home/shreyas/.julia/packages/OpenAIGym/wZkkM/src/OpenAIGym.jl:117
│   caller = actionset(::PyCall.PyObject

RETURNS : -66.00464906199679
Ep done
EP : 2
RETURNS : -60.828709201813844
Ep done
EP : 3
RETURNS : -57.1118626688542
Ep done
EP : 4
RETURNS : -66.91570343846391
Ep done
EP : 5
RETURNS : -67.03777485796535
Ep done
EP : 6
RETURNS : -51.236294703649676
Ep done
EP : 7
RETURNS : -72.27709944958444
Ep done
EP : 8
RETURNS : -66.82793205969216
Ep done
EP : 9
RETURNS : -66.03147814761293
Ep done
EP : 10
RETURNS : -71.97654893416939
Ep done
EP : 11
RETURNS : -68.03935338051677
Ep done
EP : 12
RETURNS : -70.48327752896024
Ep done
EP : 13
RETURNS : -66.15414226963698
Ep done
EP : 14
RETURNS : -62.60670216483017
Ep done
EP : 15
RETURNS : -71.13771082882575
Ep done
EP : 16
RETURNS : -60.84374520416228
Ep done
EP : 17
RETURNS : -61.565031032573316
Ep done
EP : 18
RETURNS : -64.76381695486268
Ep done
EP : 19
RETURNS : -64.24812487235162
Ep done
EP : 20
RETURNS : -64.14245531604512
Ep done
EP : 21
RETURNS : -72.89172176439018
Ep done
EP : 22
RETURNS : -55.89434810008264
Ep done
EP : 23
RETURNS : -65.43

Ep done
EP : 166
LAST 100 RETURNS : -59.530977459617645
Ep done
EP : 167
LAST 100 RETURNS : -59.77231549746605
Ep done
EP : 168
LAST 100 RETURNS : -59.656715766947414
Ep done
EP : 169
LAST 100 RETURNS : -59.64484988989452
Ep done
EP : 170
LAST 100 RETURNS : -59.767777526827146
Ep done
EP : 171
LAST 100 RETURNS : -59.91332550202707
Ep done
EP : 172
LAST 100 RETURNS : -59.797620678982476
Ep done
EP : 173
LAST 100 RETURNS : -59.741178337026
Ep done
EP : 174
LAST 100 RETURNS : -59.61504400486295
Ep done
EP : 175
LAST 100 RETURNS : -59.669749012844676
Ep done
EP : 176
LAST 100 RETURNS : -59.595128950837875
Ep done
EP : 177
LAST 100 RETURNS : -59.57613673453536
Ep done
EP : 178
LAST 100 RETURNS : -59.51126378915249
Ep done
EP : 179
LAST 100 RETURNS : -59.59598684376885
Ep done
EP : 180
LAST 100 RETURNS : -59.548778041992385
Ep done
EP : 181
LAST 100 RETURNS : -59.59243234149027
Ep done
EP : 182
LAST 100 RETURNS : -59.617965854788885
Ep done
EP : 183
LAST 100 RETURNS : -59.82313472229839
Ep d

Ep done
EP : 312
LAST 100 RETURNS : -61.37048405712367
Ep done
EP : 313
LAST 100 RETURNS : -61.51757872999305
Ep done
EP : 314
LAST 100 RETURNS : -61.56296049630587
Ep done
EP : 315
LAST 100 RETURNS : -61.74333510461918
Ep done
EP : 316
LAST 100 RETURNS : -61.835247706468856
Ep done
EP : 317
LAST 100 RETURNS : -61.97934162858311
Ep done
EP : 318
LAST 100 RETURNS : -61.84956949715615
Ep done
EP : 319
LAST 100 RETURNS : -61.88274733966528
Ep done
EP : 320
LAST 100 RETURNS : -61.8941804173273
Ep done
EP : 321
LAST 100 RETURNS : -61.9581113659169
Ep done
EP : 322
LAST 100 RETURNS : -62.083078133318516
Ep done
EP : 323
LAST 100 RETURNS : -62.19221662584962
Ep done
EP : 324
LAST 100 RETURNS : -62.15917974627676
Ep done
EP : 325
LAST 100 RETURNS : -62.23285360240853
Ep done
EP : 326
LAST 100 RETURNS : -62.30572692545622
Ep done
EP : 327
LAST 100 RETURNS : -62.33115645165028
Ep done
EP : 328
LAST 100 RETURNS : -62.33638549228592
Ep done
EP : 329
LAST 100 RETURNS : -62.33533534502625
Ep done
EP

Ep done
EP : 458
LAST 100 RETURNS : -61.61515672409891
Ep done
EP : 459
LAST 100 RETURNS : -61.580891411015365
Ep done
EP : 460
LAST 100 RETURNS : -61.61973010669915
Ep done
EP : 461
LAST 100 RETURNS : -61.48453017875212
Ep done
EP : 462
LAST 100 RETURNS : -61.34396784689967
Ep done
EP : 463
LAST 100 RETURNS : -61.42322604987527
Ep done
EP : 464
LAST 100 RETURNS : -61.27410813366755
Ep done
EP : 465
LAST 100 RETURNS : -61.25313919988316
Ep done
EP : 466
LAST 100 RETURNS : -61.17552514506918
Ep done
EP : 467
LAST 100 RETURNS : -61.06987231384808
Ep done
EP : 468
LAST 100 RETURNS : -61.06499275295687
Ep done
EP : 469
LAST 100 RETURNS : -61.06836986747331
Ep done
EP : 470
LAST 100 RETURNS : -61.055549728957004
Ep done
EP : 471
LAST 100 RETURNS : -60.9537376590339
Ep done
EP : 472
LAST 100 RETURNS : -60.808462152295824
Ep done
EP : 473
LAST 100 RETURNS : -60.74849770774949
Ep done
EP : 474
LAST 100 RETURNS : -60.609594778262256
Ep done
EP : 475
LAST 100 RETURNS : -60.55383938702073
Ep done

Ep done
EP : 604
LAST 100 RETURNS : -56.882190718739594
Ep done
EP : 605
LAST 100 RETURNS : -56.83804287725083
Ep done
EP : 606
LAST 100 RETURNS : -57.077834765782015
Ep done
EP : 607
LAST 100 RETURNS : -57.061216312216665
Ep done
EP : 608
LAST 100 RETURNS : -57.31299787999038
Ep done
EP : 609
LAST 100 RETURNS : -57.4958099286556
Ep done
EP : 610
LAST 100 RETURNS : -57.40221682331022
Ep done
EP : 611
LAST 100 RETURNS : -57.324968721877674
Ep done
EP : 612
LAST 100 RETURNS : -57.20449075758443
Ep done
EP : 613
LAST 100 RETURNS : -57.21289566397633
Ep done
EP : 614
LAST 100 RETURNS : -57.2815802639924
Ep done
EP : 615
LAST 100 RETURNS : -57.25321068610032
Ep done
EP : 616
LAST 100 RETURNS : -57.19591850696057
Ep done
EP : 617
LAST 100 RETURNS : -56.94449769047363
Ep done
EP : 618
LAST 100 RETURNS : -56.79643625572396
Ep done
EP : 619
LAST 100 RETURNS : -56.78865155914278
Ep done
EP : 620
LAST 100 RETURNS : -56.851437474047316
Ep done
EP : 621
LAST 100 RETURNS : -56.732622223235595
Ep don

Ep done



----MAX REWRD SO FAR : -30.480256129577597---



EP : 751
LAST 100 RETURNS : -56.55737775089401
Ep done
EP : 752
LAST 100 RETURNS : -56.62685314686318
Ep done
EP : 753
LAST 100 RETURNS : -56.54547030214488
Ep done
EP : 754
LAST 100 RETURNS : -56.56924262582453
Ep done
EP : 755
LAST 100 RETURNS : -56.60348064447818
Ep done
EP : 756
LAST 100 RETURNS : -56.49221194342424
Ep done
EP : 757
LAST 100 RETURNS : -56.44467214049979
Ep done
EP : 758
LAST 100 RETURNS : -56.491753287466146
Ep done
EP : 759
LAST 100 RETURNS : -56.50660710530338
Ep done
EP : 760
LAST 100 RETURNS : -56.37586323273913
Ep done
EP : 761
LAST 100 RETURNS : -56.45424075264099
Ep done
EP : 762
LAST 100 RETURNS : -56.399256348483746
Ep done
EP : 763
LAST 100 RETURNS : -56.584462253203654
Ep done
EP : 764
LAST 100 RETURNS : -56.42965943697618
Ep done
EP : 765
LAST 100 RETURNS : -56.35457283220631
Ep done
EP : 766
LAST 100 RETURNS : -56.382183432170436
Ep done
EP : 767
LAST 100 RETURNS : -56.4693794646393
Ep done
EP

Ep done
EP : 897
LAST 100 RETURNS : -58.1634351120712
Ep done
EP : 898
LAST 100 RETURNS : -58.249188551100794
Ep done
EP : 899
LAST 100 RETURNS : -58.12509842008714
Ep done
EP : 900
LAST 100 RETURNS : -58.08442090685707
Ep done



----MAX REWRD SO FAR : -29.02747243644125---



EP : 901
LAST 100 RETURNS : -58.06173345800494
Ep done
EP : 902
LAST 100 RETURNS : -58.00961500369156
Ep done
EP : 903
LAST 100 RETURNS : -57.958331180522656
Ep done
EP : 904
LAST 100 RETURNS : -58.122124073889495
Ep done
EP : 905
LAST 100 RETURNS : -58.0048031578213
Ep done
EP : 906
LAST 100 RETURNS : -58.13813463545854
Ep done
EP : 907
LAST 100 RETURNS : -58.37648773807521
Ep done
EP : 908
LAST 100 RETURNS : -58.409043993297445
Ep done
EP : 909
LAST 100 RETURNS : -58.329770993514735
Ep done
EP : 910
LAST 100 RETURNS : -58.336508395130465
Ep done
EP : 911
LAST 100 RETURNS : -58.30793682970338
Ep done
EP : 912
LAST 100 RETURNS : -58.27488041062632
Ep done
EP : 913
LAST 100 RETURNS : -58.170580631265146
Ep done
E

Ep done
EP : 1042
LAST 100 RETURNS : -56.76249726174659
Ep done
EP : 1043
LAST 100 RETURNS : -56.66786134329499
Ep done
EP : 1044
LAST 100 RETURNS : -56.95541636127733
Ep done
EP : 1045
LAST 100 RETURNS : -56.958271962406776
Ep done
EP : 1046
LAST 100 RETURNS : -56.96991809789827
Ep done
EP : 1047
LAST 100 RETURNS : -56.97888734957773
Ep done
EP : 1048
LAST 100 RETURNS : -56.921432034522034
Ep done
EP : 1049
LAST 100 RETURNS : -56.95109382079234
Ep done
EP : 1050
LAST 100 RETURNS : -56.80072769303314
Ep done



----MAX REWRD SO FAR : -29.02747243644125---



EP : 1051
LAST 100 RETURNS : -56.35209425715856
Ep done
EP : 1052
LAST 100 RETURNS : -56.25344985191351
Ep done
EP : 1053
LAST 100 RETURNS : -56.28783233554689
Ep done
EP : 1054
LAST 100 RETURNS : -56.32599696874746
Ep done
EP : 1055
LAST 100 RETURNS : -56.342912640137435
Ep done
EP : 1056
LAST 100 RETURNS : -56.386541933952756
Ep done
EP : 1057
LAST 100 RETURNS : -56.44388259770586
Ep done
EP : 1058
LAST 100 RETURNS : -56.56986212

Ep done
EP : 1185
LAST 100 RETURNS : -55.87756255529062
Ep done
EP : 1186
LAST 100 RETURNS : -55.70335696434533
Ep done
EP : 1187
LAST 100 RETURNS : -55.72540123169472
Ep done
EP : 1188
LAST 100 RETURNS : -55.67921214690146
Ep done
EP : 1189
LAST 100 RETURNS : -55.680515026904175
Ep done
EP : 1190
LAST 100 RETURNS : -55.62203349945998
Ep done
EP : 1191
LAST 100 RETURNS : -55.49205791193152
Ep done
EP : 1192
LAST 100 RETURNS : -55.48474468363326
Ep done
EP : 1193
LAST 100 RETURNS : -55.61899823216661
Ep done
EP : 1194
LAST 100 RETURNS : -55.754038216329505
Ep done
EP : 1195
LAST 100 RETURNS : -55.615354644060375
Ep done
EP : 1196
LAST 100 RETURNS : -55.510822939788454
Ep done
EP : 1197
LAST 100 RETURNS : -55.64723965459773
Ep done
EP : 1198
LAST 100 RETURNS : -55.61401399747686
Ep done
EP : 1199
LAST 100 RETURNS : -55.837989935583344
Ep done
EP : 1200
LAST 100 RETURNS : -55.70162543418272
Ep done



----MAX REWRD SO FAR : -28.23331241495526---



EP : 1201
LAST 100 RETURNS : -55.5762148

Ep done
EP : 1329
LAST 100 RETURNS : -54.64863802621157
Ep done
EP : 1330
LAST 100 RETURNS : -54.33234096822663
Ep done
EP : 1331
LAST 100 RETURNS : -54.34814174486406
Ep done
EP : 1332
LAST 100 RETURNS : -54.15754911896204
Ep done
EP : 1333
LAST 100 RETURNS : -54.27607604523148
Ep done
EP : 1334
LAST 100 RETURNS : -54.269780081938265
Ep done
EP : 1335
LAST 100 RETURNS : -54.01381244130253
Ep done
EP : 1336
LAST 100 RETURNS : -53.9418330580874
Ep done
EP : 1337
LAST 100 RETURNS : -53.831853830480135
Ep done
EP : 1338
LAST 100 RETURNS : -53.91029382504604
Ep done
EP : 1339
LAST 100 RETURNS : -54.075379466857136
Ep done
EP : 1340
LAST 100 RETURNS : -54.011669482597725
Ep done
EP : 1341
LAST 100 RETURNS : -54.01933261303194
Ep done
EP : 1342
LAST 100 RETURNS : -54.15750760427548
Ep done
EP : 1343
LAST 100 RETURNS : -54.081275895014855
Ep done
EP : 1344
LAST 100 RETURNS : -54.055358944067855
Ep done
EP : 1345
LAST 100 RETURNS : -54.04176186114419
Ep done
EP : 1346
LAST 100 RETURNS : -54.12

Ep done
EP : 1473
LAST 100 RETURNS : -54.42490267168713
Ep done
EP : 1474
LAST 100 RETURNS : -54.562854691859705
Ep done
EP : 1475
LAST 100 RETURNS : -54.55849120008899
Ep done
EP : 1476
LAST 100 RETURNS : -54.5699454947591
Ep done
EP : 1477
LAST 100 RETURNS : -54.49522519650563
Ep done
EP : 1478
LAST 100 RETURNS : -54.77324591818042
Ep done
EP : 1479
LAST 100 RETURNS : -54.911685781011755
Ep done
EP : 1480
LAST 100 RETURNS : -54.87873237493131
Ep done
EP : 1481
LAST 100 RETURNS : -54.83805401758855
Ep done
EP : 1482
LAST 100 RETURNS : -54.790118443066696
Ep done
EP : 1483
LAST 100 RETURNS : -54.819744536940796
Ep done
EP : 1484
LAST 100 RETURNS : -54.75147564166127
Ep done
EP : 1485
LAST 100 RETURNS : -54.79109918774068
Ep done
EP : 1486
LAST 100 RETURNS : -54.724245421306804
Ep done
EP : 1487
LAST 100 RETURNS : -54.75357368482329
Ep done
EP : 1488
LAST 100 RETURNS : -54.80788580793162
Ep done
EP : 1489
LAST 100 RETURNS : -54.798686936287346
Ep done
EP : 1490
LAST 100 RETURNS : -54.88

Ep done
EP : 1617
LAST 100 RETURNS : -54.66297595201352
Ep done
EP : 1618
LAST 100 RETURNS : -54.76840052340524
Ep done
EP : 1619
LAST 100 RETURNS : -54.8155334812908
Ep done
EP : 1620
LAST 100 RETURNS : -54.96266532168291
Ep done
EP : 1621
LAST 100 RETURNS : -55.02676709537943
Ep done
EP : 1622
LAST 100 RETURNS : -55.011742268067636
Ep done
EP : 1623
LAST 100 RETURNS : -54.97147538333194
Ep done
EP : 1624
LAST 100 RETURNS : -54.94542169818551
Ep done
EP : 1625
LAST 100 RETURNS : -54.70587305164047
Ep done
EP : 1626
LAST 100 RETURNS : -54.91712039204153
Ep done
EP : 1627
LAST 100 RETURNS : -55.21854169967721
Ep done
EP : 1628
LAST 100 RETURNS : -55.19915062873086
Ep done
EP : 1629
LAST 100 RETURNS : -55.325721782286635
Ep done
EP : 1630
LAST 100 RETURNS : -55.216657065640334
Ep done
EP : 1631
LAST 100 RETURNS : -55.25043933486639
Ep done
EP : 1632
LAST 100 RETURNS : -55.220623045564686
Ep done
EP : 1633
LAST 100 RETURNS : -55.24776600573672
Ep done
EP : 1634
LAST 100 RETURNS : -55.0166

Ep done
EP : 1761
LAST 100 RETURNS : -51.636191731840945
Ep done
EP : 1762
LAST 100 RETURNS : -51.85866367021753
Ep done
EP : 1763
LAST 100 RETURNS : -51.75550554544604
Ep done
EP : 1764
LAST 100 RETURNS : -51.62018425924078
Ep done
EP : 1765
LAST 100 RETURNS : -51.60195941716847
Ep done
EP : 1766
LAST 100 RETURNS : -51.59532843662116
Ep done
EP : 1767
LAST 100 RETURNS : -51.36107785711511
Ep done
EP : 1768
LAST 100 RETURNS : -51.46168158461151
Ep done
EP : 1769
LAST 100 RETURNS : -51.31250812545547
Ep done
EP : 1770
LAST 100 RETURNS : -51.228962262773294
Ep done
EP : 1771
LAST 100 RETURNS : -51.20613993349179
Ep done
EP : 1772
LAST 100 RETURNS : -51.25086001739423
Ep done
EP : 1773
LAST 100 RETURNS : -51.10423665796817
Ep done
EP : 1774
LAST 100 RETURNS : -51.075198636972885
Ep done
EP : 1775
LAST 100 RETURNS : -51.29283721995675
Ep done
EP : 1776
LAST 100 RETURNS : -51.28752122874235
Ep done
EP : 1777
LAST 100 RETURNS : -51.66938029708504
Ep done
EP : 1778
LAST 100 RETURNS : -51.7451

Ep done
EP : 1904
LAST 100 RETURNS : -55.633971241038225
Ep done
EP : 1905
LAST 100 RETURNS : -55.7349668475996
Ep done
EP : 1906
LAST 100 RETURNS : -55.9311748281624
Ep done
EP : 1907
LAST 100 RETURNS : -55.87617337386036
Ep done
EP : 1908
LAST 100 RETURNS : -55.85104111765458
Ep done
EP : 1909
LAST 100 RETURNS : -55.784550230420564
Ep done
EP : 1910
LAST 100 RETURNS : -55.864038600731
Ep done
EP : 1911
LAST 100 RETURNS : -55.854853695829526
Ep done
EP : 1912
LAST 100 RETURNS : -55.94747986384444
Ep done
EP : 1913
LAST 100 RETURNS : -55.96253638729337
Ep done
EP : 1914
LAST 100 RETURNS : -56.012407713459886
Ep done
EP : 1915
LAST 100 RETURNS : -55.97559449458571
Ep done
EP : 1916
LAST 100 RETURNS : -55.99839786802544
Ep done
EP : 1917
LAST 100 RETURNS : -55.99683793806681
Ep done
EP : 1918
LAST 100 RETURNS : -55.85662960484118
Ep done
EP : 1919
LAST 100 RETURNS : -55.82623638121209
Ep done
EP : 1920
LAST 100 RETURNS : -55.91810147609837
Ep done
EP : 1921
LAST 100 RETURNS : -55.8601670

In [8]:
# Test the policy #
env = GymEnv("Pendulum-v0")
env.pyenv._max_episode_steps = 50000
TEST_STEPS = 50000

r = test_run(env)

Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-1.99986]
Action : [-0.467727]
Action : [1.9996]
Action : [2.0]
Action : [2.0]
Action : [2.0]
Action : [2.0]
Action : [2.0]
Action : [2.0]
Action : [2.0]
Action : [2.0]
Action : [2.0]
Action : [1.99999]
Action : [1.99969]
Action : [1.99078]
Action : [1.72303]
Action : [-1.22844]
Action : [-1.99976]
Action : [-1.99995]
Action : [-1.99999]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-2.0]
Action : [-1.99999]
Action : [-1.99728]
Action : [-1.65396]
Action : [1.15847]
Action : [1.29891]
Action : [1.06539]
Action : [0.400123]
Action : [1.15889]
Action : [1.48

Action : [0.706098]
Action : [0.955142]
Action : [1.23482]
Action : [1.52781]
Action : [1.45999]
Action : [1.03043]
Action : [-0.0638304]
Action : [-1.28729]
Action : [-1.78557]
Action : [-1.91106]
Action : [-1.93717]
Action : [-1.92416]
Action : [-1.76165]
Action : [-0.744402]
Action : [0.671355]
Action : [0.89431]
Action : [1.14269]
Action : [1.49691]
Action : [1.50198]
Action : [1.18633]
Action : [0.259959]
Action : [-1.05637]
Action : [-1.71982]
Action : [-1.89559]
Action : [-1.93568]
Action : [-1.93195]
Action : [-1.8428]
Action : [-1.16789]
Action : [0.546369]
Action : [0.813648]
Action : [1.05781]
Action : [1.42958]
Action : [1.52489]
Action : [1.3022]
Action : [0.554437]
Action : [-0.766124]
Action : [-1.62078]
Action : [-1.8705]
Action : [-1.92999]
Action : [-1.93474]
Action : [-1.88605]
Action : [-1.43589]
Action : [0.276637]
Action : [0.735653]
Action : [1.00365]
Action : [1.34705]
Action : [1.53293]
Action : [1.38081]
Action : [0.783224]
Action : [-0.468997]
Action : [-1.49

Action : [-1.93263]
Action : [-1.8525]
Action : [-1.22375]
Action : [0.508275]
Action : [0.797937]
Action : [1.04789]
Action : [1.4159]
Action : [1.52686]
Action : [1.31767]
Action : [0.59769]
Action : [-0.715118]
Action : [-1.60131]
Action : [-1.8655]
Action : [-1.92877]
Action : [-1.93489]
Action : [-1.89057]
Action : [-1.46876]
Action : [0.217053]
Action : [0.726826]
Action : [0.997728]
Action : [1.33365]
Action : [1.53426]
Action : [1.3928]
Action : [0.818055]
Action : [-0.418772]
Action : [-1.47552]
Action : [-1.83371]
Action : [-1.92162]
Action : [-1.9359]
Action : [-1.90858]
Action : [-1.62969]
Action : [-0.193038]
Action : [0.70676]
Action : [0.963402]
Action : [1.25123]
Action : [1.53038]
Action : [1.451]
Action : [0.999711]
Action : [-0.120522]
Action : [-1.32113]
Action : [-1.79453]
Action : [-1.91307]
Action : [-1.93713]
Action : [-1.92229]
Action : [-1.74448]
Action : [-0.659586]
Action : [0.680103]
Action : [0.90652]
Action : [1.15897]
Action : [1.50524]
Action : [1.496]


Action : [-1.49953]
Action : [0.154428]
Action : [0.718899]
Action : [0.99148]
Action : [1.32005]
Action : [1.53517]
Action : [1.4045]
Action : [0.852228]
Action : [-0.367796]
Action : [-1.45183]
Action : [-1.82797]
Action : [-1.92053]
Action : [-1.93634]
Action : [-1.91156]
Action : [-1.65392]
Action : [-0.277811]
Action : [0.70602]
Action : [0.954778]
Action : [1.23411]
Action : [1.52768]
Action : [1.46037]
Action : [1.03173]
Action : [-0.0614005]
Action : [-1.2858]
Action : [-1.78517]
Action : [-1.91097]
Action : [-1.93717]
Action : [-1.92423]
Action : [-1.76237]
Action : [-0.748004]
Action : [0.670908]
Action : [0.893802]
Action : [1.14199]
Action : [1.49654]
Action : [1.50221]
Action : [1.1873]
Action : [0.262263]
Action : [-1.05442]
Action : [-1.7192]
Action : [-1.89543]
Action : [-1.93565]
Action : [-1.93197]
Action : [-1.8432]
Action : [-1.17025]
Action : [0.544922]
Action : [0.813022]
Action : [1.05738]
Action : [1.42904]
Action : [1.52498]
Action : [1.30285]
Action : [0.55621

Action : [1.0623]
Action : [-0.00292651]
Action : [-1.24909]
Action : [-1.77532]
Action : [-1.90877]
Action : [-1.93716]
Action : [-1.92595]
Action : [-1.77952]
Action : [-0.833096]
Action : [0.65843]
Action : [0.881132]
Action : [1.12493]
Action : [1.48692]
Action : [1.50767]
Action : [1.21051]
Action : [0.317871]
Action : [-1.00591]
Action : [-1.70383]
Action : [-1.89155]
Action : [-1.93482]
Action : [-1.93265]
Action : [-1.85286]
Action : [-1.22588]
Action : [0.506658]
Action : [0.797347]
Action : [1.04748]
Action : [1.41534]
Action : [1.52692]
Action : [1.31825]
Action : [0.599351]
Action : [-0.713099]
Action : [-1.60053]
Action : [-1.8653]
Action : [-1.92872]
Action : [-1.93489]
Action : [-1.89072]
Action : [-1.46997]
Action : [0.214687]
Action : [0.726491]
Action : [0.997497]
Action : [1.33313]
Action : [1.53431]
Action : [1.39326]
Action : [0.819394]
Action : [-0.416815]
Action : [-1.47462]
Action : [-1.83349]
Action : [-1.92159]
Action : [-1.93592]
Action : [-1.9087]
Action : [

Action : [-1.90625]
Action : [-1.93705]
Action : [-1.92765]
Action : [-1.79681]
Action : [-0.9193]
Action : [0.642027]
Action : [0.867032]
Action : [1.10754]
Action : [1.47545]
Action : [1.51264]
Action : [1.23351]
Action : [0.375004]
Action : [-0.952991]
Action : [-1.6865]
Action : [-1.88714]
Action : [-1.93382]
Action : [-1.93321]
Action : [-1.86182]
Action : [-1.27952]
Action : [0.461854]
Action : [0.781674]
Action : [1.03768]
Action : [1.40051]
Action : [1.52829]
Action : [1.333]
Action : [0.64204]
Action : [-0.659885]
Action : [-1.57935]
Action : [-1.8598]
Action : [-1.92732]
Action : [-1.9349]
Action : [-1.89425]
Action : [-1.50085]
Action : [0.151599]
Action : [0.718559]
Action : [0.991255]
Action : [1.31944]
Action : [1.53519]
Action : [1.40498]
Action : [0.853669]
Action : [-0.365594]
Action : [-1.45078]
Action : [-1.82771]
Action : [-1.92048]
Action : [-1.93636]
Action : [-1.91168]
Action : [-1.6549]
Action : [-0.281421]
Action : [0.705935]
Action : [0.954395]
Action : [1.233

Action : [0.766589]
Action : [1.02704]
Action : [1.3846]
Action : [1.52952]
Action : [1.34762]
Action : [0.685033]
Action : [-0.603729]
Action : [-1.55621]
Action : [-1.85379]
Action : [-1.92582]
Action : [-1.9349]
Action : [-1.89741]
Action : [-1.53146]
Action : [0.0817571]
Action : [0.711751]
Action : [0.986504]
Action : [1.30464]
Action : [1.53537]
Action : [1.41603]
Action : [0.887131]
Action : [-0.313193]
Action : [-1.42522]
Action : [-1.82138]
Action : [-1.91909]
Action : [-1.93666]
Action : [-1.9143]
Action : [-1.67688]
Action : [-0.365582]
Action : [0.703422]
Action : [0.945283]
Action : [1.2167]
Action : [1.52414]
Action : [1.46952]
Action : [1.06356]
Action : [-0.000453573]
Action : [-1.2475]
Action : [-1.77489]
Action : [-1.90867]
Action : [-1.93715]
Action : [-1.92602]
Action : [-1.78024]
Action : [-0.836624]
Action : [0.657844]
Action : [0.880581]
Action : [1.12423]
Action : [1.48647]
Action : [1.50788]
Action : [1.21144]
Action : [0.320164]
Action : [-1.00383]
Action : [-

Action : [1.42685]
Action : [0.919943]
Action : [-0.260171]
Action : [-1.39844]
Action : [-1.81471]
Action : [-1.91769]
Action : [-1.93698]
Action : [-1.91693]
Action : [-1.69814]
Action : [-0.451396]
Action : [0.698981]
Action : [0.935059]
Action : [1.19925]
Action : [1.51948]
Action : [1.47807]
Action : [1.09444]
Action : [0.0608618]
Action : [-1.20686]
Action : [-1.76377]
Action : [-1.90613]
Action : [-1.93705]
Action : [-1.92772]
Action : [-1.79755]
Action : [-0.922945]
Action : [0.641207]
Action : [0.866397]
Action : [1.10681]
Action : [1.47494]
Action : [1.51284]
Action : [1.2345]
Action : [0.377457]
Action : [-0.950665]
Action : [-1.68573]
Action : [-1.88694]
Action : [-1.93377]
Action : [-1.93324]
Action : [-1.8622]
Action : [-1.28179]
Action : [0.459793]
Action : [0.781031]
Action : [1.03723]
Action : [1.39983]
Action : [1.52834]
Action : [1.33363]
Action : [0.643878]
Action : [-0.657525]
Action : [-1.57839]
Action : [-1.85955]
Action : [-1.92726]
Action : [-1.9349]
Action : [

Action : [-0.53546]
Action : [0.692201]
Action : [0.924252]
Action : [1.18333]
Action : [1.51439]
Action : [1.48565]
Action : [1.12291]
Action : [0.119576]
Action : [-1.16569]
Action : [-1.75226]
Action : [-1.90345]
Action : [-1.93684]
Action : [-1.92921]
Action : [-1.81296]
Action : [-1.00188]
Action : [0.620635]
Action : [0.851884]
Action : [1.09045]
Action : [1.46246]
Action : [1.51726]
Action : [1.25635]
Action : [0.432478]
Action : [-0.897148]
Action : [-1.66774]
Action : [-1.88243]
Action : [-1.93279]
Action : [-1.93384]
Action : [-1.87053]
Action : [-1.33271]
Action : [0.410285]
Action : [0.76604]
Action : [1.02666]
Action : [1.38401]
Action : [1.52957]
Action : [1.34815]
Action : [0.686586]
Action : [-0.601661]
Action : [-1.55535]
Action : [-1.85357]
Action : [-1.92577]
Action : [-1.9349]
Action : [-1.89752]
Action : [-1.53258]
Action : [0.0790722]
Action : [0.711526]
Action : [0.986322]
Action : [1.30406]
Action : [1.53538]
Action : [1.41645]
Action : [0.888398]
Action : [-0.3

Action : [-1.64964]
Action : [-1.87785]
Action : [-1.93174]
Action : [-1.93427]
Action : [-1.87732]
Action : [-1.37706]
Action : [0.360396]
Action : [0.752658]
Action : [1.01672]
Action : [1.36903]
Action : [1.53079]
Action : [1.3614]
Action : [0.726043]
Action : [-0.54866]
Action : [-1.5329]
Action : [-1.84785]
Action : [-1.92444]
Action : [-1.93503]
Action : [-1.90052]
Action : [-1.5611]
Action : [0.00761933]
Action : [0.706023]
Action : [0.981542]
Action : [1.28973]
Action : [1.53509]
Action : [1.42723]
Action : [0.921094]
Action : [-0.258287]
Action : [-1.39748]
Action : [-1.81447]
Action : [-1.91764]
Action : [-1.937]
Action : [-1.91702]
Action : [-1.69888]
Action : [-0.454475]
Action : [0.698773]
Action : [0.934672]
Action : [1.19861]
Action : [1.5193]
Action : [1.47837]
Action : [1.09555]
Action : [0.063093]
Action : [-1.20534]
Action : [-1.76335]
Action : [-1.90603]
Action : [-1.93704]
Action : [-1.92778]
Action : [-1.79817]
Action : [-0.926016]
Action : [0.640508]
Action : [0.

Action : [-1.84194]
Action : [-1.92317]
Action : [-1.93527]
Action : [-1.90371]
Action : [-1.58979]
Action : [-0.0718495]
Action : [0.705234]
Action : [0.975158]
Action : [1.27488]
Action : [1.53381]
Action : [1.43731]
Action : [0.953278]
Action : [-0.203595]
Action : [-1.36832]
Action : [-1.80698]
Action : [-1.91597]
Action : [-1.93715]
Action : [-1.91936]
Action : [-1.71831]
Action : [-0.537995]
Action : [0.69196]
Action : [0.923918]
Action : [1.18285]
Action : [1.51423]
Action : [1.48587]
Action : [1.12374]
Action : [0.121316]
Action : [-1.16443]
Action : [-1.7519]
Action : [-1.90336]
Action : [-1.93684]
Action : [-1.92925]
Action : [-1.81339]
Action : [-1.00419]
Action : [0.619948]
Action : [0.851435]
Action : [1.08998]
Action : [1.46207]
Action : [1.51739]
Action : [1.25699]
Action : [0.434114]
Action : [-0.895509]
Action : [-1.66718]
Action : [-1.88229]
Action : [-1.93276]
Action : [-1.93386]
Action : [-1.87077]
Action : [-1.3342]
Action : [0.408726]
Action : [0.765584]
Action : 

Action : [1.16719]
Action : [1.50867]
Action : [1.49251]
Action : [1.14969]
Action : [0.176842]
Action : [-1.12324]
Action : [-1.74006]
Action : [-1.90057]
Action : [-1.93655]
Action : [-1.93054]
Action : [-1.82631]
Action : [-1.07563]
Action : [0.595227]
Action : [0.836628]
Action : [1.07599]
Action : [1.44952]
Action : [1.52086]
Action : [1.27627]
Action : [0.484402]
Action : [-0.843525]
Action : [-1.64902]
Action : [-1.8777]
Action : [-1.9317]
Action : [-1.93428]
Action : [-1.87752]
Action : [-1.37846]
Action : [0.358711]
Action : [0.752239]
Action : [1.01639]
Action : [1.36854]
Action : [1.53083]
Action : [1.36182]
Action : [0.72731]
Action : [-0.546927]
Action : [-1.53215]
Action : [-1.84766]
Action : [-1.92439]
Action : [-1.93503]
Action : [-1.90062]
Action : [-1.56201]
Action : [0.00517076]
Action : [0.705929]
Action : [0.981388]
Action : [1.28929]
Action : [1.53508]
Action : [1.42758]
Action : [0.922143]
Action : [-0.256565]
Action : [-1.39659]
Action : [-1.81425]
Action : [-1.

Action : [1.53218]
Action : [1.37497]
Action : [0.766261]
Action : [-0.492897]
Action : [-1.50864]
Action : [-1.84176]
Action : [-1.92313]
Action : [-1.93528]
Action : [-1.90382]
Action : [-1.59066]
Action : [-0.0743466]
Action : [0.705276]
Action : [0.974918]
Action : [1.2744]
Action : [1.53374]
Action : [1.43759]
Action : [0.954242]
Action : [-0.201897]
Action : [-1.36738]
Action : [-1.80673]
Action : [-1.91591]
Action : [-1.93715]
Action : [-1.91942]
Action : [-1.71886]
Action : [-0.540424]
Action : [0.691726]
Action : [0.923598]
Action : [1.1824]
Action : [1.51408]
Action : [1.48608]
Action : [1.12453]
Action : [0.122987]
Action : [-1.16323]
Action : [-1.75156]
Action : [-1.90328]
Action : [-1.93683]
Action : [-1.92929]
Action : [-1.81381]
Action : [-1.00641]
Action : [0.619284]
Action : [0.851003]
Action : [1.08954]
Action : [1.46169]
Action : [1.5175]
Action : [1.25759]
Action : [0.43566]
Action : [-0.893953]
Action : [-1.66664]
Action : [-1.88216]
Action : [-1.93273]
Action : [-

Action : [1.53146]
Action : [1.44676]
Action : [0.985276]
Action : [-0.146576]
Action : [-1.33621]
Action : [-1.7985]
Action : [-1.91398]
Action : [-1.93712]
Action : [-1.9214]
Action : [-1.73637]
Action : [-0.620619]
Action : [0.68368]
Action : [0.912312]
Action : [1.16666]
Action : [1.50846]
Action : [1.49271]
Action : [1.15052]
Action : [0.178657]
Action : [-1.12185]
Action : [-1.73965]
Action : [-1.90047]
Action : [-1.93654]
Action : [-1.93058]
Action : [-1.82671]
Action : [-1.07782]
Action : [0.594281]
Action : [0.836121]
Action : [1.07554]
Action : [1.4491]
Action : [1.52096]
Action : [1.27689]
Action : [0.486023]
Action : [-0.8418]
Action : [-1.64841]
Action : [-1.87754]
Action : [-1.93167]
Action : [-1.93429]
Action : [-1.87773]
Action : [-1.37985]
Action : [0.357023]
Action : [0.751821]
Action : [1.01607]
Action : [1.36804]
Action : [1.53086]
Action : [1.36225]
Action : [0.728576]
Action : [-0.545189]
Action : [-1.5314]
Action : [-1.84746]
Action : [-1.92435]
Action : [-1.9350

Action : [1.43541]
Action : [1.52386]
Action : [1.29508]
Action : [0.534906]
Action : [-0.78832]
Action : [-1.62903]
Action : [-1.87261]
Action : [-1.9305]
Action : [-1.93462]
Action : [-1.88372]
Action : [-1.42048]
Action : [0.301561]
Action : [0.739836]
Action : [1.00676]
Action : [1.35302]
Action : [1.53223]
Action : [1.37539]
Action : [0.767487]
Action : [-0.49118]
Action : [-1.50789]
Action : [-1.84158]
Action : [-1.92309]
Action : [-1.93529]
Action : [-1.90392]
Action : [-1.59159]
Action : [-0.0770082]
Action : [0.705318]
Action : [0.974663]
Action : [1.27389]
Action : [1.53367]
Action : [1.4379]
Action : [0.955271]
Action : [-0.200086]
Action : [-1.36638]
Action : [-1.80647]
Action : [-1.91584]
Action : [-1.93714]
Action : [-1.91948]
Action : [-1.71945]
Action : [-0.543016]
Action : [0.691475]
Action : [0.923255]
Action : [1.18191]
Action : [1.51392]
Action : [1.4863]
Action : [1.12538]
Action : [0.124773]
Action : [-1.16194]
Action : [-1.7512]
Action : [-1.9032]
Action : [-1.93

Action : [1.38768]
Action : [0.803243]
Action : [-0.440287]
Action : [-1.48526]
Action : [-1.83606]
Action : [-1.92205]
Action : [-1.9357]
Action : [-1.90718]
Action : [-1.61856]
Action : [-0.15774]
Action : [0.706449]
Action : [0.966873]
Action : [1.25821]
Action : [1.53139]
Action : [1.44703]
Action : [0.986214]
Action : [-0.144894]
Action : [-1.33525]
Action : [-1.79825]
Action : [-1.91392]
Action : [-1.93712]
Action : [-1.92146]
Action : [-1.7369]
Action : [-0.623097]
Action : [0.68342]
Action : [0.911944]
Action : [1.16615]
Action : [1.50826]
Action : [1.49291]
Action : [1.15132]
Action : [0.180403]
Action : [-1.12051]
Action : [-1.73926]
Action : [-1.90038]
Action : [-1.93652]
Action : [-1.93062]
Action : [-1.82709]
Action : [-1.07992]
Action : [0.593343]
Action : [0.835633]
Action : [1.07511]
Action : [1.44869]
Action : [1.52106]
Action : [1.27748]
Action : [0.487588]
Action : [-0.840131]
Action : [-1.64781]
Action : [-1.87739]
Action : [-1.93163]
Action : [-1.93431]
Action : [-

Action : [1.17649]
Action : [0.236884]
Action : [-1.07569]
Action : [-1.72582]
Action : [-1.89711]
Action : [-1.93601]
Action : [-1.93165]
Action : [-1.83864]
Action : [-1.14399]
Action : [0.560469]
Action : [0.819854]
Action : [1.06231]
Action : [1.43499]
Action : [1.52394]
Action : [1.29562]
Action : [0.536368]
Action : [-0.78668]
Action : [-1.62843]
Action : [-1.87246]
Action : [-1.93046]
Action : [-1.93464]
Action : [-1.8839]
Action : [-1.42166]
Action : [0.299735]
Action : [0.739497]
Action : [1.00649]
Action : [1.35256]
Action : [1.53228]
Action : [1.3758]
Action : [0.768694]
Action : [-0.489487]
Action : [-1.50714]
Action : [-1.8414]
Action : [-1.92306]
Action : [-1.93531]
Action : [-1.90403]
Action : [-1.5925]
Action : [-0.0796345]
Action : [0.705359]
Action : [0.974411]
Action : [1.27338]
Action : [1.5336]
Action : [1.4382]
Action : [0.956284]
Action : [-0.198298]
Action : [-1.36539]
Action : [-1.8062]
Action : [-1.91578]
Action : [-1.93714]
Action : [-1.91955]
Action : [-1.72

Action : [0.730268]
Action : [1.00011]
Action : [1.33893]
Action : [1.53373]
Action : [1.38805]
Action : [0.804314]
Action : [-0.438741]
Action : [-1.48456]
Action : [-1.83589]
Action : [-1.92202]
Action : [-1.93571]
Action : [-1.90728]
Action : [-1.61937]
Action : [-0.160256]
Action : [0.706477]
Action : [0.966628]
Action : [1.25772]
Action : [1.53132]
Action : [1.44732]
Action : [0.987177]
Action : [-0.143165]
Action : [-1.33426]
Action : [-1.79799]
Action : [-1.91386]
Action : [-1.93712]
Action : [-1.92152]
Action : [-1.73744]
Action : [-0.625647]
Action : [0.683151]
Action : [0.911563]
Action : [1.16562]
Action : [1.50805]
Action : [1.49311]
Action : [1.15214]
Action : [0.182199]
Action : [-1.11913]
Action : [-1.73885]
Action : [-1.90028]
Action : [-1.93651]
Action : [-1.93065]
Action : [-1.82749]
Action : [-1.08206]
Action : [0.592347]
Action : [0.835127]
Action : [1.07466]
Action : [1.44827]
Action : [1.52116]
Action : [1.27809]
Action : [0.48921]
Action : [-0.8384]
Action : [-1.

Action : [1.2413]
Action : [1.52892]
Action : [1.45653]
Action : [1.01853]
Action : [-0.0860297]
Action : [-1.30073]
Action : [-1.78914]
Action : [-1.91186]
Action : [-1.93716]
Action : [-1.92347]
Action : [-1.75505]
Action : [-0.711358]
Action : [0.675166]
Action : [0.898864]
Action : [1.14912]
Action : [1.5003]
Action : [1.49981]
Action : [1.17735]
Action : [0.238884]
Action : [-1.07404]
Action : [-1.72531]
Action : [-1.89698]
Action : [-1.93598]
Action : [-1.93168]
Action : [-1.83901]
Action : [-1.14608]
Action : [0.559273]
Action : [0.819319]
Action : [1.06189]
Action : [1.43452]
Action : [1.52403]
Action : [1.29621]
Action : [0.53797]
Action : [-0.78488]
Action : [-1.62777]
Action : [-1.87229]
Action : [-1.93042]
Action : [-1.93465]
Action : [-1.8841]
Action : [-1.42295]
Action : [0.297727]
Action : [0.739127]
Action : [1.0062]
Action : [1.35206]
Action : [1.53234]
Action : [1.37626]
Action : [0.77002]
Action : [-0.487626]
Action : [-1.50633]
Action : [-1.8412]
Action : [-1.92302]

Action : [0.522208]
Action : [0.803505]
Action : [1.05139]
Action : [1.42076]
Action : [1.52617]
Action : [1.31226]
Action : [0.582511]
Action : [-0.73326]
Action : [-1.6083]
Action : [-1.86729]
Action : [-1.9292]
Action : [-1.93484]
Action : [-1.88903]
Action : [-1.45725]
Action : [0.238768]
Action : [0.729982]
Action : [0.999912]
Action : [1.3385]
Action : [1.53378]
Action : [1.38844]
Action : [0.805453]
Action : [-0.437094]
Action : [-1.48382]
Action : [-1.83571]
Action : [-1.92198]
Action : [-1.93573]
Action : [-1.90739]
Action : [-1.62022]
Action : [-0.162942]
Action : [0.706507]
Action : [0.966366]
Action : [1.25719]
Action : [1.53124]
Action : [1.44762]
Action : [0.988205]
Action : [-0.141318]
Action : [-1.33319]
Action : [-1.79771]
Action : [-1.9138]
Action : [-1.93712]
Action : [-1.92158]
Action : [-1.73802]
Action : [-0.628405]
Action : [0.682891]
Action : [0.911164]
Action : [1.16506]
Action : [1.50783]
Action : [1.49333]
Action : [1.15302]
Action : [0.184116]
Action : [-1.1

Action : [-1.58806]
Action : [-1.86205]
Action : [-1.92789]
Action : [-1.93489]
Action : [-1.89284]
Action : [-1.48839]
Action : [0.177705]
Action : [0.721764]
Action : [0.993778]
Action : [1.3251]
Action : [1.53489]
Action : [1.4002]
Action : [0.839654]
Action : [-0.386748]
Action : [-1.46072]
Action : [-1.83012]
Action : [-1.92097]
Action : [-1.93617]
Action : [-1.91046]
Action : [-1.64514]
Action : [-0.246193]
Action : [0.706667]
Action : [0.958122]
Action : [1.24065]
Action : [1.52882]
Action : [1.45688]
Action : [1.01973]
Action : [-0.0838036]
Action : [-1.2994]
Action : [-1.78879]
Action : [-1.91179]
Action : [-1.93716]
Action : [-1.92355]
Action : [-1.75573]
Action : [-0.714707]
Action : [0.674807]
Action : [0.89841]
Action : [1.14846]
Action : [1.49996]
Action : [1.50003]
Action : [1.17827]
Action : [0.241031]
Action : [-1.07225]
Action : [-1.72476]
Action : [-1.89684]
Action : [-1.93595]
Action : [-1.93171]
Action : [-1.8394]
Action : [-1.14832]
Action : [0.557982]
Action : [0

Action : [-1.7789]
Action : [-1.90957]
Action : [-1.93717]
Action : [-1.92535]
Action : [-1.77344]
Action : [-0.803321]
Action : [0.663176]
Action : [0.885725]
Action : [1.13098]
Action : [1.49056]
Action : [1.50581]
Action : [1.20239]
Action : [0.298197]
Action : [-1.0234]
Action : [-1.70943]
Action : [-1.89297]
Action : [-1.93513]
Action : [-1.93242]
Action : [-1.84953]
Action : [-1.20664]
Action : [0.520794]
Action : [0.80293]
Action : [1.05102]
Action : [1.42026]
Action : [1.52625]
Action : [1.31282]
Action : [0.584086]
Action : [-0.73139]
Action : [-1.60758]
Action : [-1.86711]
Action : [-1.92915]
Action : [-1.93484]
Action : [-1.8892]
Action : [-1.45844]
Action : [0.236555]
Action : [0.729658]
Action : [0.999688]
Action : [1.338]
Action : [1.53383]
Action : [1.38889]
Action : [0.806745]
Action : [-0.435225]
Action : [-1.48298]
Action : [-1.83551]
Action : [-1.92195]
Action : [-1.93575]
Action : [-1.90751]
Action : [-1.62119]
Action : [-0.165997]
Action : [0.706541]
Action : [0.96

Action : [-1.93301]
Action : [-1.85868]
Action : [-1.26057]
Action : [0.478555]
Action : [0.78733]
Action : [1.04126]
Action : [1.40595]
Action : [1.52781]
Action : [1.32768]
Action : [0.626593]
Action : [-0.679397]
Action : [-1.58719]
Action : [-1.86183]
Action : [-1.92783]
Action : [-1.93489]
Action : [-1.89299]
Action : [-1.48965]
Action : [0.175104]
Action : [0.721442]
Action : [0.993517]
Action : [1.32453]
Action : [1.53492]
Action : [1.40068]
Action : [0.841068]
Action : [-0.384627]
Action : [-1.45973]
Action : [-1.82988]
Action : [-1.92092]
Action : [-1.93619]
Action : [-1.91059]
Action : [-1.64613]
Action : [-0.249721]
Action : [0.706605]
Action : [0.957753]
Action : [1.23993]
Action : [1.52871]
Action : [1.45727]
Action : [1.02107]
Action : [-0.0813246]
Action : [-1.2979]
Action : [-1.78839]
Action : [-1.9117]
Action : [-1.93716]
Action : [-1.92363]
Action : [-1.75647]
Action : [-0.718396]
Action : [0.674401]
Action : [0.897908]
Action : [1.14773]
Action : [1.49959]
Action : [

Action : [-0.335109]
Action : [0.704412]
Action : [0.94866]
Action : [1.22264]
Action : [1.52552]
Action : [1.46642]
Action : [1.05267]
Action : [-0.021576]
Action : [-1.26101]
Action : [-1.77854]
Action : [-1.90949]
Action : [-1.93717]
Action : [-1.92542]
Action : [-1.77407]
Action : [-0.806403]
Action : [0.662696]
Action : [0.885259]
Action : [1.13035]
Action : [1.49022]
Action : [1.50601]
Action : [1.20324]
Action : [0.300235]
Action : [-1.02162]
Action : [-1.70887]
Action : [-1.89283]
Action : [-1.9351]
Action : [-1.93245]
Action : [-1.84988]
Action : [-1.20868]
Action : [0.519339]
Action : [0.802339]
Action : [1.05065]
Action : [1.41974]
Action : [1.52632]
Action : [1.3134]
Action : [0.585702]
Action : [-0.729469]
Action : [-1.60684]
Action : [-1.86692]
Action : [-1.92911]
Action : [-1.93485]
Action : [-1.88937]
Action : [-1.45966]
Action : [0.234273]
Action : [0.729324]
Action : [0.999457]
Action : [1.33749]
Action : [1.53388]
Action : [1.38935]
Action : [0.808076]
Action : [-0.4

Action : [0.476706]
Action : [0.786686]
Action : [1.04087]
Action : [1.40534]
Action : [1.52786]
Action : [1.32828]
Action : [0.628329]
Action : [-0.677221]
Action : [-1.58632]
Action : [-1.8616]
Action : [-1.92777]
Action : [-1.93489]
Action : [-1.89313]
Action : [-1.49091]
Action : [0.17249]
Action : [0.721118]
Action : [0.993254]
Action : [1.32396]
Action : [1.53495]
Action : [1.40117]
Action : [0.84249]
Action : [-0.382493]
Action : [-1.45874]
Action : [-1.82964]
Action : [-1.92087]
Action : [-1.93621]
Action : [-1.91071]
Action : [-1.64712]
Action : [-0.253272]
Action : [0.706537]
Action : [0.957379]
Action : [1.23919]
Action : [1.52859]
Action : [1.45766]
Action : [1.02242]
Action : [-0.0788155]
Action : [-1.29639]
Action : [-1.78799]
Action : [-1.91161]
Action : [-1.93717]
Action : [-1.9237]
Action : [-1.75722]
Action : [-0.722127]
Action : [0.673985]
Action : [0.897398]
Action : [1.14699]
Action : [1.49921]
Action : [1.50053]
Action : [1.1803]
Action : [0.245776]
Action : [-1.0

Action : [0.704305]
Action : [0.948306]
Action : [1.22201]
Action : [1.5254]
Action : [1.46675]
Action : [1.05383]
Action : [-0.0193353]
Action : [-1.25959]
Action : [-1.77815]
Action : [-1.9094]
Action : [-1.93717]
Action : [-1.92548]
Action : [-1.77473]
Action : [-0.809637]
Action : [0.662187]
Action : [0.884767]
Action : [1.12969]
Action : [1.48985]
Action : [1.50622]
Action : [1.20414]
Action : [0.302381]
Action : [-1.01973]
Action : [-1.70827]
Action : [-1.89268]
Action : [-1.93507]
Action : [-1.93248]
Action : [-1.85026]
Action : [-1.21083]
Action : [0.517798]
Action : [0.801714]
Action : [1.05026]
Action : [1.4192]
Action : [1.5264]
Action : [1.31401]
Action : [0.587409]
Action : [-0.727436]
Action : [-1.60606]
Action : [-1.86672]
Action : [-1.92906]
Action : [-1.93485]
Action : [-1.88955]
Action : [-1.46095]
Action : [0.231852]
Action : [0.72897]
Action : [0.999212]
Action : [1.33695]
Action : [1.53393]
Action : [1.38984]
Action : [0.809487]
Action : [-0.431249]
Action : [-1.48

Action : [0.474912]
Action : [0.786063]
Action : [1.04048]
Action : [1.40476]
Action : [1.52792]
Action : [1.32886]
Action : [0.630011]
Action : [-0.675111]
Action : [-1.58548]
Action : [-1.86139]
Action : [-1.92772]
Action : [-1.93489]
Action : [-1.89327]
Action : [-1.49214]
Action : [0.169947]
Action : [0.720803]
Action : [0.992999]
Action : [1.32341]
Action : [1.53498]
Action : [1.40164]
Action : [0.843872]
Action : [-0.380416]
Action : [-1.45776]
Action : [-1.82941]
Action : [-1.92082]
Action : [-1.93623]
Action : [-1.91083]
Action : [-1.64809]
Action : [-0.256732]
Action : [0.706469]
Action : [0.957014]
Action : [1.23848]
Action : [1.52846]
Action : [1.45805]
Action : [1.02373]
Action : [-0.0763642]
Action : [-1.29491]
Action : [-1.7876]
Action : [-1.91152]
Action : [-1.93717]
Action : [-1.92378]
Action : [-1.75795]
Action : [-0.72577]
Action : [0.67357]
Action : [0.896899]
Action : [1.14627]
Action : [1.49884]
Action : [1.50077]
Action : [1.1813]
Action : [0.248114]
Action : [-1.

Action : [-1.56272]
Action : [-1.85547]
Action : [-1.92623]
Action : [-1.93489]
Action : [-1.89654]
Action : [-1.52295]
Action : [0.101876]
Action : [0.713449]
Action : [0.987872]
Action : [1.30893]
Action : [1.53533]
Action : [1.41291]
Action : [0.877653]
Action : [-0.328207]
Action : [-1.43263]
Action : [-1.82321]
Action : [-1.91949]
Action : [-1.93657]
Action : [-1.91355]
Action : [-1.67069]
Action : [-0.341335]
Action : [0.704209]
Action : [0.947982]
Action : [1.22144]
Action : [1.52527]
Action : [1.46705]
Action : [1.05489]
Action : [-0.0172943]
Action : [-1.25829]
Action : [-1.77781]
Action : [-1.90933]
Action : [-1.93717]
Action : [-1.92554]
Action : [-1.77533]
Action : [-0.812575]
Action : [0.661718]
Action : [0.884319]
Action : [1.12908]
Action : [1.48949]
Action : [1.50642]
Action : [1.20496]
Action : [0.304353]
Action : [-1.01799]
Action : [-1.70772]
Action : [-1.89254]
Action : [-1.93504]
Action : [-1.9325]
Action : [-1.8506]
Action : [-1.21281]
Action : [0.516374]
Action :

Action : [-1.90689]
Action : [-1.93709]
Action : [-1.92725]
Action : [-1.79263]
Action : [-0.898571]
Action : [0.646503]
Action : [0.870585]
Action : [1.11177]
Action : [1.47833]
Action : [1.51147]
Action : [1.22792]
Action : [0.36101]
Action : [-0.966164]
Action : [-1.69085]
Action : [-1.88824]
Action : [-1.93406]
Action : [-1.93307]
Action : [-1.85966]
Action : [-1.26648]
Action : [0.473433]
Action : [0.78555]
Action : [1.04017]
Action : [1.40428]
Action : [1.52797]
Action : [1.32934]
Action : [0.631393]
Action : [-0.673373]
Action : [-1.58478]
Action : [-1.86121]
Action : [-1.92767]
Action : [-1.93489]
Action : [-1.89338]
Action : [-1.49315]
Action : [0.167847]
Action : [0.720544]
Action : [0.992788]
Action : [1.32295]
Action : [1.53501]
Action : [1.40203]
Action : [0.845011]
Action : [-0.378701]
Action : [-1.45696]
Action : [-1.82921]
Action : [-1.92078]
Action : [-1.93625]
Action : [-1.91093]
Action : [-1.64889]
Action : [-0.259595]
Action : [0.706412]
Action : [0.956711]
Action :

Action : [-1.89664]
Action : [-1.52387]
Action : [0.0997272]
Action : [0.713266]
Action : [0.987726]
Action : [1.30848]
Action : [1.53533]
Action : [1.41324]
Action : [0.878662]
Action : [-0.326615]
Action : [-1.43185]
Action : [-1.82302]
Action : [-1.91945]
Action : [-1.93658]
Action : [-1.91363]
Action : [-1.67135]
Action : [-0.343893]
Action : [0.704131]
Action : [0.9477]
Action : [1.22094]
Action : [1.52516]
Action : [1.46731]
Action : [1.0558]
Action : [-0.0155288]
Action : [-1.25717]
Action : [-1.7775]
Action : [-1.90926]
Action : [-1.93717]
Action : [-1.92559]
Action : [-1.77584]
Action : [-0.815103]
Action : [0.66131]
Action : [0.883932]
Action : [1.12856]
Action : [1.48918]
Action : [1.50659]
Action : [1.20566]
Action : [0.306047]
Action : [-1.01649]
Action : [-1.70724]
Action : [-1.89242]
Action : [-1.93502]
Action : [-1.93253]
Action : [-1.8509]
Action : [-1.2145]
Action : [0.515143]
Action : [0.800641]
Action : [1.04959]
Action : [1.41826]
Action : [1.52653]
Action : [1.315

Action : [-1.6928]
Action : [-0.429532]
Action : [0.700398]
Action : [0.937785]
Action : [1.20373]
Action : [1.52074]
Action : [1.47593]
Action : [1.08659]
Action : [0.0450528]
Action : [-1.21755]
Action : [-1.76672]
Action : [-1.90681]
Action : [-1.93708]
Action : [-1.92729]
Action : [-1.79314]
Action : [-0.901098]
Action : [0.645975]
Action : [0.870158]
Action : [1.11124]
Action : [1.47798]
Action : [1.51161]
Action : [1.2286]
Action : [0.362718]
Action : [-0.964557]
Action : [-1.69032]
Action : [-1.88811]
Action : [-1.93403]
Action : [-1.93309]
Action : [-1.85992]
Action : [-1.26807]
Action : [0.472035]
Action : [0.785066]
Action : [1.03987]
Action : [1.40382]
Action : [1.52801]
Action : [1.32979]
Action : [0.632698]
Action : [-0.671733]
Action : [-1.58413]
Action : [-1.86104]
Action : [-1.92763]
Action : [-1.9349]
Action : [-1.89349]
Action : [-1.4941]
Action : [0.165861]
Action : [0.720299]
Action : [0.99259]
Action : [1.32252]
Action : [1.53503]
Action : [1.4024]
Action : [0.8460

Action : [-1.3201]
Action : [0.423196]
Action : [0.769863]
Action : [1.02935]
Action : [1.38807]
Action : [1.52922]
Action : [1.34445]
Action : [0.675732]
Action : [-0.616049]
Action : [-1.56134]
Action : [-1.85511]
Action : [-1.92614]
Action : [-1.93489]
Action : [-1.89673]
Action : [-1.52476]
Action : [0.09765]
Action : [0.713091]
Action : [0.987584]
Action : [1.30805]
Action : [1.53534]
Action : [1.41356]
Action : [0.879638]
Action : [-0.325072]
Action : [-1.43109]
Action : [-1.82283]
Action : [-1.91941]
Action : [-1.93659]
Action : [-1.9137]
Action : [-1.67198]
Action : [-0.346374]
Action : [0.704054]
Action : [0.947425]
Action : [1.22046]
Action : [1.52505]
Action : [1.46757]
Action : [1.05669]
Action : [-0.0138144]
Action : [-1.25607]
Action : [-1.77721]
Action : [-1.90919]
Action : [-1.93717]
Action : [-1.92564]
Action : [-1.77634]
Action : [-0.817556]
Action : [0.660922]
Action : [0.883549]
Action : [1.12805]
Action : [1.48888]
Action : [1.50674]
Action : [1.20634]
Action : [0.

Action : [0.71587]
Action : [-0.562525]
Action : [-1.53885]
Action : [-1.84936]
Action : [-1.92479]
Action : [-1.935]
Action : [-1.89975]
Action : [-1.55381]
Action : [0.0267449]
Action : [0.707166]
Action : [0.982781]
Action : [1.2933]
Action : [1.53518]
Action : [1.42444]
Action : [0.91267]
Action : [-0.272045]
Action : [-1.40451]
Action : [-1.81622]
Action : [-1.918]
Action : [-1.9369]
Action : [-1.91633]
Action : [-1.69342]
Action : [-0.432076]
Action : [0.700238]
Action : [0.93747]
Action : [1.2032]
Action : [1.5206]
Action : [1.47618]
Action : [1.08751]
Action : [0.0469008]
Action : [-1.21631]
Action : [-1.76638]
Action : [-1.90673]
Action : [-1.93708]
Action : [-1.92735]
Action : [-1.79366]
Action : [-0.903668]
Action : [0.645434]
Action : [0.86972]
Action : [1.1107]
Action : [1.47763]
Action : [1.51176]
Action : [1.2293]
Action : [0.364461]
Action : [-0.962915]
Action : [-1.68978]
Action : [-1.88797]
Action : [-1.934]
Action : [-1.9331]
Action : [-1.86019]
Action : [-1.26971]
A

Action : [1.1168]
Action : [0.106803]
Action : [-1.17483]
Action : [-1.75484]
Action : [-1.90405]
Action : [-1.93689]
Action : [-1.92889]
Action : [-1.80978]
Action : [-0.984863]
Action : [0.625543]
Action : [0.855142]
Action : [1.09404]
Action : [1.46534]
Action : [1.51631]
Action : [1.25158]
Action : [0.420381]
Action : [-0.909157]
Action : [-1.67182]
Action : [-1.88345]
Action : [-1.93301]
Action : [-1.93371]
Action : [-1.86875]
Action : [-1.32157]
Action : [0.42171]
Action : [0.769419]
Action : [1.02904]
Action : [1.3876]
Action : [1.52926]
Action : [1.34488]
Action : [0.676993]
Action : [-0.614384]
Action : [-1.56065]
Action : [-1.85494]
Action : [-1.9261]
Action : [-1.93489]
Action : [-1.89682]
Action : [-1.52566]
Action : [0.0955154]
Action : [0.712911]
Action : [0.987439]
Action : [1.3076]
Action : [1.53534]
Action : [1.41389]
Action : [0.880639]
Action : [-0.323489]
Action : [-1.43031]
Action : [-1.82264]
Action : [-1.91937]
Action : [-1.93659]
Action : [-1.91378]
Action : [-1

Action : [-1.90137]
Action : [-1.93665]
Action : [-1.93022]
Action : [-1.82298]
Action : [-1.05713]
Action : [0.602638]
Action : [0.840735]
Action : [1.07965]
Action : [1.45295]
Action : [1.52]
Action : [1.27125]
Action : [0.471115]
Action : [-0.857565]
Action : [-1.654]
Action : [-1.87896]
Action : [-1.932]
Action : [-1.93419]
Action : [-1.87584]
Action : [-1.36702]
Action : [0.372321]
Action : [0.755646]
Action : [1.01906]
Action : [1.37254]
Action : [1.53053]
Action : [1.35838]
Action : [0.716999]
Action : [-0.560993]
Action : [-1.53819]
Action : [-1.84919]
Action : [-1.92475]
Action : [-1.935]
Action : [-1.89983]
Action : [-1.55461]
Action : [0.0246848]
Action : [0.706996]
Action : [0.982639]
Action : [1.2929]
Action : [1.53517]
Action : [1.42475]
Action : [0.9136]
Action : [-0.270526]
Action : [-1.40374]
Action : [-1.81603]
Action : [-1.91796]
Action : [-1.93691]
Action : [-1.91641]
Action : [-1.69402]
Action : [-0.434523]
Action : [0.700083]
Action : [0.937168]
Action : [1.20269]

Action : [1.37151]
Action : [0.756187]
Action : [-0.506942]
Action : [-1.51477]
Action : [-1.84327]
Action : [-1.92343]
Action : [-1.93518]
Action : [-1.90293]
Action : [-1.58303]
Action : [-0.0527353]
Action : [0.704942]
Action : [0.976979]
Action : [1.27855]
Action : [1.53434]
Action : [1.43512]
Action : [0.945855]
Action : [-0.216601]
Action : [-1.37547]
Action : [-1.80886]
Action : [-1.91642]
Action : [-1.93716]
Action : [-1.91888]
Action : [-1.71408]
Action : [-0.519389]
Action : [0.693689]
Action : [0.92635]
Action : [1.18632]
Action : [1.51538]
Action : [1.48427]
Action : [1.11764]
Action : [0.10856]
Action : [-1.17358]
Action : [-1.75449]
Action : [-1.90397]
Action : [-1.93689]
Action : [-1.92894]
Action : [-1.81022]
Action : [-0.987213]
Action : [0.624881]
Action : [0.854697]
Action : [1.09353]
Action : [1.46494]
Action : [1.51644]
Action : [1.25225]
Action : [0.422056]
Action : [-0.907504]
Action : [-1.67126]
Action : [-1.88331]
Action : [-1.93298]
Action : [-1.93372]
Action 

Action : [1.44433]
Action : [0.977056]
Action : [-0.161316]
Action : [-1.34463]
Action : [-1.80072]
Action : [-1.91449]
Action : [-1.93712]
Action : [-1.9209]
Action : [-1.73174]
Action : [-0.599012]
Action : [0.685855]
Action : [0.91549]
Action : [1.17106]
Action : [1.51022]
Action : [1.491]
Action : [1.14359]
Action : [0.163546]
Action : [-1.13335]
Action : [-1.74302]
Action : [-1.90127]
Action : [-1.93664]
Action : [-1.93026]
Action : [-1.82338]
Action : [-1.05934]
Action : [0.601807]
Action : [0.84026]
Action : [1.07922]
Action : [1.45255]
Action : [1.52011]
Action : [1.27184]
Action : [0.47267]
Action : [-0.855932]
Action : [-1.65342]
Action : [-1.87882]
Action : [-1.93197]
Action : [-1.9342]
Action : [-1.87604]
Action : [-1.36836]
Action : [0.370747]
Action : [0.755249]
Action : [1.01875]
Action : [1.37207]
Action : [1.53057]
Action : [1.35879]
Action : [0.718201]
Action : [-0.559358]
Action : [-1.53749]
Action : [-1.84902]
Action : [-1.92471]
Action : [-1.935]
Action : [-1.89992

Action : [1.49776]
Action : [1.16917]
Action : [0.220008]
Action : [-1.0895]
Action : [-1.73005]
Action : [-1.89817]
Action : [-1.93622]
Action : [-1.93141]
Action : [-1.83548]
Action : [-1.12601]
Action : [0.57044]
Action : [0.8244]
Action : [1.0659]
Action : [1.43895]
Action : [1.52316]
Action : [1.29055]
Action : [0.522646]
Action : [-0.801987]
Action : [-1.63404]
Action : [-1.87388]
Action : [-1.9308]
Action : [-1.93454]
Action : [-1.88223]
Action : [-1.41047]
Action : [0.316463]
Action : [0.742631]
Action : [1.00897]
Action : [1.3568]
Action : [1.5318]
Action : [1.37196]
Action : [0.757497]
Action : [-0.505121]
Action : [-1.51398]
Action : [-1.84308]
Action : [-1.92339]
Action : [-1.93519]
Action : [-1.90304]
Action : [-1.58402]
Action : [-0.0555208]
Action : [0.704973]
Action : [0.97672]
Action : [1.27802]
Action : [1.53427]
Action : [1.43544]
Action : [0.946948]
Action : [-0.214697]
Action : [-1.37443]
Action : [-1.80859]
Action : [-1.91635]
Action : [-1.93716]
Action : [-1.9189

Action : [-0.453493]
Action : [-1.4912]
Action : [-1.8375]
Action : [-1.92232]
Action : [-1.93559]
Action : [-1.90634]
Action : [-1.61172]
Action : [-0.136508]
Action : [0.70619]
Action : [0.968928]
Action : [1.26235]
Action : [1.53199]
Action : [1.44465]
Action : [0.978108]
Action : [-0.159425]
Action : [-1.34355]
Action : [-1.80044]
Action : [-1.91442]
Action : [-1.93712]
Action : [-1.92097]
Action : [-1.73234]
Action : [-0.601763]
Action : [0.685587]
Action : [0.915089]
Action : [1.1705]
Action : [1.51]
Action : [1.49122]
Action : [1.14447]
Action : [0.165458]
Action : [-1.1319]
Action : [-1.7426]
Action : [-1.90117]
Action : [-1.93662]
Action : [-1.9303]
Action : [-1.8238]
Action : [-1.06172]
Action : [0.600909]
Action : [0.839749]
Action : [1.07877]
Action : [1.45212]
Action : [1.52021]
Action : [1.27247]
Action : [0.474342]
Action : [-0.854174]
Action : [-1.6528]
Action : [-1.87866]
Action : [-1.93193]
Action : [-1.93421]
Action : [-1.87625]
Action : [-1.3698]
Action : [0.369049]

Action : [-1.79188]
Action : [-1.91247]
Action : [-1.93714]
Action : [-1.92287]
Action : [-1.74973]
Action : [-0.685156]
Action : [0.677807]
Action : [0.902457]
Action : [1.15421]
Action : [1.50289]
Action : [1.49801]
Action : [1.1701]
Action : [0.22211]
Action : [-1.08781]
Action : [-1.72954]
Action : [-1.89805]
Action : [-1.9362]
Action : [-1.93145]
Action : [-1.8359]
Action : [-1.12838]
Action : [0.569175]
Action : [0.823804]
Action : [1.06543]
Action : [1.43843]
Action : [1.52326]
Action : [1.29123]
Action : [0.524469]
Action : [-0.799966]
Action : [-1.6333]
Action : [-1.87369]
Action : [-1.93075]
Action : [-1.93456]
Action : [-1.88245]
Action : [-1.41198]
Action : [0.314284]
Action : [0.742218]
Action : [1.00865]
Action : [1.35624]
Action : [1.53186]
Action : [1.37247]
Action : [0.758975]
Action : [-0.503067]
Action : [-1.51308]
Action : [-1.84286]
Action : [-1.92335]
Action : [-1.93521]
Action : [-1.90317]
Action : [-1.58514]
Action : [-0.0586687]
Action : [0.705018]
Action : [0.

Action : [-1.86873]
Action : [-1.92955]
Action : [-1.9348]
Action : [-1.88775]
Action : [-1.44789]
Action : [0.255943]
Action : [0.732518]
Action : [1.00159]
Action : [1.34234]
Action : [1.53342]
Action : [1.38501]
Action : [0.795467]
Action : [-0.4515]
Action : [-1.4903]
Action : [-1.83729]
Action : [-1.92228]
Action : [-1.93561]
Action : [-1.90646]
Action : [-1.61275]
Action : [-0.139695]
Action : [0.70623]
Action : [0.96862]
Action : [1.26173]
Action : [1.5319]
Action : [1.445]
Action : [0.97932]
Action : [-0.157245]
Action : [-1.34231]
Action : [-1.80011]
Action : [-1.91435]
Action : [-1.93712]
Action : [-1.92105]
Action : [-1.73302]
Action : [-0.604939]
Action : [0.685274]
Action : [0.914625]
Action : [1.16986]
Action : [1.50974]
Action : [1.49147]
Action : [1.14548]
Action : [0.167671]
Action : [-1.13022]
Action : [-1.7421]
Action : [-1.90106]
Action : [-1.93661]
Action : [-1.93035]
Action : [-1.82429]
Action : [-1.06444]
Action : [0.599833]
Action : [0.83915]
Action : [1.07823]


Action : [0.995651]
Action : [1.32912]
Action : [1.53467]
Action : [1.39676]
Action : [0.829575]
Action : [-0.401795]
Action : [-1.46772]
Action : [-1.83182]
Action : [-1.92128]
Action : [-1.93605]
Action : [-1.90959]
Action : [-1.63812]
Action : [-0.221079]
Action : [0.706772]
Action : [0.960607]
Action : [1.24564]
Action : [1.52955]
Action : [1.45412]
Action : [1.01034]
Action : [-0.101099]
Action : [-1.3097]
Action : [-1.79151]
Action : [-1.91239]
Action : [-1.93715]
Action : [-1.92295]
Action : [-1.75045]
Action : [-0.688696]
Action : [0.677469]
Action : [0.901934]
Action : [1.15354]
Action : [1.50256]
Action : [1.49827]
Action : [1.17111]
Action : [0.224416]
Action : [-1.08594]
Action : [-1.72898]
Action : [-1.89791]
Action : [-1.93617]
Action : [-1.93149]
Action : [-1.83635]
Action : [-1.13089]
Action : [0.56781]
Action : [0.823172]
Action : [1.06493]
Action : [1.43788]
Action : [1.52337]
Action : [1.29194]
Action : [0.526388]
Action : [-0.797835]
Action : [-1.63252]
Action : [-1

Action : [-1.78163]
Action : [-1.91018]
Action : [-1.93718]
Action : [-1.92488]
Action : [-1.76872]
Action : [-0.779812]
Action : [0.666669]
Action : [0.889223]
Action : [1.13573]
Action : [1.49314]
Action : [1.50428]
Action : [1.19596]
Action : [0.282805]
Action : [-1.03681]
Action : [-1.71367]
Action : [-1.89404]
Action : [-1.93535]
Action : [-1.93223]
Action : [-1.84683]
Action : [-1.19123]
Action : [0.531555]
Action : [0.807342]
Action : [1.05379]
Action : [1.4241]
Action : [1.5257]
Action : [1.3085]
Action : [0.571998]
Action : [-0.745677]
Action : [-1.61304]
Action : [-1.86851]
Action : [-1.9295]
Action : [-1.9348]
Action : [-1.88794]
Action : [-1.44932]
Action : [0.253342]
Action : [0.732132]
Action : [1.00134]
Action : [1.34176]
Action : [1.53347]
Action : [1.38553]
Action : [0.796981]
Action : [-0.449323]
Action : [-1.48933]
Action : [-1.83705]
Action : [-1.92223]
Action : [-1.93563]
Action : [-1.9066]
Action : [-1.61389]
Action : [-0.143187]
Action : [0.706275]
Action : [0.96

Action : [1.32338]
Action : [0.614153]
Action : [-0.694894]
Action : [-1.59335]
Action : [-1.86343]
Action : [-1.92824]
Action : [-1.93489]
Action : [-1.89198]
Action : [-1.48063]
Action : [0.193509]
Action : [0.723722]
Action : [0.995376]
Action : [1.32853]
Action : [1.5347]
Action : [1.39726]
Action : [0.831048]
Action : [-0.399605]
Action : [-1.46671]
Action : [-1.83157]
Action : [-1.92124]
Action : [-1.93607]
Action : [-1.90972]
Action : [-1.63914]
Action : [-0.224717]
Action : [0.706761]
Action : [0.960249]
Action : [1.24492]
Action : [1.52945]
Action : [1.45452]
Action : [1.01171]
Action : [-0.0985996]
Action : [-1.30822]
Action : [-1.79112]
Action : [-1.9123]
Action : [-1.93715]
Action : [-1.92304]
Action : [-1.75122]
Action : [-0.692454]
Action : [0.677102]
Action : [0.9014]
Action : [1.15281]
Action : [1.50219]
Action : [1.49854]
Action : [1.17216]
Action : [0.226839]
Action : [-1.08397]
Action : [-1.72837]
Action : [-1.89776]
Action : [-1.93614]
Action : [-1.93152]
Action : [

Action : [-1.92675]
Action : [-1.93488]
Action : [-1.89543]
Action : [-1.51219]
Action : [0.126668]
Action : [0.715621]
Action : [0.989596]
Action : [1.31416]
Action : [1.5353]
Action : [1.40907]
Action : [0.865959]
Action : [-0.346595]
Action : [-1.44164]
Action : [-1.82546]
Action : [-1.91999]
Action : [-1.93647]
Action : [-1.91265]
Action : [-1.66308]
Action : [-0.312066]
Action : [0.705127]
Action : [0.951134]
Action : [1.22705]
Action : [1.52641]
Action : [1.46406]
Action : [1.04445]
Action : [-0.0373365]
Action : [-1.27093]
Action : [-1.78121]
Action : [-1.91009]
Action : [-1.93718]
Action : [-1.92496]
Action : [-1.76947]
Action : [-0.783566]
Action : [0.666133]
Action : [0.888671]
Action : [1.13498]
Action : [1.49273]
Action : [1.50452]
Action : [1.19698]
Action : [0.285251]
Action : [-1.03469]
Action : [-1.71301]
Action : [-1.89387]
Action : [-1.93532]
Action : [-1.93226]
Action : [-1.84726]
Action : [-1.19368]
Action : [0.529872]
Action : [0.806647]
Action : [1.05335]
Action :

Action : [0.021382]
Action : [-1.23329]
Action : [-1.77103]
Action : [-1.9078]
Action : [-1.93713]
Action : [-1.92664]
Action : [-1.78653]
Action : [-0.867903]
Action : [0.652561]
Action : [0.875666]
Action : [1.11807]
Action : [1.48245]
Action : [1.50968]
Action : [1.21969]
Action : [0.340529]
Action : [-0.985238]
Action : [-1.69711]
Action : [-1.88983]
Action : [-1.93442]
Action : [-1.93287]
Action : [-1.85648]
Action : [-1.24733]
Action : [0.489758]
Action : [0.791263]
Action : [1.04368]
Action : [1.40963]
Action : [1.52746]
Action : [1.32401]
Action : [0.615978]
Action : [-0.692631]
Action : [-1.59246]
Action : [-1.8632]
Action : [-1.92818]
Action : [-1.93489]
Action : [-1.89212]
Action : [-1.48195]
Action : [0.190845]
Action : [0.723392]
Action : [0.995106]
Action : [1.32795]
Action : [1.53473]
Action : [1.39775]
Action : [0.832499]
Action : [-0.397442]
Action : [-1.4657]
Action : [-1.83133]
Action : [-1.92119]
Action : [-1.93608]
Action : [-1.90984]
Action : [-1.64015]
Action : [

Action : [1.51454]
Action : [1.24286]
Action : [0.398412]
Action : [-0.930598]
Action : [-1.67903]
Action : [-1.88526]
Action : [-1.9334]
Action : [-1.93346]
Action : [-1.8654]
Action : [-1.3012]
Action : [0.441705]
Action : [0.775454]
Action : [1.03329]
Action : [1.39398]
Action : [1.52874]
Action : [1.33904]
Action : [0.659807]
Action : [-0.636922]
Action : [-1.56996]
Action : [-1.85735]
Action : [-1.92669]
Action : [-1.93488]
Action : [-1.89555]
Action : [-1.51339]
Action : [0.12396]
Action : [0.715356]
Action : [0.989395]
Action : [1.31357]
Action : [1.5353]
Action : [1.40949]
Action : [0.86725]
Action : [-0.344568]
Action : [-1.44065]
Action : [-1.82521]
Action : [-1.91993]
Action : [-1.93648]
Action : [-1.91275]
Action : [-1.66391]
Action : [-0.315238]
Action : [0.705033]
Action : [0.950797]
Action : [1.22645]
Action : [1.52629]
Action : [1.46439]
Action : [1.04558]
Action : [-0.0351835]
Action : [-1.26958]
Action : [-1.78084]
Action : [-1.91001]
Action : [-1.93718]
Action : [-1.

Action : [0.0539966]
Action : [0.709425]
Action : [0.98462]
Action : [1.29871]
Action : [1.53535]
Action : [1.42035]
Action : [0.900198]
Action : [-0.29228]
Action : [-1.41477]
Action : [-1.81879]
Action : [-1.91854]
Action : [-1.93678]
Action : [-1.91534]
Action : [-1.68539]
Action : [-0.399592]
Action : [0.702135]
Action : [0.941423]
Action : [1.20995]
Action : [1.52241]
Action : [1.47294]
Action : [1.07575]
Action : [0.0234543]
Action : [-1.23192]
Action : [-1.77066]
Action : [-1.90771]
Action : [-1.93712]
Action : [-1.9267]
Action : [-1.78712]
Action : [-0.870847]
Action : [0.652009]
Action : [0.875186]
Action : [1.11747]
Action : [1.48206]
Action : [1.50985]
Action : [1.22048]
Action : [0.342483]
Action : [-0.983435]
Action : [-1.69652]
Action : [-1.88968]
Action : [-1.93439]
Action : [-1.93289]
Action : [-1.85678]
Action : [-1.24915]
Action : [0.488234]
Action : [0.790724]
Action : [1.04335]
Action : [1.40913]
Action : [1.52751]
Action : [1.32451]
Action : [0.617432]
Action : [-0

Action : [-1.91711]
Action : [-1.93711]
Action : [-1.91797]
Action : [-1.70642]
Action : [-0.486095]
Action : [0.696474]
Action : [0.930648]
Action : [1.1925]
Action : [1.51741]
Action : [1.48132]
Action : [1.10652]
Action : [0.0855204]
Action : [-1.18984]
Action : [-1.75905]
Action : [-1.90504]
Action : [-1.93697]
Action : [-1.92836]
Action : [-1.80426]
Action : [-0.956406]
Action : [0.633158]
Action : [0.860427]
Action : [1.10001]
Action : [1.47001]
Action : [1.51469]
Action : [1.24362]
Action : [0.400307]
Action : [-0.928766]
Action : [-1.67842]
Action : [-1.8851]
Action : [-1.93337]
Action : [-1.93348]
Action : [-1.86569]
Action : [-1.30296]
Action : [0.440022]
Action : [0.774941]
Action : [1.03293]
Action : [1.39344]
Action : [1.52878]
Action : [1.33953]
Action : [0.661272]
Action : [-0.635012]
Action : [-1.56918]
Action : [-1.85714]
Action : [-1.92664]
Action : [-1.93488]
Action : [-1.89566]
Action : [-1.51443]
Action : [0.12161]
Action : [0.715131]
Action : [0.989223]
Action : [

Action : [1.48832]
Action : [1.13304]
Action : [0.14094]
Action : [-1.15017]
Action : [-1.74786]
Action : [-1.90242]
Action : [-1.93676]
Action : [-1.92974]
Action : [-1.81817]
Action : [-1.0302]
Action : [0.611856]
Action : [0.846283]
Action : [1.08496]
Action : [1.45762]
Action : [1.51868]
Action : [1.26398]
Action : [0.452188]
Action : [-0.877149]
Action : [-1.66083]
Action : [-1.88069]
Action : [-1.9324]
Action : [-1.93402]
Action : [-1.8733]
Action : [-1.35026]
Action : [0.391365]
Action : [0.760642]
Action : [1.02285]
Action : [1.37824]
Action : [1.53008]
Action : [1.35337]
Action : [0.702033]
Action : [-0.581141]
Action : [-1.54675]
Action : [-1.85138]
Action : [-1.92526]
Action : [-1.93495]
Action : [-1.89869]
Action : [-1.54381]
Action : [0.0517791]
Action : [0.709239]
Action : [0.98447]
Action : [1.29826]
Action : [1.53534]
Action : [1.42069]
Action : [0.901227]
Action : [-0.290622]
Action : [-1.41394]
Action : [-1.81858]
Action : [-1.9185]
Action : [-1.93679]
Action : [-1.91

Action : [-1.39398]
Action : [0.33912]
Action : [0.747509]
Action : [1.01271]
Action : [1.36291]
Action : [1.53126]
Action : [1.36664]
Action : [0.741726]
Action : [-0.527056]
Action : [-1.52354]
Action : [-1.84547]
Action : [-1.9239]
Action : [-1.93509]
Action : [-1.90174]
Action : [-1.57242]
Action : [-0.0232238]
Action : [0.705184]
Action : [0.979423]
Action : [1.28404]
Action : [1.53484]
Action : [1.43146]
Action : [0.934047]
Action : [-0.236786]
Action : [-1.38629]
Action : [-1.81166]
Action : [-1.91705]
Action : [-1.93712]
Action : [-1.91805]
Action : [-1.70707]
Action : [-0.488886]
Action : [0.696254]
Action : [0.930292]
Action : [1.19199]
Action : [1.51725]
Action : [1.48157]
Action : [1.10746]
Action : [0.0874517]
Action : [-1.18849]
Action : [-1.75867]
Action : [-1.90495]
Action : [-1.93697]
Action : [-1.92841]
Action : [-1.80478]
Action : [-0.958986]
Action : [0.632498]
Action : [0.859956]
Action : [1.09948]
Action : [1.46959]
Action : [1.51484]
Action : [1.24434]
Action : [

Action : [1.53277]
Action : [1.37949]
Action : [0.779389]
Action : [-0.474437]
Action : [-1.50052]
Action : [-1.83978]
Action : [-1.92275]
Action : [-1.93543]
Action : [-1.905]
Action : [-1.60065]
Action : [-0.103315]
Action : [0.705727]
Action : [0.972129]
Action : [1.2688]
Action : [1.53293]
Action : [1.44089]
Action : [0.965422]
Action : [-0.182113]
Action : [-1.35637]
Action : [-1.80382]
Action : [-1.91522]
Action : [-1.93713]
Action : [-1.92013]
Action : [-1.7252]
Action : [-0.568863]
Action : [0.688856]
Action : [0.919789]
Action : [1.177]
Action : [1.51228]
Action : [1.48853]
Action : [1.13386]
Action : [0.142669]
Action : [-1.1489]
Action : [-1.7475]
Action : [-1.90233]
Action : [-1.93675]
Action : [-1.92978]
Action : [-1.81859]
Action : [-1.03249]
Action : [0.611111]
Action : [0.84582]
Action : [1.08451]
Action : [1.45723]
Action : [1.51879]
Action : [1.2646]
Action : [0.453788]
Action : [-0.875507]
Action : [-1.66026]
Action : [-1.88055]
Action : [-1.93236]
Action : [-1.93403

Excessive output truncated after 524293 bytes.

Action : [-0.788654]
Action : [-1.62915]
Action : [-1.87264]
Action : [-1.93051]
Action : [-1.93462]
Action : [-1.88369]
Action : [-1.42024]
Action : [0.301932]
Action : [0.739905]
Action : [1.00682]
Action : [1.35311]
Action : [1.53222]
Action : [1.3753]
Action : [0.767241]
Action : [-0.491525]
Action : [-1.50804]
Action : [-1.84162]
Action : [-1.9231]
Action : [-1.93529]
Action : [-1.9039]
Action : [-1.5914]
Action : [-0.0764724]
Action : [0.705309]
Action : [0.974715]
Action : [1.27399]
Action : [1.53368]
Action : [1.43783]
Action : [0.955063]
Action : [-0.200451]
Action : [-1.36658]
Action : [-1.80652]
Action : [-1.91586]
Action : [-1.93714]
Action : [-1.91947]
Action : [-1.71933]
Action : [-0.542493]
Action : [0.691525]
Action : [0.923324]
Action : [1.18201]
Action : [1.51395]
Action : [1.48626]
Action : [1.12521]
Action : [0.124412]
Action : [-1.1622]
Action : [-1.75127]
Action : [-1.90321]
Action : [-1.93682]
Action : [-1.92933]
Action : [-1.81416]
Action : [-1.0083]
Action : [0

-1390.819616030872

In [None]:
policy_base(Array(ro[1][1][1]))

In [None]:
function loss(a)
    r = exp.(a .- (ones(size(a)) |> gpu))
    s1 = r .* (rand(size(a)) |> gpu)
    s2 = clamp.(a,0.9,1.1)
    -1.0 * mean(min.(s1,s2))
end

In [None]:
gs = Tracker.gradient(() -> loss(out),params(m))

In [None]:
gs[m.layers[1].W]

In [None]:
using Flux,CuArrays
using Flux:Tracker
using Statistics

m = Chain(Conv((3,3),3=>64)) |> gpu
x = rand(256,256,3,1) |> gpu

In [None]:
function loss(x)
   out = m(x)
   mean(out)
end

In [None]:
function test()
    @time o = loss(x)
    @time gs = Tracker.gradient(() -> loss(x),params(m))
end

test()

In [None]:
using Flux,CuArrays
using Flux:Tracker
using Flux:@treelike
using Statistics

In [None]:
struct Net
    u
end

@treelike Net

function Net()
   Net(Chain(Conv((3,3),3=>64))) 
end

function (n::Net)(x)
   return n.u(x) 
end

In [None]:
m = Net() |> gpu
x = rand(256,256,3,1) |> gpu

function loss(x)
   out = m(x)
   mean(out)
end

function test()
    @time o = loss(x)
    @time gs = Tracker.gradient(() -> loss(x),params(m))
end

test()

In [None]:
a = param(ones(2)) * 1.0

In [None]:
policy_Σ

In [None]:
using Pkg
Pkg.add("Plots")

In [None]:
using JLD

In [None]:
reward_hist

In [None]:
mean(reward_hist[end-100-100:end-100])

In [None]:
using JLD
save("stats.jld","rewards",reward_hist)

In [None]:
rh = load("stats.jld")

In [None]:
using Pkg
Pkg.activate("~/envs/test")

In [None]:
using JLD
using Plots

In [None]:
rh

In [None]:
policy_Σ

In [None]:
i = 1
if i == 1
    a = 3
else
    b = 5
end

In [None]:
using OpenAIGym
env = GymEnv(:Pendulum, :v0)
for i ∈ 1:20
  T = 0
  R = run_episode(env, RandomPolicy()) do (s, a, r, s′)
    render(env)
    T += 1
  end
  @info("Episode $i finished after $T steps. Total reward: $R")
end