In [1]:
import tensorflow as tf
import numpy as np
import gym
from collections import deque
import random
import cv2


from sklearn.base import BaseEstimator, ClassifierMixin
from sklearn.exceptions import NotFittedError




In [5]:
from sklearn.base import BaseEstimator, ClassifierMixin
from sklearn.exceptions import NotFittedError



class DeepQNN:
    '''
    episodes - NUMBER OF GAMES
    gamma - discount rate
    epsilon - exploration rate
    epsilon_decay - decrease the number of explorations
    epsilon_min - lower epsilon
    lr - learning rate
    '''
    def __init__(self, env, episodes = 5000 , gamma = 0.98, epsilon = 1, epsilon_decay=0.995, epsilon_min=0.05, lr=0.001, random_state=42):
    
        
        self.gamma = gamma
        self.epsilon = epsilon
        self.epsilon_decay = epsilon_decay
        self.epsilon_min = epsilon_min
        self.lr = lr
        self.random_state = random_state
        self.n_actions = env.action_space.n
        self.env = env
        self.batch_size = 100
        self.episodes = episodes
        self.model_params = None
        
        self.activation_fn = tf.nn.elu
        self.weights_initializer = tf.contrib.layers.variance_scaling_initializer()
        self.optimizer = tf.train.AdamOptimizer
        
        self._graph = None
        self._session = None
        self.training_op = None
        self.model = None
        self.init = None
        self.saver = None
        
        # Memory used for replaying actions
        '''
        using this memory improve stability. NN tends to forget previous actions learned, so the memory
        allows a esxperience replay
        '''
        self.memmory = deque()
        
        if self.random_state is not None:
            tf.set_random_seed(self.random_state)
            np.random.seed(self.random_state)
            
        self.build_dnn()
            
    def build_dnn(self):
        #Reset Tensorflow Graph
        tf.reset_default_graph()
        tf.set_random_seed(self.random_state)
        np.random.seed(self.random_state)
        
        self._graph = tf.Graph()
        with self._graph.as_default():
            n_conv_filters = 32

            X = tf.placeholder(tf.float32, shape=(None, 64, 64, 1),name= 'state')
            y = tf.placeholder(tf.float32, shape=(None), name='quality')
            self._X, self._y = X, y
            self.training = tf.placeholder_with_default(False, shape=[], name='training')

            conv_one = tf.layers.conv2d(X,filters= 16, kernel_size=5, strides=1,
                                    padding= "SAME", activation= tf.nn.relu, name="conv1"
                                   ,kernel_initializer = tf.contrib.layers.xavier_initializer_conv2d())
            conv_two = tf.layers.conv2d(conv_one,filters= 32, kernel_size=5, strides=1,
                                    padding= "SAME", activation= tf.nn.relu, name="conv1"
                                   ,kernel_initializer = tf.contrib.layers.xavier_initializer_conv2d())
            conv_three = tf.layers.conv2d(conv_three,filters= 32, kernel_size=5, strides=1,
                                    padding= "SAME", activation= tf.nn.relu, name="conv1"
                                   ,kernel_initializer = tf.contrib.layers.xavier_initializer_conv2d())
            #with tf.name_scope("pool"):
            #    pool = tf.nn.max_pool(conv, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding="VALID")
            #    pool_flat = tf.reshape(pool, shape=[-1, n_conv_filters * 32 * 32])

            with tf.name_scope("fc"):
                fc1 = tf.layers.dense(conv_three, 50, activation=tf.nn.relu, name="fc1"
                                      , kernel_initializer = tf.contrib.layers.xavier_initializer())
                #fc1_dropout = tf.layers.dropout(fc1, 0.5, training = self.training)
                fc2 = tf.layers.dense(fc1, 28, activation=tf.nn.relu,name="fc2"
                                      ,kernel_initializer = tf.contrib.layers.xavier_initializer())
                #fc2_dropout = tf.layers.dropout(fc2, 0.5, training = self.training)
                # Dense with linear activation function
                self.model = tf.layers.dense(fc2, self.n_actions,name="fc3"
                                            ,kernel_initializer = tf.contrib.layers.xavier_initializer())

            with tf.name_scope("train"):
                loss = tf.losses.mean_squared_error(self._y, self.model)
                #loss = tf.reduce_mean(tf.squared_difference(x=self.model,y=self._y))
                optimizer = tf.train.AdamOptimizer(0.001)
                self.training_op = optimizer.minimize(loss, name = "training")

            with tf.name_scope("init_and_save"):
                self.init = tf.global_variables_initializer()
                self.saver = tf.train.Saver()
            
        self._session = tf.Session(graph=self._graph)
       
            
    def remember_transition(self,state, action, reward, new_state, end):
        
        self.memmory.append((state, action, reward, new_state, end))
        
    def minibatch_sample(self):
        return random.sample(self.memmory, self.batch_size)
    
    def predict(self,state):
        with self._session.as_default() as sess:
            return self.model.eval(feed_dict={self._X: state, self.training:False})
    
    def select_action(self, state):
        if np.random.rand() <= self.epsilon:
            return random.randrange(self.n_actions)
        predict = self.predict(state)[0]
        print('Action ',predict)
        #print('Predicted ',np.argmax(predict))
        return np.argmax(predict)

    def experience_learing(self):
        '''
        minibatch = random.sample(self.memmory, self.batch_size)
        for state, action, reward, next_state, end in minibatch:
            target = reward
            if not end:
                target = reward + self.gamma * np.amax(self.predict(next_state)[0])
            target_f = self.predict(state)[0]
            target_f[action] = target         

            with self._session.as_default() as sess:
                sess.run(self.training_op, feed_dict={self._X: state, self._y: target_f, self.training: True})
        if self.epsilon > self.epsilon_min:
            self.epsilon *= self.epsilon_decay
        '''
    
        states = self.minibatch_sample()
        inputs = np.zeros((self.batch_size, 64, 64, 1))
        targets = np.zeros((self.batch_size, self.n_actions))
        for i in range(len(states)):
            state = states[i][0]
            action = states[i][1] 
            reward = states[i][2]
            new_state = states[i][3]
            end = states[i][4]
            # Bellman equation
            inputs[i: i+1] = state
            quality = reward + self.gamma * np.amax(self.predict(new_state)[0])
            if end:
                quality = reward
            targets[i] = self.predict(state)
            targets[i][action] = quality
            
        with self._session.as_default() as sess:
            sess.run(self.training_op, feed_dict={self._X: inputs, self._y: targets, self.training: True})
            
        if self.epsilon > self.epsilon_min:
            self.epsilon *= self.epsilon_decay
        
         
    def state_transformation(self, state):
        state = cv2.cvtColor(np.asarray(state), cv2.COLOR_BGR2GRAY)
        state = cv2.resize(state,(64,64))   
        return state.reshape(1,64,64,1)
    
    def get_model_params(self):
        gvars = tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES)
        return {gvar.op.name: value for gvar, value in zip(gvars, tf.get_default_session().run(gvars))}

    def restore_model_params(self, model_params):
        gvar_names = list(model_params.keys())
        assign_ops = {gvar_name: tf.get_default_graph().get_operation_by_name(gvar_name + "/Assign") for gvar_name in gvar_names}
        init_values = {gvar_name: assign_op.inputs[1] for gvar_name, assign_op in assign_ops.items()}
        feed_dict = {init_values[gvar_name]: model_params[gvar_name] for gvar_name in gvar_names}
        tf.get_default_session().run(assign_ops, feed_dict=feed_dict)

    
    def train(self):
        interactions = 50
        state_size = self.env.observation_space.shape[0]
        with self._session.as_default() as sess:
            self.init.run()
        end = False
        max_iterations = 0
        for e in range(self.episodes):
            state = self.env.reset()
            state = self.env.render(mode='rgb_array')
            state = self.state_transformation(state)
            next_state = self.env.render(mode='rgb_array')
            next_state = self.state_transformation(next_state)
            state = next_state - state
            for iteration in range(interactions):
                action = self.select_action(state)
                
                next_state, reward, end, _ = env.step(action)
                
                pix  = self.env.render(mode='rgb_array')
                next_state = self.state_transformation(pix)
                reward = reward 
                if end:
                    reward = - 20
                self.remember_transition(state, action, reward, next_state, end)
                state = next_state - state
                if end:
                    print("Episode: %d/%d, score: %d" % (e, self.episodes, iteration))
                    max_iterations = iteration if iteration > max_iterations else max_iterations
                    break

            if len(self.memmory) > self.batch_size:
                self.experience_learing()
    

        print("Best Number of Iterations: %d" % (max_iterations))
        
        with tf.Session() as sess:
            saver.save(sess, "./openai.ckpt")  
            
    

In [6]:
env = gym.make('CartPole-v1')
q_dnn= DeepQNN(env)

[2017-09-09 23:27:46,994] Making new env: CartPole-v1


In [7]:
q_dnn.train()

Episode: 0/5000, score: 34
Episode: 1/5000, score: 14
Episode: 2/5000, score: 12
Episode: 3/5000, score: 14
Episode: 4/5000, score: 9
Episode: 5/5000, score: 10
Episode: 6/5000, score: 20
Episode: 7/5000, score: 15
Episode: 8/5000, score: 16
('Action ', array([ 479.99401855,  991.01940918], dtype=float32))
Episode: 9/5000, score: 24
Episode: 11/5000, score: 19
('Action ', array([ 1685.76013184,  1589.12036133], dtype=float32))
Episode: 12/5000, score: 34
Episode: 13/5000, score: 19
('Action ', array([ 15.87574768,  22.55971336], dtype=float32))
('Action ', array([ 15.87574768,  22.55971336], dtype=float32))
Episode: 14/5000, score: 29
Episode: 15/5000, score: 13
Episode: 16/5000, score: 11
('Action ', array([ 2116.35498047,  2379.27612305], dtype=float32))
Episode: 17/5000, score: 15
Episode: 18/5000, score: 8
('Action ', array([ 4.76414633,  6.49000645], dtype=float32))
Episode: 19/5000, score: 14
('Action ', array([ 103.20011902,  168.3939209 ], dtype=float32))
('Action ', array([ 15

('Action ', array([ 21.420681  ,  16.91902733], dtype=float32))
('Action ', array([ 109.53536224,   87.21315765], dtype=float32))
Episode: 55/5000, score: 16
('Action ', array([ 8.00273037,  7.05934811], dtype=float32))
('Action ', array([ 20.04801369,  14.84325027], dtype=float32))
('Action ', array([ 115.81833649,  104.39067841], dtype=float32))
('Action ', array([ 20.58901024,  15.28993797], dtype=float32))
('Action ', array([ 67.95163727,  57.82685471], dtype=float32))
('Action ', array([ 194.91279602,  172.57699585], dtype=float32))
Episode: 56/5000, score: 17
('Action ', array([ 7.87844658,  6.48337317], dtype=float32))
('Action ', array([ 253.21440125,  247.40992737], dtype=float32))
('Action ', array([ 19.36530113,  14.25833321], dtype=float32))
('Action ', array([ 274.05203247,  272.8543396 ], dtype=float32))
('Action ', array([ 18.80971909,  13.88068962], dtype=float32))
('Action ', array([ 289.61560059,  288.46102905], dtype=float32))
Episode: 57/5000, score: 14
('Action ', 

('Action ', array([ 9.28314114,  8.96770668], dtype=float32))
('Action ', array([ 18.84135246,  25.35431671], dtype=float32))
('Action ', array([ 6.89704275,  7.21175146], dtype=float32))
('Action ', array([ 41.24547577,  48.24634171], dtype=float32))
('Action ', array([ 6.70179319,  7.04249525], dtype=float32))
Episode: 79/5000, score: 13
('Action ', array([ 8.53751373,  7.58058643], dtype=float32))
('Action ', array([ 8.53751373,  7.58058643], dtype=float32))
('Action ', array([ 34.09414291,  44.71681976], dtype=float32))
('Action ', array([ 47.32713699,  75.97531128], dtype=float32))
Episode: 80/5000, score: 14
('Action ', array([ 8.59424305,  7.63444376], dtype=float32))
('Action ', array([ 8.61464787,  7.64462519], dtype=float32))
('Action ', array([ 8.63943005,  7.67865229], dtype=float32))
('Action ', array([ 8.65764141,  7.74193811], dtype=float32))
('Action ', array([ 8.6467638 ,  7.72793436], dtype=float32))
('Action ', array([ 14.72539902,  37.80562592], dtype=float32))
Epis

('Action ', array([  1.93504024, -10.35224056], dtype=float32))
('Action ', array([ 7.47400522,  7.91003036], dtype=float32))
('Action ', array([ 0.32024756, -3.74196124], dtype=float32))
('Action ', array([ 7.47400522,  7.91003036], dtype=float32))
('Action ', array([ 2.42044592, -5.60129738], dtype=float32))
('Action ', array([ 7.67265177,  8.15355873], dtype=float32))
('Action ', array([ -8.84461403, -18.63695717], dtype=float32))
('Action ', array([ 6.49471331,  6.96485138], dtype=float32))
Episode: 98/5000, score: 19
('Action ', array([ 7.20691967,  7.88528967], dtype=float32))
('Action ', array([ -5.74539948, -20.62147903], dtype=float32))
('Action ', array([ -4.98998165, -19.82498741], dtype=float32))
('Action ', array([ -5.08535862, -19.95446587], dtype=float32))
('Action ', array([ 6.80881596,  7.38135386], dtype=float32))
('Action ', array([ -4.85743809, -19.16453171], dtype=float32))
('Action ', array([ 4.82264042,  6.23323107], dtype=float32))
('Action ', array([ -5.7455453

('Action ', array([ 8.05488396,  1.28637958], dtype=float32))
('Action ', array([ 9.65868282,  7.85893965], dtype=float32))
('Action ', array([ 7.8378973 ,  7.00028372], dtype=float32))
('Action ', array([  6.44580269,  12.78207302], dtype=float32))
Episode: 117/5000, score: 10
('Action ', array([ 9.97087479,  8.02729893], dtype=float32))
('Action ', array([ 10.00219917,   8.06366634], dtype=float32))
('Action ', array([  4.63868809,  13.24110794], dtype=float32))
('Action ', array([ 9.96229744,  8.10399055], dtype=float32))
('Action ', array([ 7.20900774,  6.87234211], dtype=float32))
('Action ', array([ 13.52307034,  20.97317314], dtype=float32))
('Action ', array([ 13.22270393,  18.32433891], dtype=float32))
Episode: 118/5000, score: 10
('Action ', array([ 10.47512341,   8.12368584], dtype=float32))
('Action ', array([ 10.43745518,   8.10307312], dtype=float32))
('Action ', array([ 10.6683197 ,  23.60266876], dtype=float32))
Episode: 119/5000, score: 11
('Action ', array([ 10.247236

('Action ', array([ 1.10208762, -1.93777537], dtype=float32))
('Action ', array([ 9.59268665,  8.47491741], dtype=float32))
('Action ', array([ 9.59268665,  8.47491741], dtype=float32))
('Action ', array([ 7.10204315,  2.89959621], dtype=float32))
('Action ', array([  8.02512264,  12.69942379], dtype=float32))
('Action ', array([  8.1800909 ,  14.10128689], dtype=float32))
('Action ', array([ 9.6085844 ,  8.68640804], dtype=float32))
('Action ', array([  7.81107807,  15.70880413], dtype=float32))
('Action ', array([  6.86334181,  13.44564342], dtype=float32))
('Action ', array([ 9.56935215,  8.69750977], dtype=float32))
('Action ', array([  9.30302811,  10.65332699], dtype=float32))
('Action ', array([ 9.08580875,  8.62574196], dtype=float32))
('Action ', array([ 10.460289  ,  11.94629574], dtype=float32))
('Action ', array([ 10.31953335,  11.92636395], dtype=float32))
('Action ', array([ 6.32962894,  7.12609768], dtype=float32))
('Action ', array([ 5.55625439,  6.66464233], dtype=floa

('Action ', array([ 1.33779383, -1.66097522], dtype=float32))
('Action ', array([ 9.96911335,  8.95589066], dtype=float32))
('Action ', array([ 8.97572803,  8.25191593], dtype=float32))
Episode: 147/5000, score: 10
('Action ', array([ 9.92816925,  8.95414352], dtype=float32))
('Action ', array([ 1.36234081, -1.62556303], dtype=float32))
('Action ', array([ 10.05194664,   9.01413059], dtype=float32))
('Action ', array([  9.13741875,  10.03079605], dtype=float32))
('Action ', array([  8.74522495,  11.54555321], dtype=float32))
('Action ', array([ 10.38849258,   9.8557148 ], dtype=float32))
('Action ', array([ 9.91151047,  8.78470707], dtype=float32))
('Action ', array([ 8.65846157,  9.36586189], dtype=float32))
('Action ', array([ 7.18508148,  7.54304123], dtype=float32))
('Action ', array([ 9.69029236,  5.65848351], dtype=float32))
('Action ', array([ 7.22952843,  7.46937466], dtype=float32))
('Action ', array([ 7.30170631,  7.59853077], dtype=float32))
('Action ', array([  9.34013462, 

('Action ', array([ 8.96410465,  8.22708702], dtype=float32))
('Action ', array([ 5.81505823,  8.68369102], dtype=float32))
('Action ', array([ 10.40406704,   9.27688885], dtype=float32))
('Action ', array([ 9.76591969,  9.16273594], dtype=float32))
('Action ', array([ 10.89763451,  12.16571426], dtype=float32))
('Action ', array([ 9.80954266,  9.23947906], dtype=float32))
('Action ', array([ 10.32825947,  18.52260971], dtype=float32))
('Action ', array([  9.00301075,  19.01969528], dtype=float32))
Episode: 161/5000, score: 12
('Action ', array([ 10.14138317,   9.41109371], dtype=float32))
('Action ', array([ 11.23588467,   9.95089626], dtype=float32))
('Action ', array([ 11.47341824,  10.13679981], dtype=float32))
('Action ', array([ 11.26002407,  15.60414982], dtype=float32))
('Action ', array([ 10.10507679,   9.18315125], dtype=float32))
Episode: 162/5000, score: 16
('Action ', array([ 1.66415834, -1.26587868], dtype=float32))
('Action ', array([ 9.11771965,  8.36114311], dtype=floa

('Action ', array([ 8.16289902,  8.42181015], dtype=float32))
('Action ', array([ 7.73773336,  8.18694401], dtype=float32))
Episode: 174/5000, score: 43
('Action ', array([ 1.91447341, -1.09843075], dtype=float32))
('Action ', array([ 6.92277002,  0.94122183], dtype=float32))
('Action ', array([ 10.42514515,   9.59919071], dtype=float32))
('Action ', array([ 10.5941515 ,   9.76676083], dtype=float32))
('Action ', array([  7.54213572,  10.38269138], dtype=float32))
('Action ', array([ 7.9204154 ,  8.46516132], dtype=float32))
('Action ', array([ 5.08821821,  9.67819691], dtype=float32))
Episode: 175/5000, score: 11
('Action ', array([ 10.53041553,   9.78467464], dtype=float32))
('Action ', array([ 6.90782738,  4.94204235], dtype=float32))
('Action ', array([ 10.53041553,   9.78467464], dtype=float32))
('Action ', array([ 1.92731524, -1.07523334], dtype=float32))
('Action ', array([ 10.53041553,   9.78467464], dtype=float32))
('Action ', array([ 2.82555532, -0.24878868], dtype=float32))


('Action ', array([ 2.35258794, -0.80084592], dtype=float32))
('Action ', array([ 11.64428139,  10.28194046], dtype=float32))
('Action ', array([ 10.99785614,   4.07792997], dtype=float32))
('Action ', array([ 11.13704014,   5.23058271], dtype=float32))
('Action ', array([ 10.16768456,   9.20828056], dtype=float32))
Episode: 189/5000, score: 7
('Action ', array([ 2.3911624 , -0.77734274], dtype=float32))
('Action ', array([ 11.09685898,  10.09403229], dtype=float32))
('Action ', array([ 2.63264537,  0.28180322], dtype=float32))
('Action ', array([ 11.06231499,  10.09712315], dtype=float32))
('Action ', array([ 7.93338346, -0.58731431], dtype=float32))
('Action ', array([ 8.16090775,  8.62421036], dtype=float32))
('Action ', array([ 3.02080131,  3.20142388], dtype=float32))
('Action ', array([ 8.08641243,  8.59788799], dtype=float32))
('Action ', array([ 3.41708636,  3.5426867 ], dtype=float32))
('Action ', array([ 7.42612267,  8.16667175], dtype=float32))
('Action ', array([-0.02257935

('Action ', array([ 2.68763852, -0.50498033], dtype=float32))
('Action ', array([ 10.5944252 ,  10.25393391], dtype=float32))
('Action ', array([ 2.68763852, -0.50498033], dtype=float32))
('Action ', array([ 8.27480316,  9.26488209], dtype=float32))
('Action ', array([ 8.50239372,  2.38379002], dtype=float32))
('Action ', array([ 8.09742546,  9.13783932], dtype=float32))
('Action ', array([ 9.71378136,  9.23017216], dtype=float32))
('Action ', array([  7.26027346,  11.63168049], dtype=float32))
('Action ', array([ 8.45643806,  8.5140543 ], dtype=float32))
Episode: 202/5000, score: 13
('Action ', array([ 9.7646389 ,  9.37830448], dtype=float32))
('Action ', array([ 2.70975804, -0.48675072], dtype=float32))
('Action ', array([ 5.67015076,  9.62757015], dtype=float32))
('Action ', array([ 10.59077644,  10.07340813], dtype=float32))
('Action ', array([ 11.30768585,  11.72051334], dtype=float32))
('Action ', array([ 10.0744381 ,  10.02688599], dtype=float32))
('Action ', array([  8.79203129

('Action ', array([ 3.09944654, -0.30133316], dtype=float32))
('Action ', array([ 11.4850626 ,  10.74478436], dtype=float32))
('Action ', array([ 3.11540723, -0.28469416], dtype=float32))
('Action ', array([  9.54878139,  10.35457993], dtype=float32))
('Action ', array([ 10.3198328 ,  10.23455811], dtype=float32))
('Action ', array([ 10.94120789,  11.57449341], dtype=float32))
('Action ', array([ 10.34253025,  10.2538538 ], dtype=float32))
('Action ', array([ 10.94120789,  11.57449341], dtype=float32))
('Action ', array([ 10.73972797,  10.19714832], dtype=float32))
('Action ', array([ 10.5617609 ,  10.09083939], dtype=float32))
('Action ', array([ 10.14838505,  14.46231651], dtype=float32))
('Action ', array([ 10.21844769,   9.7315712 ], dtype=float32))
('Action ', array([ 7.86419439,  8.95731449], dtype=float32))
('Action ', array([ 12.18644905,  11.78378677], dtype=float32))
('Action ', array([ 7.93821478,  9.11190414], dtype=float32))
('Action ', array([ 12.00839329,  12.44157028], 

('Action ', array([ 8.87717342,  9.78015518], dtype=float32))
('Action ', array([ 11.10604858,   9.77885723], dtype=float32))
('Action ', array([ 8.89992619,  9.95255375], dtype=float32))
('Action ', array([ 10.81682682,   7.69832945], dtype=float32))
('Action ', array([  8.83669186,  10.01663494], dtype=float32))
('Action ', array([ 10.74822998,   5.62751722], dtype=float32))
('Action ', array([  8.92683887,  10.15594864], dtype=float32))
Episode: 227/5000, score: 44
('Action ', array([ 10.34243011,  10.4263773 ], dtype=float32))
('Action ', array([ 9.05081367,  0.3526555 ], dtype=float32))
('Action ', array([ 10.34243011,  10.4263773 ], dtype=float32))
('Action ', array([ 10.56208611,  10.61865997], dtype=float32))
('Action ', array([ 10.56208611,  10.61865997], dtype=float32))
('Action ', array([ 9.05993843,  0.36496171], dtype=float32))
('Action ', array([ 10.73491859,  10.53077316], dtype=float32))
('Action ', array([  8.41731644,  12.35772514], dtype=float32))
('Action ', array([

('Action ', array([ 3.67734957, -0.0149457 ], dtype=float32))
('Action ', array([ 8.87404823,  9.40331459], dtype=float32))
('Action ', array([ 8.88413048,  9.39889336], dtype=float32))
('Action ', array([ 8.91785431,  9.41181469], dtype=float32))
('Action ', array([ 2.78517628,  1.42221832], dtype=float32))
('Action ', array([ 8.91793823,  9.37007713], dtype=float32))
('Action ', array([ 2.87457061,  2.45857239], dtype=float32))
('Action ', array([ 8.92802238,  8.89090443], dtype=float32))
('Action ', array([ 3.05506396,  3.18605709], dtype=float32))
('Action ', array([ 8.90049171,  8.90764904], dtype=float32))
('Action ', array([ 5.18402719,  5.77734661], dtype=float32))
('Action ', array([ 9.54598808,  6.2623167 ], dtype=float32))
('Action ', array([ 10.83388042,   6.93082333], dtype=float32))
Episode: 234/5000, score: 18
('Action ', array([  3.72929835e+00,  -3.60054150e-03], dtype=float32))
('Action ', array([ 8.96576977,  9.43724442], dtype=float32))
('Action ', array([  3.729298

('Action ', array([ 4.05078506,  0.11825024], dtype=float32))
('Action ', array([ 4.05078506,  0.11825024], dtype=float32))
('Action ', array([ 8.97979736,  9.39253902], dtype=float32))
('Action ', array([ 4.05078506,  0.11825024], dtype=float32))
('Action ', array([ 8.97979736,  9.39253902], dtype=float32))
('Action ', array([ 5.63111067,  5.2412219 ], dtype=float32))
('Action ', array([ 8.50923729,  9.21522617], dtype=float32))
('Action ', array([ 10.22403431,   3.2038703 ], dtype=float32))
('Action ', array([ 8.63996506,  9.21939564], dtype=float32))
('Action ', array([ 9.25912762,  2.63966322], dtype=float32))
('Action ', array([ 8.6467247 ,  9.22835827], dtype=float32))
('Action ', array([ 7.98358822,  6.5575633 ], dtype=float32))
('Action ', array([ 7.27930593,  8.5294342 ], dtype=float32))
('Action ', array([ 7.98698664,  7.58626318], dtype=float32))
('Action ', array([ 7.21567678,  8.51664639], dtype=float32))
('Action ', array([ 12.78782272,   9.56253719], dtype=float32))
('Ac

('Action ', array([ 4.24914217,  0.29869202], dtype=float32))
('Action ', array([ 4.19387627,  0.43307474], dtype=float32))
('Action ', array([ 9.37250233,  9.88579655], dtype=float32))
('Action ', array([  9.65768147,  10.97406864], dtype=float32))
('Action ', array([ 8.96927357,  9.79192734], dtype=float32))
('Action ', array([  9.76823902,  10.49760914], dtype=float32))
('Action ', array([ 8.96927357,  9.79192734], dtype=float32))
('Action ', array([ 9.61550045,  9.93462467], dtype=float32))
('Action ', array([  9.966506  ,  10.88290119], dtype=float32))
('Action ', array([ 9.58278751,  9.92721081], dtype=float32))
('Action ', array([ 12.71790504,  10.97053623], dtype=float32))
('Action ', array([ 13.42124176,   6.32087755], dtype=float32))
('Action ', array([ 9.53231907,  9.29750156], dtype=float32))
('Action ', array([ 14.53313541,   5.42111254], dtype=float32))
('Action ', array([ 9.59274578,  9.36845493], dtype=float32))
('Action ', array([ 14.53313541,   5.42111254], dtype=floa

('Action ', array([ 10.43954372,   9.56223488], dtype=float32))
('Action ', array([ 10.79335403,  10.27850342], dtype=float32))
('Action ', array([ 9.07605743,  9.68539238], dtype=float32))
('Action ', array([ 11.87817192,  11.46575928], dtype=float32))
Episode: 258/5000, score: 39
('Action ', array([ 4.60813618,  0.42754638], dtype=float32))
('Action ', array([ 8.77173996,  9.15082741], dtype=float32))
('Action ', array([ 1.92599583,  1.55050468], dtype=float32))
('Action ', array([ 8.73106575,  9.11241436], dtype=float32))
('Action ', array([ 8.69503689,  9.62924194], dtype=float32))
('Action ', array([ 8.72011566,  9.13596725], dtype=float32))
('Action ', array([ 1.63740027,  5.65071106], dtype=float32))
('Action ', array([ 8.98072624,  9.13646698], dtype=float32))
('Action ', array([ 9.6307106 ,  8.75637817], dtype=float32))
('Action ', array([ 11.8325367 ,   9.91632462], dtype=float32))
('Action ', array([ 9.68417931,  8.7164278 ], dtype=float32))
('Action ', array([ 11.68498516, 

('Action ', array([ 8.81626225,  7.38393831], dtype=float32))
('Action ', array([ 6.60207558,  8.00648499], dtype=float32))
('Action ', array([ 9.19383717,  7.42969561], dtype=float32))
('Action ', array([ 6.79447079,  8.33742809], dtype=float32))
('Action ', array([ 9.22532845,  7.65064287], dtype=float32))
('Action ', array([ 8.83737278,  9.2026825 ], dtype=float32))
('Action ', array([ 8.22749805,  9.55146027], dtype=float32))
('Action ', array([ 6.63618469,  8.18655968], dtype=float32))
('Action ', array([ 8.80706501,  7.23630571], dtype=float32))
('Action ', array([ 6.69387913,  8.33569908], dtype=float32))
('Action ', array([  7.91932297,  10.41156769], dtype=float32))
('Action ', array([ 6.44897652,  8.11152554], dtype=float32))
('Action ', array([  8.48587418,  10.73143768], dtype=float32))
('Action ', array([ 8.26165295,  8.89225769], dtype=float32))
('Action ', array([ 4.86603689,  0.52971518], dtype=float32))
('Action ', array([ 9.39111423,  9.77350521], dtype=float32))
('Ac

('Action ', array([ 5.12830305,  0.64862674], dtype=float32))
('Action ', array([ 8.75731945,  8.90321541], dtype=float32))
('Action ', array([ 5.12830305,  0.64862674], dtype=float32))
('Action ', array([ 8.75731945,  8.90321541], dtype=float32))
('Action ', array([ 4.90808773,  5.1488266 ], dtype=float32))
('Action ', array([ 5.12830305,  0.64862674], dtype=float32))
('Action ', array([ 8.75731945,  8.90321541], dtype=float32))
('Action ', array([ 4.90808773,  5.1488266 ], dtype=float32))
('Action ', array([ 8.75731945,  8.90321541], dtype=float32))
('Action ', array([ 2.66926336,  1.02373517], dtype=float32))
('Action ', array([ 8.81831455,  8.91920662], dtype=float32))
('Action ', array([ 8.70600033,  8.34008312], dtype=float32))
('Action ', array([ 8.37964535,  8.24572563], dtype=float32))
('Action ', array([ 8.86275196,  5.95438957], dtype=float32))
('Action ', array([ 8.41565228,  8.29242039], dtype=float32))
('Action ', array([ 9.08498096,  8.71890831], dtype=float32))
('Action

('Action ', array([ 9.16207409,  9.63196468], dtype=float32))
('Action ', array([ 5.38012838,  0.75884902], dtype=float32))
('Action ', array([ 9.16357327,  9.66581821], dtype=float32))
('Action ', array([ 10.71511459,   7.27777719], dtype=float32))
('Action ', array([ 8.71766758,  9.48060417], dtype=float32))
('Action ', array([ 9.29551601,  7.85321856], dtype=float32))
('Action ', array([ 9.35477734,  9.55516624], dtype=float32))
('Action ', array([ 11.61456299,   6.31447649], dtype=float32))
('Action ', array([ 9.35477734,  9.55516624], dtype=float32))
('Action ', array([ 9.96484661, -0.85564774], dtype=float32))
('Action ', array([ 9.33112621,  9.54544735], dtype=float32))
('Action ', array([ 10.23961163,  -0.27323884], dtype=float32))
('Action ', array([ 9.33112621,  9.54544735], dtype=float32))
('Action ', array([ 9.24416065, -0.91271752], dtype=float32))
('Action ', array([ 9.40231609, -0.73463792], dtype=float32))
('Action ', array([ 9.40231609, -0.73463792], dtype=float32))
('

('Action ', array([ 8.60537434,  8.9884882 ], dtype=float32))
('Action ', array([ 2.6122942 , -2.33691049], dtype=float32))
('Action ', array([ 8.65401936,  8.90797424], dtype=float32))
('Action ', array([ 2.72580528, -1.46356988], dtype=float32))
('Action ', array([ 2.72580528, -1.46356988], dtype=float32))
('Action ', array([ 8.67211437,  8.93780041], dtype=float32))
('Action ', array([ 10.4110899 ,   5.21306372], dtype=float32))
('Action ', array([ 8.72305393,  8.48651791], dtype=float32))
('Action ', array([ 1.63811672,  0.1359708 ], dtype=float32))
('Action ', array([ 8.5592947 ,  8.81286335], dtype=float32))
('Action ', array([  4.52681971,  11.15942192], dtype=float32))
('Action ', array([ 9.44170094,  9.6289072 ], dtype=float32))
('Action ', array([  6.01989603,  13.71065712], dtype=float32))
('Action ', array([ 8.96107006,  9.41840076], dtype=float32))
('Action ', array([ 8.90874577,  9.33934689], dtype=float32))
('Action ', array([  9.7835722 ,  14.59570122], dtype=float32))


('Action ', array([ 8.46008301,  8.77281952], dtype=float32))
('Action ', array([ 8.46008301,  8.77281952], dtype=float32))
('Action ', array([ 7.14356709,  4.28158617], dtype=float32))
('Action ', array([ 8.46008301,  8.77281952], dtype=float32))
('Action ', array([ 8.46008301,  8.77281952], dtype=float32))
('Action ', array([ 12.33540344,   9.06533623], dtype=float32))
('Action ', array([ 8.71679306,  8.84414768], dtype=float32))
('Action ', array([ 12.3690033 ,   9.16514778], dtype=float32))
('Action ', array([ 11.269804  ,   9.14454079], dtype=float32))
('Action ', array([ 8.71679306,  8.84414768], dtype=float32))
('Action ', array([ 11.269804  ,   9.14454079], dtype=float32))
('Action ', array([ 11.269804  ,   9.14454079], dtype=float32))
('Action ', array([ 8.21686935,  8.1483736 ], dtype=float32))
('Action ', array([ 11.52819061,   7.52446127], dtype=float32))
('Action ', array([ 8.2213707 ,  8.14614105], dtype=float32))
('Action ', array([ 12.05110359,   9.12248802], dtype=floa

('Action ', array([ 6.21688986,  1.2213285 ], dtype=float32))
('Action ', array([ 8.76433563,  9.53153419], dtype=float32))
('Action ', array([ 9.77395058,  2.56578398], dtype=float32))
('Action ', array([ 8.4853363 ,  2.72677565], dtype=float32))
('Action ', array([ 7.93224716,  9.1023035 ], dtype=float32))
('Action ', array([ 7.34601593,  3.03589964], dtype=float32))
('Action ', array([ 6.94743633,  3.2507453 ], dtype=float32))
('Action ', array([ 8.04306602,  9.32853699], dtype=float32))
('Action ', array([ 4.09582996,  3.68898153], dtype=float32))
('Action ', array([ 7.69301987,  8.83275318], dtype=float32))
('Action ', array([ 5.97357845,  7.67104197], dtype=float32))
Episode: 304/5000, score: 13
('Action ', array([ 8.45351601,  8.74517918], dtype=float32))
('Action ', array([ 2.01697803,  3.35436583], dtype=float32))
('Action ', array([ 1.62693143,  3.88189459], dtype=float32))
('Action ', array([ 8.55802155,  8.80632877], dtype=float32))
('Action ', array([ 8.42198753,  8.236350

('Action ', array([ 9.82282257,  4.9992156 ], dtype=float32))
('Action ', array([ 8.47391701,  9.88160896], dtype=float32))
('Action ', array([ 7.71479416,  6.22149038], dtype=float32))
('Action ', array([ 8.13666916,  8.75840187], dtype=float32))
('Action ', array([ 7.14853477,  7.16817999], dtype=float32))
('Action ', array([ 8.49482918,  9.15410709], dtype=float32))
('Action ', array([ 7.62914276,  8.55250931], dtype=float32))
('Action ', array([ 6.40333462,  6.59843969], dtype=float32))
Episode: 312/5000, score: 44
('Action ', array([ 6.60251522,  1.39845383], dtype=float32))
('Action ', array([ 8.48561001,  9.53162479], dtype=float32))
('Action ', array([ 11.41157246,   8.71313095], dtype=float32))
('Action ', array([ 8.48561001,  9.53162479], dtype=float32))
('Action ', array([ 11.41157246,   8.71313095], dtype=float32))
('Action ', array([ 8.48561001,  9.53162479], dtype=float32))
('Action ', array([ 8.48561001,  9.53162479], dtype=float32))
('Action ', array([ 9.98204327,  7.00

('Action ', array([ 6.81359196,  1.56460059], dtype=float32))
('Action ', array([ 8.46371841,  8.69159794], dtype=float32))
('Action ', array([ 12.75286674,   7.05361366], dtype=float32))
('Action ', array([ 8.46371841,  8.69159794], dtype=float32))
('Action ', array([ 12.75286674,   7.05361366], dtype=float32))
('Action ', array([ 8.46371841,  8.69159794], dtype=float32))
('Action ', array([ 12.75286674,   7.05361366], dtype=float32))
('Action ', array([ 11.66822529,   6.06623745], dtype=float32))
('Action ', array([ 8.63306046,  8.82532692], dtype=float32))
('Action ', array([ 9.81877804,  8.15932655], dtype=float32))
('Action ', array([ 8.90911484,  9.50521564], dtype=float32))
('Action ', array([ 8.26724625,  6.4335537 ], dtype=float32))
('Action ', array([ 8.67444229,  9.35343838], dtype=float32))
('Action ', array([ 8.46209908,  9.30853462], dtype=float32))
('Action ', array([ 9.23110962,  4.91165733], dtype=float32))
('Action ', array([ 8.53418922,  9.43379688], dtype=float32))


('Action ', array([ 6.93709421,  1.77160573], dtype=float32))
('Action ', array([ 8.76193047,  9.45955086], dtype=float32))
('Action ', array([ 8.76193047,  9.45955086], dtype=float32))
('Action ', array([ 6.93709421,  1.77160573], dtype=float32))
('Action ', array([ 8.48441315,  8.66592216], dtype=float32))
('Action ', array([ 5.36959362,  1.69050467], dtype=float32))
('Action ', array([ 6.24740934,  6.37150431], dtype=float32))
('Action ', array([ 8.40372849,  8.32651234], dtype=float32))
('Action ', array([ 7.29987955,  6.09157801], dtype=float32))
('Action ', array([ 6.5324769 ,  7.22945356], dtype=float32))
Episode: 324/5000, score: 13
('Action ', array([ 6.96518564,  1.79923844], dtype=float32))
('Action ', array([ 8.37356567,  8.3950386 ], dtype=float32))
('Action ', array([ 5.37759542,  6.08590555], dtype=float32))
('Action ', array([ 8.46707916,  8.40389729], dtype=float32))
('Action ', array([ 6.22542477,  7.32435274], dtype=float32))
('Action ', array([ 8.46707916,  8.403897

('Action ', array([ 8.14216042,  8.24289417], dtype=float32))
('Action ', array([ 6.87357807,  6.51093388], dtype=float32))
('Action ', array([ 8.14216042,  8.24289417], dtype=float32))
('Action ', array([ 6.87357807,  6.51093388], dtype=float32))
('Action ', array([ 8.14216042,  8.24289417], dtype=float32))
('Action ', array([ 10.20746613,   9.44102192], dtype=float32))
('Action ', array([ 8.14216042,  8.24289417], dtype=float32))
('Action ', array([ 7.73528957,  9.18796253], dtype=float32))
('Action ', array([ 7.83185196,  8.10058498], dtype=float32))
('Action ', array([  7.99471807,  10.45627689], dtype=float32))
('Action ', array([ 8.01683998,  8.18406296], dtype=float32))
('Action ', array([  7.59761763,  10.26798153], dtype=float32))
('Action ', array([ 7.98749352,  8.13142204], dtype=float32))
('Action ', array([ 8.2096405 ,  8.47194004], dtype=float32))
('Action ', array([ 8.13223648,  7.72526169], dtype=float32))
('Action ', array([ 5.91586018,  5.60877323], dtype=float32))
('

('Action ', array([ 7.78786516,  7.9330492 ], dtype=float32))
('Action ', array([ 10.94485569,   6.26611042], dtype=float32))
('Action ', array([ 7.78786516,  7.9330492 ], dtype=float32))
('Action ', array([ 10.94485569,   6.26611042], dtype=float32))
('Action ', array([ 7.78786516,  7.9330492 ], dtype=float32))
('Action ', array([ 7.80742121,  7.92079353], dtype=float32))
('Action ', array([ 9.10208035,  7.26348972], dtype=float32))
('Action ', array([ 5.06484747,  1.97365654], dtype=float32))
('Action ', array([ 7.75823641,  7.94708252], dtype=float32))
('Action ', array([ 3.04062819,  2.99747372], dtype=float32))
('Action ', array([ 2.12348485,  1.73980796], dtype=float32))
('Action ', array([ 7.80096292,  8.02850533], dtype=float32))
('Action ', array([ 6.01902246,  7.1536932 ], dtype=float32))
('Action ', array([ 2.95187306,  1.71502006], dtype=float32))
('Action ', array([ 7.79044199,  8.08397388], dtype=float32))
('Action ', array([ 2.91442037,  1.7695359 ], dtype=float32))
('Ac

('Action ', array([ 8.73267746,  9.30826378], dtype=float32))
('Action ', array([ 8.9596014 ,  5.09729862], dtype=float32))
('Action ', array([ 8.78241539,  4.30386066], dtype=float32))
('Action ', array([ 8.6732502 ,  9.43554401], dtype=float32))
('Action ', array([ 7.22981262,  2.11567593], dtype=float32))
('Action ', array([ 8.6732502 ,  9.43554401], dtype=float32))
('Action ', array([ 7.52123022,  3.86340046], dtype=float32))
('Action ', array([ 8.82088089,  9.52304077], dtype=float32))
('Action ', array([ 7.75158072,  2.675107  ], dtype=float32))
('Action ', array([ 8.75824356,  9.60046673], dtype=float32))
('Action ', array([ 9.02588654,  3.89688969], dtype=float32))
('Action ', array([ 8.75189972,  9.6180172 ], dtype=float32))
('Action ', array([ 9.47272968,  4.02000523], dtype=float32))
('Action ', array([ 8.73984146,  9.56963539], dtype=float32))
('Action ', array([ 10.24663353,   3.18519306], dtype=float32))
('Action ', array([ 9.69551659,  3.88349628], dtype=float32))
Episod

('Action ', array([ 10.34314537,   1.78905118], dtype=float32))
('Action ', array([ 7.41091347,  6.96112537], dtype=float32))
('Action ', array([ 10.69202709,   2.2752459 ], dtype=float32))
('Action ', array([ 7.38768196,  6.94270039], dtype=float32))
('Action ', array([ 10.84021664,   3.6901896 ], dtype=float32))
('Action ', array([ 7.43364143,  7.12547684], dtype=float32))
('Action ', array([ 6.48884869,  1.53647244], dtype=float32))
('Action ', array([ 7.11494637,  6.83681297], dtype=float32))
('Action ', array([ 8.31838989,  7.63759136], dtype=float32))
('Action ', array([ 7.86321735,  3.01791024], dtype=float32))
('Action ', array([ 7.77138042,  2.2725718 ], dtype=float32))
('Action ', array([ 6.75917435,  7.09267712], dtype=float32))
('Action ', array([ 7.3442297 ,  1.89221203], dtype=float32))
('Action ', array([ 8.36724472,  8.23722553], dtype=float32))
('Action ', array([ 8.78815842,  8.49790764], dtype=float32))
Episode: 348/5000, score: 48
('Action ', array([ 7.49983358,  2.

('Action ', array([ 7.493608  ,  2.65978169], dtype=float32))
('Action ', array([ 8.71794701,  9.41647816], dtype=float32))
('Action ', array([ 7.57247686,  2.64723635], dtype=float32))
('Action ', array([ 8.71794701,  9.41647816], dtype=float32))
('Action ', array([ 5.90174627,  3.00066733], dtype=float32))
('Action ', array([ 8.71794701,  9.41647816], dtype=float32))
('Action ', array([ 5.90174627,  3.00066733], dtype=float32))
('Action ', array([ 8.71794701,  9.41647816], dtype=float32))
('Action ', array([ 6.18247461,  3.19869399], dtype=float32))
('Action ', array([ 6.18247461,  3.19869399], dtype=float32))
('Action ', array([ 8.71794701,  9.41647816], dtype=float32))
('Action ', array([ 7.12920475,  7.49636078], dtype=float32))
('Action ', array([ 8.71794701,  9.41647816], dtype=float32))
('Action ', array([ 8.71794701,  9.41647816], dtype=float32))
('Action ', array([ 9.08881187,  6.95256042], dtype=float32))
('Action ', array([ 8.7901535 ,  9.07450008], dtype=float32))
('Action

('Action ', array([ 5.40735912,  3.22963691], dtype=float32))
('Action ', array([ 9.87945461,  9.87999153], dtype=float32))
('Action ', array([ 5.71909142,  2.10360312], dtype=float32))
('Action ', array([ 9.92154408,  9.85018921], dtype=float32))
('Action ', array([ 5.93124008,  4.57218122], dtype=float32))
('Action ', array([ 9.90911388,  9.83429718], dtype=float32))
('Action ', array([ 5.93124008,  4.57218122], dtype=float32))
('Action ', array([ 9.95255756,  9.84338474], dtype=float32))
('Action ', array([ 7.17621994,  9.02298355], dtype=float32))
('Action ', array([ 9.26208019,  9.09874916], dtype=float32))
('Action ', array([ 7.46274757,  8.58942413], dtype=float32))
('Action ', array([ 9.25801754,  9.41883659], dtype=float32))
('Action ', array([ 7.84175014,  8.67056656], dtype=float32))
Episode: 361/5000, score: 47
('Action ', array([ 7.50265074,  2.81110668], dtype=float32))
('Action ', array([ 8.49960136,  9.03852844], dtype=float32))
('Action ', array([ 9.1734581 ,  3.798337

('Action ', array([ 7.55345058,  3.03417206], dtype=float32))
('Action ', array([ 11.57907391,   2.35003448], dtype=float32))
('Action ', array([ 8.66893959,  9.27981091], dtype=float32))
('Action ', array([ 11.84741974,   5.04550695], dtype=float32))
('Action ', array([ 8.64993286,  9.28801155], dtype=float32))
('Action ', array([ 12.21787739,   9.52490044], dtype=float32))
('Action ', array([ 12.55594063,   8.38874245], dtype=float32))
('Action ', array([ 8.67496681,  9.26720047], dtype=float32))
('Action ', array([ 12.00207424,   7.18735647], dtype=float32))
('Action ', array([ 8.55763817,  8.94557285], dtype=float32))
('Action ', array([ 7.06166697,  2.56419921], dtype=float32))
('Action ', array([ 8.53447342,  8.9374752 ], dtype=float32))
('Action ', array([ 7.70057535,  1.37169814], dtype=float32))
('Action ', array([ 8.42006874,  8.87998295], dtype=float32))
Episode: 368/5000, score: 15
('Action ', array([ 7.55485821,  3.07413101], dtype=float32))
('Action ', array([ 8.33609009,

('Action ', array([ 4.11495066, -1.31025684], dtype=float32))
('Action ', array([ 7.85785246,  8.75179768], dtype=float32))
('Action ', array([ 3.33989477, -1.0803107 ], dtype=float32))
('Action ', array([ 8.65280247,  8.60539818], dtype=float32))
('Action ', array([ 4.49340391, -2.45646644], dtype=float32))
('Action ', array([ 8.75763226,  8.69932365], dtype=float32))
('Action ', array([ 8.73265362,  0.73310488], dtype=float32))
('Action ', array([ 8.9434557 ,  8.67418003], dtype=float32))
('Action ', array([ 14.30075359,   5.35393906], dtype=float32))
Episode: 374/5000, score: 40
('Action ', array([ 7.56332159,  3.26528716], dtype=float32))
('Action ', array([ 8.27533245,  8.99535084], dtype=float32))
('Action ', array([ 8.1867609 ,  9.05374146], dtype=float32))
('Action ', array([ 8.18363857,  9.0600338 ], dtype=float32))
('Action ', array([ 8.162467  ,  9.06478786], dtype=float32))
('Action ', array([ 8.32615471,  7.10320282], dtype=float32))
('Action ', array([ 8.14173603,  9.0882

('Action ', array([ 6.77191734,  5.790555  ], dtype=float32))
('Action ', array([ 7.0543499 ,  7.21008682], dtype=float32))
('Action ', array([ 5.60450745,  3.57319736], dtype=float32))
Episode: 380/5000, score: 32
('Action ', array([ 7.6491971 ,  3.35394526], dtype=float32))
('Action ', array([ 8.19280529,  8.96092319], dtype=float32))
('Action ', array([ 7.6491971 ,  3.35394526], dtype=float32))
('Action ', array([ 8.19280529,  8.96092319], dtype=float32))
('Action ', array([ 7.66372681,  3.07122374], dtype=float32))
('Action ', array([ 8.19280529,  8.96092319], dtype=float32))
('Action ', array([ 10.80627537,  11.73438263], dtype=float32))
('Action ', array([ 8.19280529,  8.96092319], dtype=float32))
('Action ', array([ 7.6491971 ,  3.35394526], dtype=float32))
('Action ', array([ 8.69331264,  9.49227619], dtype=float32))
('Action ', array([ 10.3838501 ,   8.29285622], dtype=float32))
('Action ', array([ 8.39898777,  9.09464264], dtype=float32))
('Action ', array([ 7.64319515,  4.23

('Action ', array([ 7.75234318,  3.41671228], dtype=float32))
('Action ', array([ 8.04126072,  8.91055298], dtype=float32))
('Action ', array([ 9.72856045,  4.20656586], dtype=float32))
('Action ', array([ 8.03959751,  8.92251015], dtype=float32))
('Action ', array([ 5.01380396,  3.21032977], dtype=float32))
('Action ', array([ 8.02052402,  8.95551014], dtype=float32))
('Action ', array([  6.99499512,  10.08388424], dtype=float32))
('Action ', array([ 8.06132412,  8.94986534], dtype=float32))
('Action ', array([ 3.33885837,  3.3240993 ], dtype=float32))
('Action ', array([ 8.02845669,  9.03086853], dtype=float32))
('Action ', array([ 3.60397458,  4.37369823], dtype=float32))
('Action ', array([ 8.02564907,  9.06704712], dtype=float32))
('Action ', array([ 4.63644314,  2.64099383], dtype=float32))
('Action ', array([ 8.05510044,  9.11082363], dtype=float32))
('Action ', array([ 7.92605591,  5.84863949], dtype=float32))
('Action ', array([ 7.55066109,  9.22432613], dtype=float32))
Episod

('Action ', array([ 8.52504635,  9.1118021 ], dtype=float32))
('Action ', array([ 9.81074238,  6.72665358], dtype=float32))
('Action ', array([ 8.51726627,  9.10377026], dtype=float32))
('Action ', array([ 8.79735374,  5.33812284], dtype=float32))
('Action ', array([ 8.51726627,  9.10377026], dtype=float32))
('Action ', array([ 7.47888756,  3.11234808], dtype=float32))
('Action ', array([ 7.19655848,  1.55998755], dtype=float32))
('Action ', array([ 8.51907825,  9.13152218], dtype=float32))
('Action ', array([ 8.51117992,  9.12958241], dtype=float32))
('Action ', array([ 8.49738407,  1.60099936], dtype=float32))
('Action ', array([  9.72225285,  10.17713356], dtype=float32))
('Action ', array([ 10.28861141,   3.44057989], dtype=float32))
('Action ', array([ 9.11107731,  9.8524971 ], dtype=float32))
('Action ', array([ 11.29554272,   4.56274176], dtype=float32))
('Action ', array([ 8.59884357,  8.6101532 ], dtype=float32))
('Action ', array([ 8.60594845,  8.56820965], dtype=float32))
('

('Action ', array([ 8.37480354,  9.05490875], dtype=float32))
('Action ', array([ 10.36215878,   4.31729317], dtype=float32))
('Action ', array([ 8.37480354,  9.05490875], dtype=float32))
('Action ', array([ 7.15409946,  4.73111725], dtype=float32))
('Action ', array([ 8.37480354,  9.05490875], dtype=float32))
('Action ', array([ 7.71612883,  7.25810432], dtype=float32))
('Action ', array([ 8.41243553,  9.06012535], dtype=float32))
('Action ', array([ 9.24808502,  6.59922981], dtype=float32))
('Action ', array([ 8.41243553,  9.06012535], dtype=float32))
('Action ', array([ 8.77451229,  4.96987724], dtype=float32))
('Action ', array([ 8.46945   ,  9.36097145], dtype=float32))
('Action ', array([ 9.16004372,  5.19361305], dtype=float32))
('Action ', array([ 8.45951271,  9.30484486], dtype=float32))
('Action ', array([ 9.35598469,  5.01470375], dtype=float32))
('Action ', array([ 8.57095718,  9.48225594], dtype=float32))
('Action ', array([ 9.27546883,  4.9890461 ], dtype=float32))
('Acti

('Action ', array([ 7.89999914,  3.94578147], dtype=float32))
('Action ', array([ 8.07262802,  8.19885921], dtype=float32))
('Action ', array([ 7.8748889,  7.7864728], dtype=float32))
('Action ', array([ 8.10475731,  8.22846603], dtype=float32))
('Action ', array([ 7.66335821,  8.56983948], dtype=float32))
('Action ', array([ 8.08654404,  8.25204659], dtype=float32))
('Action ', array([ 6.55836344,  7.15480089], dtype=float32))
('Action ', array([  8.03472328,  13.15639114], dtype=float32))
('Action ', array([ 7.71307993,  7.67149496], dtype=float32))
('Action ', array([ 6.15549994,  6.6604619 ], dtype=float32))
('Action ', array([ 6.61177683,  5.01955748], dtype=float32))
('Action ', array([ 6.12630033,  6.61145639], dtype=float32))
('Action ', array([ 6.57233191,  4.24121428], dtype=float32))
('Action ', array([ 6.03638411,  6.70117712], dtype=float32))
('Action ', array([ 6.69503355,  7.07042837], dtype=float32))
('Action ', array([ 7.36133909,  3.20663428], dtype=float32))
('Action

('Action ', array([ 5.65995359,  6.52315664], dtype=float32))
('Action ', array([ 7.02000093,  8.97029209], dtype=float32))
('Action ', array([ 5.52191782,  6.42974997], dtype=float32))
('Action ', array([ 3.74065614,  6.99851751], dtype=float32))
('Action ', array([ 6.18912458,  6.80901861], dtype=float32))
Episode: 408/5000, score: 35
('Action ', array([ 7.92857265,  4.02611399], dtype=float32))
('Action ', array([ 8.32236862,  4.00710297], dtype=float32))
('Action ', array([ 8.12904358,  8.65899563], dtype=float32))
('Action ', array([ 9.41068363,  0.82958901], dtype=float32))
('Action ', array([ 8.11073875,  8.48073959], dtype=float32))
('Action ', array([ 4.29942179,  5.05029583], dtype=float32))
('Action ', array([ 8.34070015,  8.24055672], dtype=float32))
('Action ', array([-2.12864089,  0.08639064], dtype=float32))
Episode: 409/5000, score: 10
('Action ', array([ 7.92764473,  4.04405022], dtype=float32))
('Action ', array([ 8.19918442,  9.04183769], dtype=float32))
('Action ', 

('Action ', array([ 8.00215721,  4.17029238], dtype=float32))
('Action ', array([ 8.5951128 ,  9.11364174], dtype=float32))
('Action ', array([ 8.16974068,  9.38075733], dtype=float32))
('Action ', array([ 8.5951128 ,  9.11364174], dtype=float32))
('Action ', array([ 9.11613941,  3.25401688], dtype=float32))
('Action ', array([ 8.13546085,  8.19292355], dtype=float32))
('Action ', array([ 7.17747116,  3.26376629], dtype=float32))
('Action ', array([ 8.19829941,  8.16607094], dtype=float32))
('Action ', array([ 8.19829941,  8.16607094], dtype=float32))
('Action ', array([ 6.90924072,  5.76625347], dtype=float32))
('Action ', array([ 8.12127209,  8.18764305], dtype=float32))
('Action ', array([ 10.12632275,   8.90392971], dtype=float32))
('Action ', array([ 8.11483383,  8.18697834], dtype=float32))
('Action ', array([ 7.72993088,  6.93696117], dtype=float32))
('Action ', array([ 6.83499718,  7.39649105], dtype=float32))
('Action ', array([ 7.53938293,  6.63946056], dtype=float32))
('Acti

('Action ', array([ 4.38228416,  2.02910829], dtype=float32))
('Action ', array([ 7.46311283,  7.9893074 ], dtype=float32))
('Action ', array([ 5.61156845,  2.65275025], dtype=float32))
('Action ', array([ 7.60403538,  8.10404778], dtype=float32))
Episode: 420/5000, score: 33
('Action ', array([ 8.09552956,  4.2668128 ], dtype=float32))
('Action ', array([ 8.06351566,  8.05575466], dtype=float32))
('Action ', array([ 8.55087376,  6.04369879], dtype=float32))
('Action ', array([ 8.07032585,  8.06537724], dtype=float32))
('Action ', array([  9.80648327,  11.29360962], dtype=float32))
('Action ', array([ 7.91923666,  7.94854879], dtype=float32))
('Action ', array([ 9.90879154,  9.18421173], dtype=float32))
('Action ', array([ 7.47430468,  7.70710135], dtype=float32))
('Action ', array([ 9.44943905,  7.24522829], dtype=float32))
('Action ', array([ 7.45618391,  7.7139802 ], dtype=float32))
('Action ', array([ 9.28425312,  6.90892839], dtype=float32))
Episode: 421/5000, score: 11
('Action '

('Action ', array([ 8.11619663,  4.36817884], dtype=float32))
('Action ', array([ 8.1955719 ,  8.80121803], dtype=float32))
('Action ', array([ 8.19562912,  8.81247234], dtype=float32))
('Action ', array([ 10.09941673,   9.58780766], dtype=float32))
('Action ', array([ 8.52312088,  8.69375229], dtype=float32))
('Action ', array([ 9.19938087,  9.44950199], dtype=float32))
('Action ', array([ 8.52312088,  8.69375229], dtype=float32))
('Action ', array([ 10.40459824,   9.12588978], dtype=float32))
('Action ', array([ 8.53004265,  8.76886082], dtype=float32))
('Action ', array([ 10.06834793,  10.36541462], dtype=float32))
('Action ', array([ 8.52396202,  8.95455933], dtype=float32))
('Action ', array([ 9.57810593,  9.31562901], dtype=float32))
('Action ', array([ 8.41122627,  8.66889286], dtype=float32))
('Action ', array([ 8.77816582,  9.16999912], dtype=float32))
('Action ', array([ 8.44031143,  8.6575613 ], dtype=float32))
Episode: 427/5000, score: 15
('Action ', array([ 8.10426044,  4.

('Action ', array([ 9.14974689,  9.06861019], dtype=float32))
('Action ', array([ 2.98066235,  4.0059762 ], dtype=float32))
('Action ', array([ 8.94401646,  8.94849682], dtype=float32))
('Action ', array([ 9.44379902,  8.67927933], dtype=float32))
Episode: 432/5000, score: 35
('Action ', array([ 8.19907188,  8.03905392], dtype=float32))
('Action ', array([ 6.66203213,  6.54575443], dtype=float32))
('Action ', array([ 7.63156176,  8.20047092], dtype=float32))
('Action ', array([ 6.58069563,  7.01770973], dtype=float32))
('Action ', array([ 7.47326136,  7.92031002], dtype=float32))
('Action ', array([ 6.58069563,  7.01770973], dtype=float32))
('Action ', array([ 7.47042227,  8.38680363], dtype=float32))
('Action ', array([ 6.58371782,  7.02004528], dtype=float32))
('Action ', array([ 8.65642929,  8.27372837], dtype=float32))
('Action ', array([ 8.03191948,  7.9793663 ], dtype=float32))
('Action ', array([ 8.78719616,  6.89830112], dtype=float32))
('Action ', array([ 8.02836132,  8.008766

('Action ', array([ 8.12151527,  8.19341564], dtype=float32))
('Action ', array([ 6.60203743,  7.68989277], dtype=float32))
('Action ', array([ 8.61229515,  8.37450886], dtype=float32))
('Action ', array([ 6.51038265,  7.61726475], dtype=float32))
('Action ', array([ 8.84856224,  8.58947945], dtype=float32))
('Action ', array([ 6.42815113,  7.58388996], dtype=float32))
('Action ', array([ 7.646595  ,  7.42201233], dtype=float32))
('Action ', array([ 6.00788307,  4.63129902], dtype=float32))
('Action ', array([ 7.50458336,  7.44847584], dtype=float32))
('Action ', array([ 6.18163776,  3.51479053], dtype=float32))
('Action ', array([ 7.57150841,  7.93145847], dtype=float32))
Episode: 438/5000, score: 41
('Action ', array([ 8.18768406,  4.6700058 ], dtype=float32))
('Action ', array([ 8.47552586,  8.87602043], dtype=float32))
('Action ', array([ 9.69438934,  6.10262728], dtype=float32))
('Action ', array([ 8.45625019,  8.88208675], dtype=float32))
('Action ', array([ 8.46387959,  8.881703

('Action ', array([ 8.25699997,  4.79438305], dtype=float32))
('Action ', array([ 8.32238197,  8.9955616 ], dtype=float32))
('Action ', array([ 8.25699997,  4.79438305], dtype=float32))
('Action ', array([ 8.32238197,  8.9955616 ], dtype=float32))
('Action ', array([ 8.25699997,  4.79438305], dtype=float32))
('Action ', array([ 8.33431435,  8.97080708], dtype=float32))
('Action ', array([ 8.25699997,  4.79438305], dtype=float32))
('Action ', array([ 8.34348106,  8.9559288 ], dtype=float32))
('Action ', array([ 9.61268234,  6.80248117], dtype=float32))
('Action ', array([ 8.35328484,  8.93902111], dtype=float32))
('Action ', array([ 11.78759861,  11.26748848], dtype=float32))
('Action ', array([ 8.24050331,  8.95553398], dtype=float32))
('Action ', array([ 11.50186348,  10.9372654 ], dtype=float32))
('Action ', array([ 8.20256424,  8.91017342], dtype=float32))
('Action ', array([ 11.48940563,  12.90155411], dtype=float32))
('Action ', array([ 8.12742043,  8.93358612], dtype=float32))
('

('Action ', array([ 8.33650112,  4.97372484], dtype=float32))
('Action ', array([ 8.31406307,  8.98505592], dtype=float32))
('Action ', array([ 8.33650112,  4.97372484], dtype=float32))
('Action ', array([ 8.31406307,  8.98505592], dtype=float32))
('Action ', array([ 9.49186039,  7.14763403], dtype=float32))
('Action ', array([ 8.31406307,  8.98505592], dtype=float32))
('Action ', array([ 9.49186039,  7.14763403], dtype=float32))
('Action ', array([ 8.31406307,  8.98505592], dtype=float32))
('Action ', array([ 9.49186039,  7.14763403], dtype=float32))
('Action ', array([ 8.31406307,  8.98505592], dtype=float32))
('Action ', array([ 9.49186039,  7.14763403], dtype=float32))
('Action ', array([ 8.31078625,  8.98568916], dtype=float32))
('Action ', array([ 11.11895084,  11.07822704], dtype=float32))
('Action ', array([ 11.03135586,  10.89582729], dtype=float32))
('Action ', array([ 8.31078625,  8.98568916], dtype=float32))
('Action ', array([ 8.31078625,  8.98568916], dtype=float32))
('Ac

('Action ', array([ 8.33162689,  5.14578056], dtype=float32))
('Action ', array([ 8.32914162,  9.05102253], dtype=float32))
('Action ', array([ 8.33162689,  5.14578056], dtype=float32))
('Action ', array([ 8.32914162,  9.05102253], dtype=float32))
('Action ', array([ 8.32914162,  9.05102253], dtype=float32))
('Action ', array([ 9.68224335,  6.75660849], dtype=float32))
('Action ', array([ 11.25912762,  12.06312847], dtype=float32))
('Action ', array([ 10.90791416,   7.92446804], dtype=float32))
('Action ', array([ 10.16530323,   7.34889889], dtype=float32))
('Action ', array([ 11.60071945,  11.67467213], dtype=float32))
('Action ', array([ 8.20431137,  9.14407349], dtype=float32))
('Action ', array([ 10.29095459,  11.2746172 ], dtype=float32))
('Action ', array([ 8.2993288 ,  8.79618931], dtype=float32))
('Action ', array([ 8.02068901,  9.0928297 ], dtype=float32))
('Action ', array([ 7.83417082,  6.74963474], dtype=float32))
('Action ', array([ 7.21613741,  7.75518036], dtype=float32)

('Action ', array([ 8.54936695,  9.17123985], dtype=float32))
('Action ', array([ 8.56832027,  9.0946579 ], dtype=float32))
('Action ', array([ 4.35199308,  0.23647033], dtype=float32))
('Action ', array([ 8.12115002,  8.73549557], dtype=float32))
('Action ', array([ 3.94081831,  2.47629261], dtype=float32))
('Action ', array([ 7.88601732,  8.61517525], dtype=float32))
('Action ', array([ 2.95014334,  2.67022038], dtype=float32))
Episode: 464/5000, score: 38
('Action ', array([ 8.32923412,  5.2480526 ], dtype=float32))
('Action ', array([ 8.30109215,  9.0797596 ], dtype=float32))
('Action ', array([ 8.32923412,  5.2480526 ], dtype=float32))
('Action ', array([ 8.30109215,  9.0797596 ], dtype=float32))
('Action ', array([ 10.24772549,  11.18513966], dtype=float32))
('Action ', array([ 8.30109215,  9.0797596 ], dtype=float32))
('Action ', array([ 10.24772549,  11.18513966], dtype=float32))
('Action ', array([ 10.05892372,  10.38193035], dtype=float32))
('Action ', array([ 8.51329231,  9.

('Action ', array([ 8.36301041,  5.31462526], dtype=float32))
('Action ', array([ 8.60905552,  9.17370224], dtype=float32))
('Action ', array([ 9.39109898,  6.33381462], dtype=float32))
('Action ', array([ 10.70478058,   4.8901329 ], dtype=float32))
('Action ', array([ 8.6410284 ,  9.17664528], dtype=float32))
('Action ', array([ 9.93801975,  4.8810215 ], dtype=float32))
('Action ', array([ 8.6410284 ,  9.17664528], dtype=float32))
('Action ', array([ 7.63973904,  3.5920372 ], dtype=float32))
('Action ', array([ 8.6467123 ,  9.17686176], dtype=float32))
('Action ', array([ 7.76328564,  2.89113617], dtype=float32))
('Action ', array([ 8.50417423,  9.05249882], dtype=float32))
('Action ', array([ 7.92112589,  3.28606796], dtype=float32))
('Action ', array([ 8.50417423,  9.05249882], dtype=float32))
('Action ', array([ 7.86733532,  3.3039856 ], dtype=float32))
('Action ', array([ 8.53636074,  9.22281265], dtype=float32))
('Action ', array([ 5.67715883,  4.13116074], dtype=float32))
('Acti

('Action ', array([ 8.42020893,  5.447124  ], dtype=float32))
('Action ', array([ 8.62289429,  9.22647476], dtype=float32))
('Action ', array([ 10.56656551,   8.92338753], dtype=float32))
('Action ', array([ 8.62289429,  9.22647476], dtype=float32))
('Action ', array([ 10.40443802,   5.94764376], dtype=float32))
('Action ', array([ 10.05575085,   6.06929064], dtype=float32))
('Action ', array([ 8.74908829,  9.711133  ], dtype=float32))
('Action ', array([ 9.92684174,  6.98673677], dtype=float32))
('Action ', array([ 8.73937607,  9.73640823], dtype=float32))
('Action ', array([ 8.83988762,  8.10077667], dtype=float32))
('Action ', array([ 8.73112297,  9.79604721], dtype=float32))
('Action ', array([ 9.40779495,  8.18085861], dtype=float32))
('Action ', array([ 8.52700233,  9.76585197], dtype=float32))
('Action ', array([ 8.82213116,  9.0260582 ], dtype=float32))
('Action ', array([ 8.14864159,  8.99780178], dtype=float32))
('Action ', array([ 4.54638386,  6.73490191], dtype=float32))
('

('Action ', array([ 4.6593914 ,  1.75786054], dtype=float32))
Episode: 480/5000, score: 30
('Action ', array([ 8.38066292,  5.57964897], dtype=float32))
('Action ', array([ 8.53685856,  9.25139523], dtype=float32))
('Action ', array([ 12.12261105,   5.28566456], dtype=float32))
('Action ', array([ 8.54266453,  9.25725937], dtype=float32))
('Action ', array([ 11.81973648,   6.03746891], dtype=float32))
('Action ', array([ 8.54266453,  9.25725937], dtype=float32))
('Action ', array([ 11.81695843,   6.03088856], dtype=float32))
('Action ', array([ 8.0477457 ,  8.80854702], dtype=float32))
('Action ', array([ 11.81695843,   6.03088856], dtype=float32))
('Action ', array([ 8.0477457 ,  8.80854702], dtype=float32))
('Action ', array([ 11.69582272,   5.91160297], dtype=float32))
('Action ', array([ 8.0477457 ,  8.80854702], dtype=float32))
('Action ', array([ 11.69582272,   5.91160297], dtype=float32))
('Action ', array([ 8.0370512 ,  8.80916214], dtype=float32))
('Action ', array([ 11.695822

('Action ', array([ 8.33140278,  5.72082233], dtype=float32))
('Action ', array([ 8.29384613,  9.24031448], dtype=float32))
('Action ', array([ 7.64252043,  9.76698875], dtype=float32))
('Action ', array([ 8.29003525,  9.32270145], dtype=float32))
('Action ', array([  6.8814435 ,  10.71482754], dtype=float32))
('Action ', array([ 8.67055893,  9.71885872], dtype=float32))
('Action ', array([  6.69122648,  10.54098034], dtype=float32))
('Action ', array([  6.60786581,  10.50986767], dtype=float32))
('Action ', array([ 8.43386459,  8.64150524], dtype=float32))
('Action ', array([  5.95038652,  10.98153973], dtype=float32))
('Action ', array([ 6.48843718,  7.04861736], dtype=float32))
Episode: 487/5000, score: 12
('Action ', array([ 8.3410387 ,  5.73590231], dtype=float32))
('Action ', array([ 8.84639549,  9.74575806], dtype=float32))
('Action ', array([ 8.84639549,  9.74575806], dtype=float32))
('Action ', array([ 8.3410387 ,  5.73590231], dtype=float32))
('Action ', array([ 8.55026436,  

('Action ', array([ 8.40079403,  9.17691612], dtype=float32))
('Action ', array([ 8.447855  ,  5.81700039], dtype=float32))
('Action ', array([ 8.40079403,  9.17691612], dtype=float32))
('Action ', array([ 8.447855  ,  5.81700039], dtype=float32))
('Action ', array([ 8.40079403,  9.17691612], dtype=float32))
('Action ', array([ 8.447855  ,  5.81700039], dtype=float32))
('Action ', array([ 8.40079403,  9.17691612], dtype=float32))
('Action ', array([ 9.20606899,  6.36726856], dtype=float32))
('Action ', array([ 8.40079403,  9.17691612], dtype=float32))
('Action ', array([ 9.20606899,  6.36726856], dtype=float32))
('Action ', array([ 8.40079403,  9.17691612], dtype=float32))
('Action ', array([ 10.15673542,   6.74319649], dtype=float32))
('Action ', array([ 8.40079403,  9.17691612], dtype=float32))
('Action ', array([  8.71449757,  10.33613586], dtype=float32))
('Action ', array([  9.9549818 ,  10.30772591], dtype=float32))
('Action ', array([ 8.82225895,  9.45240021], dtype=float32))
('

('Action ', array([ 8.44271564,  5.8780632 ], dtype=float32))
('Action ', array([ 8.54204178,  8.45533466], dtype=float32))
('Action ', array([ 10.01346874,   9.18078709], dtype=float32))
('Action ', array([ 8.56505203,  8.46771812], dtype=float32))
('Action ', array([ 10.59178734,  10.63134384], dtype=float32))
('Action ', array([ 11.30075932,   7.55874634], dtype=float32))
('Action ', array([ 8.44612122,  8.35016251], dtype=float32))
('Action ', array([ 11.41666126,   7.47826385], dtype=float32))
('Action ', array([ 8.90292358,  8.60011292], dtype=float32))
('Action ', array([ 6.95075178,  1.7047503 ], dtype=float32))
('Action ', array([ 8.97994041,  8.68004799], dtype=float32))
Episode: 500/5000, score: 11
('Action ', array([ 8.44342899,  5.89389038], dtype=float32))
('Action ', array([ 8.79198837,  9.38408184], dtype=float32))
('Action ', array([ 10.29679489,   7.03121376], dtype=float32))
('Action ', array([ 8.79198837,  9.38408184], dtype=float32))
('Action ', array([ 10.14999008

('Action ', array([ 8.41616917,  8.56106377], dtype=float32))
('Action ', array([ 9.87513065,  9.83163548], dtype=float32))
('Action ', array([ 8.41976452,  8.57678413], dtype=float32))
('Action ', array([  9.66937733,  11.78557682], dtype=float32))
('Action ', array([ 8.52313519,  8.07671261], dtype=float32))
('Action ', array([ 6.87963533,  7.04362059], dtype=float32))
('Action ', array([ 5.00080156,  6.38630342], dtype=float32))
('Action ', array([ 6.74972677,  6.95417452], dtype=float32))
('Action ', array([ 4.52875185,  5.10704088], dtype=float32))
('Action ', array([ 5.96571779,  6.355762  ], dtype=float32))
('Action ', array([ 5.2881856 ,  6.95117235], dtype=float32))
('Action ', array([ 7.39995432,  8.12533855], dtype=float32))
Episode: 507/5000, score: 13
('Action ', array([ 8.52539349,  6.05873346], dtype=float32))
('Action ', array([ 8.43082523,  9.29368114], dtype=float32))
('Action ', array([ 8.52539349,  6.05873346], dtype=float32))
('Action ', array([ 8.43082523,  9.2936

('Action ', array([ 8.63596058,  6.12791395], dtype=float32))
('Action ', array([ 8.87587833,  9.79006481], dtype=float32))
('Action ', array([ 9.41629696,  6.06804419], dtype=float32))
('Action ', array([ 8.87587833,  9.79006481], dtype=float32))
('Action ', array([ 9.41629696,  6.06804419], dtype=float32))
('Action ', array([ 8.87587833,  9.79006481], dtype=float32))
('Action ', array([ 11.65248585,  10.27813148], dtype=float32))
('Action ', array([ 8.87587833,  9.79006481], dtype=float32))
('Action ', array([ 11.65248585,  10.27813148], dtype=float32))
('Action ', array([ 8.87587833,  9.79006481], dtype=float32))
('Action ', array([ 11.74413013,  10.31448936], dtype=float32))
('Action ', array([ 8.39280415,  9.25109291], dtype=float32))
('Action ', array([ 10.47586155,  10.50650024], dtype=float32))
('Action ', array([ 8.39280415,  9.25109291], dtype=float32))
('Action ', array([ 11.74413013,  10.31448936], dtype=float32))
('Action ', array([ 11.75216007,  10.32307243], dtype=float3

('Action ', array([ 8.66487312,  6.24078417], dtype=float32))
('Action ', array([ 8.39635563,  9.33576393], dtype=float32))
('Action ', array([ 8.66487312,  6.24078417], dtype=float32))
('Action ', array([ 8.39635563,  9.33576393], dtype=float32))
('Action ', array([ 8.66487312,  6.24078417], dtype=float32))
('Action ', array([ 8.39635563,  9.33576393], dtype=float32))
('Action ', array([ 9.41386414,  6.03448963], dtype=float32))
('Action ', array([ 8.39635563,  9.33576393], dtype=float32))
('Action ', array([ 10.00787449,  10.36278152], dtype=float32))
('Action ', array([ 8.39635563,  9.33576393], dtype=float32))
('Action ', array([ 8.66487312,  6.24078417], dtype=float32))
('Action ', array([ 11.15811634,   9.4224844 ], dtype=float32))
('Action ', array([ 8.63792896,  9.49540043], dtype=float32))
('Action ', array([ 9.82218838,  5.70619583], dtype=float32))
('Action ', array([ 8.37777233,  6.8838501 ], dtype=float32))
('Action ', array([ 8.29043102,  8.53104305], dtype=float32))
('Ac

('Action ', array([ 8.69261169,  6.33174896], dtype=float32))
('Action ', array([ 8.81841469,  9.47618294], dtype=float32))
('Action ', array([ 10.88302231,   7.7890892 ], dtype=float32))
('Action ', array([ 8.75481987,  9.47494221], dtype=float32))
('Action ', array([ 12.13581467,   8.86756516], dtype=float32))
('Action ', array([ 8.73819542,  9.51541519], dtype=float32))
('Action ', array([ 12.15317154,   8.88534546], dtype=float32))
('Action ', array([ 8.6897068 ,  9.53212547], dtype=float32))
('Action ', array([ 10.37299728,   9.39190865], dtype=float32))
('Action ', array([ 8.36145592,  9.55261421], dtype=float32))
('Action ', array([ 10.40704918,   6.85343361], dtype=float32))
('Action ', array([ 8.32938766,  9.54687119], dtype=float32))
('Action ', array([ 10.05737686,   6.69849205], dtype=float32))
('Action ', array([ 8.31606102,  9.51148987], dtype=float32))
('Action ', array([ 9.70708179,  6.68398857], dtype=float32))
('Action ', array([ 8.11664963,  9.19647312], dtype=float3

('Action ', array([ 8.77468777,  6.3923254 ], dtype=float32))
('Action ', array([ 8.93154144,  9.84895325], dtype=float32))
('Action ', array([ 8.87844658,  6.41498137], dtype=float32))
('Action ', array([ 8.93154144,  9.84895325], dtype=float32))
('Action ', array([ 10.15019512,   6.9268589 ], dtype=float32))
('Action ', array([ 8.79661179,  9.66666794], dtype=float32))
('Action ', array([ 10.09487057,   6.88232231], dtype=float32))
('Action ', array([ 8.79661179,  9.66666794], dtype=float32))
('Action ', array([ 10.54231453,   9.62586975], dtype=float32))
('Action ', array([ 8.79661179,  9.66666794], dtype=float32))
('Action ', array([ 10.54231453,   9.62586975], dtype=float32))
('Action ', array([ 8.79661179,  9.66666794], dtype=float32))
('Action ', array([ 10.67301178,   9.70849991], dtype=float32))
('Action ', array([ 9.00614738,  9.60473061], dtype=float32))
('Action ', array([ 10.88053799,  10.73941803], dtype=float32))
('Action ', array([ 8.99614906,  9.63856983], dtype=float3

('Action ', array([ 8.81345558,  6.46660757], dtype=float32))
('Action ', array([ 8.84532833,  9.37168217], dtype=float32))
('Action ', array([ 10.34466457,   5.06101847], dtype=float32))
('Action ', array([ 8.84532833,  9.37168217], dtype=float32))
('Action ', array([ 11.38635159,   6.56395197], dtype=float32))
('Action ', array([ 8.84351635,  9.37052155], dtype=float32))
('Action ', array([ 11.50382519,   6.52204561], dtype=float32))
('Action ', array([ 8.84351635,  9.37052155], dtype=float32))
('Action ', array([ 10.02481365,   5.71521044], dtype=float32))
('Action ', array([ 8.84208202,  9.37061977], dtype=float32))
('Action ', array([ 10.02481365,   5.71521044], dtype=float32))
('Action ', array([ 8.84208202,  9.37061977], dtype=float32))
('Action ', array([ 10.18225193,   5.78271151], dtype=float32))
('Action ', array([ 8.84208202,  9.37061977], dtype=float32))
('Action ', array([ 11.14293194,   7.89698839], dtype=float32))
('Action ', array([ 8.84208202,  9.37061977], dtype=floa

('Action ', array([ 8.81632042,  6.55333853], dtype=float32))
('Action ', array([ 8.54351425,  9.2430315 ], dtype=float32))
('Action ', array([ 8.81632042,  6.55333853], dtype=float32))
('Action ', array([ 8.54351425,  9.2430315 ], dtype=float32))
('Action ', array([ 8.81632042,  6.55333853], dtype=float32))
('Action ', array([ 8.54351425,  9.2430315 ], dtype=float32))
('Action ', array([ 8.81632042,  6.55333853], dtype=float32))
('Action ', array([ 8.54351425,  9.2430315 ], dtype=float32))
('Action ', array([ 8.81632042,  6.55333853], dtype=float32))
('Action ', array([ 8.54351425,  9.2430315 ], dtype=float32))
('Action ', array([ 9.42963505,  7.59000158], dtype=float32))
('Action ', array([ 8.54351425,  9.2430315 ], dtype=float32))
('Action ', array([ 9.42963505,  7.59000158], dtype=float32))
('Action ', array([ 8.54351425,  9.2430315 ], dtype=float32))
('Action ', array([  9.74953079,  10.68530083], dtype=float32))
('Action ', array([ 8.54351425,  9.2430315 ], dtype=float32))
('Acti

('Action ', array([ 8.7874794 ,  6.66748524], dtype=float32))
('Action ', array([ 8.623106 ,  8.4626255], dtype=float32))
('Action ', array([ 9.49054623,  9.41030121], dtype=float32))
('Action ', array([ 8.80137444,  9.16396332], dtype=float32))
('Action ', array([ 8.24066162,  9.06213188], dtype=float32))
('Action ', array([ 8.35968399,  8.78298092], dtype=float32))
('Action ', array([ 8.73588848,  7.37044907], dtype=float32))
('Action ', array([ 8.35968399,  8.78298092], dtype=float32))
('Action ', array([ 5.88682842,  9.49740982], dtype=float32))
('Action ', array([ 8.36055183,  8.92013359], dtype=float32))
('Action ', array([  5.21301746,  10.5123291 ], dtype=float32))
('Action ', array([ 8.52456474,  9.33777237], dtype=float32))
('Action ', array([ 6.30739212,  8.81240082], dtype=float32))
('Action ', array([ 8.19061184,  8.411973  ], dtype=float32))
('Action ', array([ 8.39156532,  6.83742905], dtype=float32))
('Action ', array([ 8.17724228,  8.38774586], dtype=float32))
('Action

('Action ', array([ 8.89508343,  6.69239044], dtype=float32))
('Action ', array([ 10.18942738,   9.75396061], dtype=float32))
('Action ', array([ 8.85514545,  9.09872246], dtype=float32))
('Action ', array([ 10.02981472,  10.47992611], dtype=float32))
('Action ', array([ 8.82117176,  9.18232536], dtype=float32))
('Action ', array([  9.95655727,  11.01847363], dtype=float32))
('Action ', array([ 10.11732197,  11.33450603], dtype=float32))
('Action ', array([ 8.64708424,  9.27367401], dtype=float32))
('Action ', array([ 10.12215424,  12.34884548], dtype=float32))
('Action ', array([ 8.60365963,  9.25144386], dtype=float32))
('Action ', array([  9.96609497,  11.64386272], dtype=float32))
('Action ', array([ 8.75983715,  7.7988081 ], dtype=float32))
('Action ', array([  9.25030708,  10.96500301], dtype=float32))
('Action ', array([ 9.28442669,  8.31681347], dtype=float32))
('Action ', array([ 6.36209536,  3.71132541], dtype=float32))
('Action ', array([ 9.42741871,  8.31397724], dtype=floa

('Action ', array([ 8.88257313,  6.7761693 ], dtype=float32))
('Action ', array([ 8.83034134,  8.61311054], dtype=float32))
('Action ', array([ 10.68445492,  10.45153904], dtype=float32))
('Action ', array([ 8.60213661,  8.49742126], dtype=float32))
('Action ', array([ 10.42545795,   9.62938976], dtype=float32))
('Action ', array([ 7.70392799,  7.95792866], dtype=float32))
('Action ', array([ 10.21542549,   9.56524372], dtype=float32))
('Action ', array([ 7.70301914,  7.95889378], dtype=float32))
('Action ', array([  9.67231369,  10.55293751], dtype=float32))
('Action ', array([ 6.24729633,  6.42751503], dtype=float32))
('Action ', array([ 8.63266945,  8.54297352], dtype=float32))
('Action ', array([ 6.37975407,  6.43873215], dtype=float32))
('Action ', array([  9.83711815,  10.94142628], dtype=float32))
('Action ', array([ 6.72300911,  6.38681602], dtype=float32))
('Action ', array([  8.9133215 ,  10.85065937], dtype=float32))
('Action ', array([ 8.321455  ,  7.45562077], dtype=float3

('Action ', array([ 8.91711521,  6.86576128], dtype=float32))
('Action ', array([ 8.79759502,  8.5646534 ], dtype=float32))
('Action ', array([ 9.80128002,  7.84375   ], dtype=float32))
('Action ', array([ 8.80112934,  8.50965881], dtype=float32))
('Action ', array([ 11.1722517 ,   9.33486557], dtype=float32))
('Action ', array([ 8.75442982,  8.8298502 ], dtype=float32))
('Action ', array([ 10.77302265,   9.68393517], dtype=float32))
('Action ', array([ 8.84619999,  8.85993767], dtype=float32))
('Action ', array([ 10.82937431,   9.76263618], dtype=float32))
('Action ', array([ 8.6789217 ,  8.53991795], dtype=float32))
('Action ', array([ 6.19300747,  1.97702217], dtype=float32))
('Action ', array([ 8.54490376,  8.50954819], dtype=float32))
Episode: 563/5000, score: 11
('Action ', array([ 8.91111565,  6.88968277], dtype=float32))
('Action ', array([ 9.01858616,  9.43106556], dtype=float32))
('Action ', array([ 10.53338337,   5.04576015], dtype=float32))
('Action ', array([ 9.12357616,  

Episode: 568/5000, score: 32
('Action ', array([ 8.89911652,  6.99685764], dtype=float32))
('Action ', array([ 8.65917301,  8.61922646], dtype=float32))
('Action ', array([ 9.67975807,  7.4960475 ], dtype=float32))
('Action ', array([ 8.36781025,  8.41297436], dtype=float32))
('Action ', array([ 10.58234882,  10.64493656], dtype=float32))
('Action ', array([ 7.09438658,  7.6485796 ], dtype=float32))
('Action ', array([ 7.09438658,  7.6485796 ], dtype=float32))
('Action ', array([ 7.34182501,  7.8597765 ], dtype=float32))
('Action ', array([  9.55578804,  10.62640667], dtype=float32))
('Action ', array([  9.56296062,  10.07983303], dtype=float32))
('Action ', array([ 7.75165129,  8.38093853], dtype=float32))
('Action ', array([ 9.49529934,  7.42920589], dtype=float32))
('Action ', array([ 7.21032667,  7.79209423], dtype=float32))
('Action ', array([ 9.24318123,  6.28633022], dtype=float32))
Episode: 569/5000, score: 16
('Action ', array([ 8.9076004 ,  7.00374842], dtype=float32))
('Acti

('Action ', array([ 8.95935249,  7.08926535], dtype=float32))
('Action ', array([ 8.74026108,  9.39319706], dtype=float32))
('Action ', array([ 8.95935249,  7.08926535], dtype=float32))
('Action ', array([ 8.74026108,  9.39319706], dtype=float32))
('Action ', array([ 10.65103436,   6.28741646], dtype=float32))
('Action ', array([ 8.73185349,  9.39758587], dtype=float32))
('Action ', array([  8.37052727,  10.74258423], dtype=float32))
('Action ', array([ 8.73353195,  9.39836693], dtype=float32))
('Action ', array([ 8.07091331,  9.99881554], dtype=float32))
('Action ', array([ 8.63480377,  9.40795708], dtype=float32))
('Action ', array([ 7.01425266,  7.64860868], dtype=float32))
('Action ', array([ 8.63082314,  9.43044853], dtype=float32))
('Action ', array([ 7.87560081,  8.26320171], dtype=float32))
('Action ', array([ 7.37528324,  6.86593771], dtype=float32))
Episode: 577/5000, score: 14
('Action ', array([ 8.97209835,  7.09887266], dtype=float32))
('Action ', array([ 8.67978954,  8.74

('Action ', array([ 8.96511555,  7.12937737], dtype=float32))
('Action ', array([ 8.63229847,  8.73782444], dtype=float32))
('Action ', array([  9.95640755,  10.12862968], dtype=float32))
('Action ', array([ 8.68191624,  8.72457123], dtype=float32))
('Action ', array([ 9.6263504 ,  8.14924145], dtype=float32))
('Action ', array([ 8.71273899,  8.69640923], dtype=float32))
('Action ', array([ 9.56291866,  6.83071184], dtype=float32))
('Action ', array([ 8.7104311,  8.6794281], dtype=float32))
('Action ', array([ 9.57137775,  6.44865179], dtype=float32))
('Action ', array([ 8.66997051,  8.71858501], dtype=float32))
('Action ', array([ 9.25309849,  7.94351435], dtype=float32))
('Action ', array([ 8.69928837,  8.77910233], dtype=float32))
('Action ', array([ 8.25869274,  8.42107868], dtype=float32))
('Action ', array([ 8.73716068,  6.70254564], dtype=float32))
('Action ', array([ 7.94156218,  8.20435715], dtype=float32))
('Action ', array([ 8.76791096,  6.74704409], dtype=float32))
('Action

('Action ', array([ 8.94309521,  7.17226648], dtype=float32))
('Action ', array([ 8.66373158,  9.49073696], dtype=float32))
('Action ', array([ 8.94309521,  7.17226648], dtype=float32))
('Action ', array([ 8.66373158,  9.49073696], dtype=float32))
('Action ', array([ 8.94309521,  7.17226648], dtype=float32))
('Action ', array([ 8.66373158,  9.49073696], dtype=float32))
('Action ', array([ 8.94309521,  7.17226648], dtype=float32))
('Action ', array([ 8.66373158,  9.49073696], dtype=float32))
('Action ', array([ 9.45815659,  7.39633131], dtype=float32))
('Action ', array([ 8.66373158,  9.49073696], dtype=float32))
('Action ', array([ 9.53634834,  7.47989893], dtype=float32))
('Action ', array([ 8.66373158,  9.49073696], dtype=float32))
('Action ', array([ 9.53634834,  7.47989893], dtype=float32))
('Action ', array([ 8.66373158,  9.49073696], dtype=float32))
('Action ', array([ 9.44952297,  7.13025808], dtype=float32))
('Action ', array([ 8.66373158,  9.49073696], dtype=float32))
('Action

('Action ', array([ 9.01950932,  7.31115818], dtype=float32))
('Action ', array([ 8.69241333,  9.48939705], dtype=float32))
('Action ', array([ 9.78791428,  7.32006645], dtype=float32))
('Action ', array([ 8.69504738,  9.48817444], dtype=float32))
('Action ', array([ 9.71337223,  7.51905727], dtype=float32))
('Action ', array([ 9.6954689 ,  7.58323002], dtype=float32))
('Action ', array([ 8.70939827,  9.4903574 ], dtype=float32))
('Action ', array([ 9.877285  ,  8.75698566], dtype=float32))
('Action ', array([ 8.7864151 ,  9.66087341], dtype=float32))
('Action ', array([ 7.42031765,  6.03624153], dtype=float32))
('Action ', array([ 7.29768229,  8.52676964], dtype=float32))
('Action ', array([ 7.37196636,  5.31888771], dtype=float32))
('Action ', array([ 7.15694857,  8.36065292], dtype=float32))
('Action ', array([ 1.53296125,  2.98827934], dtype=float32))
('Action ', array([ 7.72877359,  8.33970356], dtype=float32))
Episode: 593/5000, score: 15
('Action ', array([ 9.05409622,  7.341129

('Action ', array([ 9.20187187,  7.4389925 ], dtype=float32))
('Action ', array([ 8.56286907,  8.66444016], dtype=float32))
('Action ', array([ 10.87581539,  14.271101  ], dtype=float32))
('Action ', array([ 8.95555019,  9.49592018], dtype=float32))
('Action ', array([ 10.87581539,  14.271101  ], dtype=float32))
('Action ', array([ 8.95555019,  9.49592018], dtype=float32))
('Action ', array([ 11.40592289,  11.87172508], dtype=float32))
('Action ', array([ 8.97840214,  8.94452763], dtype=float32))
('Action ', array([ 10.30772018,   9.74566078], dtype=float32))
('Action ', array([ 8.24685383,  8.30926514], dtype=float32))
('Action ', array([ 7.75852346,  6.72968435], dtype=float32))
('Action ', array([ 8.23135662,  8.23992443], dtype=float32))
('Action ', array([ 6.74325895,  7.59700918], dtype=float32))
Episode: 599/5000, score: 12
('Action ', array([ 9.214468  ,  7.45170116], dtype=float32))
('Action ', array([ 9.01291275,  9.59359837], dtype=float32))
('Action ', array([ 11.22473621, 

('Action ', array([ 9.17969894,  7.49373865], dtype=float32))
('Action ', array([ 8.64302063,  9.3485651 ], dtype=float32))
('Action ', array([ 9.87164497,  8.23642635], dtype=float32))
('Action ', array([ 8.78886795,  9.32800961], dtype=float32))
('Action ', array([ 10.10568619,   7.9754262 ], dtype=float32))
('Action ', array([ 9.86561394,  8.51341248], dtype=float32))
('Action ', array([ 8.81462669,  9.38594151], dtype=float32))
('Action ', array([ 11.24972439,   8.91213322], dtype=float32))
('Action ', array([ 8.81990433,  9.38776302], dtype=float32))
('Action ', array([ 11.12569237,   8.52633381], dtype=float32))
('Action ', array([ 8.70066833,  9.02541256], dtype=float32))
('Action ', array([ 8.42131042,  6.90903711], dtype=float32))
('Action ', array([ 6.83572912,  7.74786806], dtype=float32))
('Action ', array([ 7.87831306,  6.76505518], dtype=float32))
('Action ', array([ 6.74995947,  7.68715715], dtype=float32))
('Action ', array([ 8.75625706,  3.93006015], dtype=float32))
Ep

('Action ', array([ 9.15087986,  7.54303646], dtype=float32))
('Action ', array([ 8.36193562,  8.54667759], dtype=float32))
('Action ', array([ 10.0934763 ,   7.50480461], dtype=float32))
('Action ', array([ 9.95721722,  7.43783665], dtype=float32))
('Action ', array([ 8.36193562,  8.54667759], dtype=float32))
('Action ', array([ 10.34771347,   8.83092117], dtype=float32))
('Action ', array([ 8.89106274,  9.42636585], dtype=float32))
('Action ', array([ 9.81330395,  8.65698242], dtype=float32))
('Action ', array([ 8.23827267,  8.91331673], dtype=float32))
('Action ', array([ 7.50459003,  7.77748108], dtype=float32))
('Action ', array([ 8.36656857,  9.15517426], dtype=float32))
('Action ', array([ 7.25427818,  7.58317947], dtype=float32))
('Action ', array([ 8.35386753,  9.14618969], dtype=float32))
('Action ', array([ 5.1445055 ,  7.10393143], dtype=float32))
('Action ', array([ 8.19858265,  8.96170998], dtype=float32))
('Action ', array([ 5.92363358,  8.89167023], dtype=float32))
('Ac

('Action ', array([ 9.16483498,  7.59677792], dtype=float32))
('Action ', array([ 8.56205463,  9.51667213], dtype=float32))
('Action ', array([ 9.16483498,  7.59677792], dtype=float32))
('Action ', array([ 8.56205463,  9.51667213], dtype=float32))
('Action ', array([ 9.16483498,  7.59677792], dtype=float32))
('Action ', array([ 8.56205463,  9.51667213], dtype=float32))
('Action ', array([ 10.14999485,   9.85232162], dtype=float32))
('Action ', array([ 8.56205463,  9.51667213], dtype=float32))
('Action ', array([ 10.14999485,   9.85232162], dtype=float32))
('Action ', array([ 8.54380894,  9.38587475], dtype=float32))
('Action ', array([ 9.63088608,  9.09693241], dtype=float32))
('Action ', array([ 8.54930782,  9.3887043 ], dtype=float32))
('Action ', array([ 9.69855785,  8.74808502], dtype=float32))
('Action ', array([ 8.56310558,  9.44022465], dtype=float32))
('Action ', array([  9.63850975,  10.85032463], dtype=float32))
('Action ', array([ 9.82484055,  9.97558212], dtype=float32))
('

('Action ', array([ 10.5732336 ,   9.79675674], dtype=float32))
Episode: 619/5000, score: 30
('Action ', array([ 9.16909122,  7.69323301], dtype=float32))
('Action ', array([ 8.20258808,  8.66402626], dtype=float32))
('Action ', array([ 10.20867729,   7.56616259], dtype=float32))
('Action ', array([ 8.20119381,  8.66332722], dtype=float32))
('Action ', array([ 10.10406971,   8.05158424], dtype=float32))
('Action ', array([ 8.19133282,  8.65187454], dtype=float32))
('Action ', array([ 10.3891573 ,   5.84009123], dtype=float32))
('Action ', array([ 8.15839863,  8.64452076], dtype=float32))
('Action ', array([ 11.55716038,   6.76633024], dtype=float32))
('Action ', array([ 8.1748991 ,  8.67934227], dtype=float32))
('Action ', array([ 8.11339092,  6.60157728], dtype=float32))
('Action ', array([ 8.1748991 ,  8.67934227], dtype=float32))
('Action ', array([ 8.1748991 ,  8.67934227], dtype=float32))
('Action ', array([ 8.01642323,  5.73065519], dtype=float32))
('Action ', array([ 8.1748991 ,

('Action ', array([ 9.18928623,  7.74028921], dtype=float32))
('Action ', array([ 8.1794405 ,  8.63558769], dtype=float32))
('Action ', array([ 9.18928623,  7.74028921], dtype=float32))
('Action ', array([ 8.18305492,  8.63597584], dtype=float32))
('Action ', array([ 9.18928623,  7.74028921], dtype=float32))
('Action ', array([ 8.14093304,  8.64248848], dtype=float32))
('Action ', array([ 8.14093304,  8.64248848], dtype=float32))
('Action ', array([ 8.18305492,  8.63597584], dtype=float32))
('Action ', array([ 9.67390251,  8.52483177], dtype=float32))
('Action ', array([ 8.18305492,  8.63597584], dtype=float32))
('Action ', array([ 9.67390251,  8.52483177], dtype=float32))
('Action ', array([ 8.1223402 ,  8.57995415], dtype=float32))
('Action ', array([ 9.7626524 ,  9.97010994], dtype=float32))
('Action ', array([ 8.1223402 ,  8.57995415], dtype=float32))
('Action ', array([ 9.43904305,  7.81470728], dtype=float32))
('Action ', array([ 8.01204777,  8.13009262], dtype=float32))
('Action

('Action ', array([ 8.62158966,  9.31559467], dtype=float32))
('Action ', array([ 9.74220657,  6.16452551], dtype=float32))
('Action ', array([ 8.19327927,  8.43874073], dtype=float32))
('Action ', array([ 8.22626495,  6.0773139 ], dtype=float32))
('Action ', array([ 8.22488594,  8.42341995], dtype=float32))
('Action ', array([ 8.01401424,  5.88812399], dtype=float32))
('Action ', array([ 8.09806633,  8.32201385], dtype=float32))
('Action ', array([ 8.3615284 ,  4.95032644], dtype=float32))
('Action ', array([ 8.04031754,  8.28454208], dtype=float32))
('Action ', array([ 8.46438885,  5.06446218], dtype=float32))
('Action ', array([ 7.99954653,  8.25940609], dtype=float32))
Episode: 629/5000, score: 39
('Action ', array([ 9.16060543,  7.81494617], dtype=float32))
('Action ', array([ 8.47499561,  9.53992939], dtype=float32))
('Action ', array([ 9.16060543,  7.81494617], dtype=float32))
('Action ', array([ 8.47499561,  9.53992939], dtype=float32))
('Action ', array([ 9.16060543,  7.814946

('Action ', array([ 9.19559765,  7.88716412], dtype=float32))
('Action ', array([ 8.40319157,  9.54707718], dtype=float32))
('Action ', array([ 9.19559765,  7.88716412], dtype=float32))
('Action ', array([ 8.40319157,  9.54707718], dtype=float32))
('Action ', array([ 9.19559765,  7.88716412], dtype=float32))
('Action ', array([ 10.05344677,   8.49285221], dtype=float32))
('Action ', array([ 8.40319157,  9.54707718], dtype=float32))
('Action ', array([ 10.05344677,   8.49285221], dtype=float32))
('Action ', array([ 8.38348866,  9.41140461], dtype=float32))
('Action ', array([ 8.85939503,  9.47756481], dtype=float32))
('Action ', array([ 8.39748096,  9.4231081 ], dtype=float32))
('Action ', array([  8.81923771,  10.54998302], dtype=float32))
('Action ', array([ 8.58088779,  9.83192348], dtype=float32))
('Action ', array([ 6.13971472,  9.06293201], dtype=float32))
('Action ', array([ 8.37321377,  9.83615875], dtype=float32))
('Action ', array([ 6.78338289,  9.6148386 ], dtype=float32))
('

('Action ', array([ 9.18553162,  7.89152241], dtype=float32))
('Action ', array([ 8.36644745,  9.67771149], dtype=float32))
('Action ', array([ 9.18553162,  7.89152241], dtype=float32))
('Action ', array([ 8.35570145,  9.67831898], dtype=float32))
('Action ', array([ 9.18553162,  7.89152241], dtype=float32))
('Action ', array([ 8.35570145,  9.67831898], dtype=float32))
('Action ', array([ 9.18553162,  7.89152241], dtype=float32))
('Action ', array([ 8.35570145,  9.67831898], dtype=float32))
('Action ', array([ 9.49272251,  9.37905025], dtype=float32))
('Action ', array([ 8.35565758,  9.67681313], dtype=float32))
('Action ', array([ 9.49272251,  9.37905025], dtype=float32))
('Action ', array([ 8.35565758,  9.67681313], dtype=float32))
('Action ', array([ 9.51186943,  9.2922554 ], dtype=float32))
('Action ', array([ 8.35565758,  9.67681313], dtype=float32))
('Action ', array([ 9.51186943,  9.2922554 ], dtype=float32))
('Action ', array([ 8.35565758,  9.67681313], dtype=float32))
('Action

('Action ', array([ 9.2690258,  7.897048 ], dtype=float32))
('Action ', array([ 7.9535718 ,  8.73963261], dtype=float32))
('Action ', array([ 10.4234705 ,   8.71011448], dtype=float32))
('Action ', array([ 7.9535718 ,  8.73963261], dtype=float32))
('Action ', array([ 10.45491695,   8.88608837], dtype=float32))
('Action ', array([ 7.62548304,  8.57934093], dtype=float32))
('Action ', array([ 10.84621143,   8.48104382], dtype=float32))
('Action ', array([ 11.05993366,   7.49351788], dtype=float32))
('Action ', array([ 7.68193674,  8.54770279], dtype=float32))
('Action ', array([ 11.20462132,   6.92384815], dtype=float32))
('Action ', array([ 7.66894388,  8.5434618 ], dtype=float32))
('Action ', array([ 11.09640598,   6.32410908], dtype=float32))
('Action ', array([ 11.24333858,   6.48867512], dtype=float32))
('Action ', array([ 7.35600901,  8.320014  ], dtype=float32))
('Action ', array([ 11.23339844,   6.5113039 ], dtype=float32))
('Action ', array([ 7.51979303,  8.57333374], dtype=floa

('Action ', array([ 10.62157154,   8.76850414], dtype=float32))
('Action ', array([ 8.15977192,  8.33066368], dtype=float32))
('Action ', array([ 8.45863152,  7.1792593 ], dtype=float32))
('Action ', array([ 8.24908352,  8.37295055], dtype=float32))
('Action ', array([ 7.33546829,  6.47840405], dtype=float32))
('Action ', array([ 8.27603626,  8.41974354], dtype=float32))
('Action ', array([ 3.77472186,  6.36455059], dtype=float32))
Episode: 652/5000, score: 38
('Action ', array([ 9.21120071,  8.07820892], dtype=float32))
('Action ', array([ 8.31407452,  9.59006405], dtype=float32))
('Action ', array([ 10.70818615,   8.77085495], dtype=float32))
('Action ', array([ 8.35976505,  9.75975227], dtype=float32))
('Action ', array([ 10.73624897,   8.23363495], dtype=float32))
('Action ', array([ 8.36516476,  9.74128723], dtype=float32))
('Action ', array([ 10.09789944,   7.87709045], dtype=float32))
('Action ', array([ 8.36516476,  9.74128723], dtype=float32))
('Action ', array([ 10.09789944, 

('Action ', array([ 7.81463814,  7.81739378], dtype=float32))
('Action ', array([ 5.77897739,  4.69346189], dtype=float32))
('Action ', array([ 4.34003639,  2.10099387], dtype=float32))
('Action ', array([ 9.06370735,  8.91869259], dtype=float32))
('Action ', array([ 6.39325905,  4.64291334], dtype=float32))
('Action ', array([ 9.06370735,  8.91869259], dtype=float32))
('Action ', array([ 3.95866394,  3.22486854], dtype=float32))
('Action ', array([ 9.06370735,  8.91869259], dtype=float32))
('Action ', array([ 6.3617897 ,  4.61728239], dtype=float32))
('Action ', array([ 9.0598526 ,  8.92001152], dtype=float32))
('Action ', array([ 5.03788185,  3.85195899], dtype=float32))
('Action ', array([ 9.52942467,  9.3355484 ], dtype=float32))
('Action ', array([ 0.56673807,  2.14448142], dtype=float32))
Episode: 659/5000, score: 44
('Action ', array([ 9.20374489,  8.11109257], dtype=float32))
('Action ', array([ 8.46220207,  9.770854  ], dtype=float32))
('Action ', array([ 10.33385086,   7.3100

('Action ', array([ 9.27093887,  8.08534622], dtype=float32))
('Action ', array([ 8.29652596,  9.14033031], dtype=float32))
('Action ', array([ 10.05294228,   4.94819212], dtype=float32))
('Action ', array([ 8.44476318,  9.33352757], dtype=float32))
('Action ', array([ 9.98723221,  7.29682875], dtype=float32))
('Action ', array([ 8.40123177,  9.3441658 ], dtype=float32))
('Action ', array([ 8.5034008,  9.4570179], dtype=float32))
('Action ', array([ 8.84307289,  8.51612377], dtype=float32))
('Action ', array([ 8.52657509,  9.37281799], dtype=float32))
('Action ', array([  9.69590569,  11.077075  ], dtype=float32))
('Action ', array([ 8.57181549,  9.41180038], dtype=float32))
('Action ', array([ 9.44811821,  9.49639225], dtype=float32))
('Action ', array([ 8.32423973,  8.69725037], dtype=float32))
('Action ', array([ 6.43416691,  4.99562025], dtype=float32))
('Action ', array([ 6.81317329,  7.71342325], dtype=float32))
Episode: 665/5000, score: 15
('Action ', array([ 9.28692341,  8.0725

('Action ', array([ 10.2106142 ,   8.03520679], dtype=float32))
('Action ', array([ 8.42958355,  9.59204102], dtype=float32))
('Action ', array([ 10.01488113,   7.47122622], dtype=float32))
('Action ', array([ 8.21814251,  9.60116863], dtype=float32))
Episode: 671/5000, score: 33
('Action ', array([ 9.31505299,  8.06790543], dtype=float32))
('Action ', array([  8.78246498,  10.31431675], dtype=float32))
('Action ', array([ 10.97365379,   8.45526409], dtype=float32))
('Action ', array([  8.86598396,  10.44141293], dtype=float32))
('Action ', array([ 11.03240204,   8.55551815], dtype=float32))
('Action ', array([  8.88550186,  10.41618252], dtype=float32))
('Action ', array([ 8.70717049,  5.64115858], dtype=float32))
('Action ', array([ 8.2435894,  9.4313345], dtype=float32))
('Action ', array([ 4.50094175,  0.49083263], dtype=float32))
('Action ', array([ 8.18636513,  9.35966778], dtype=float32))
('Action ', array([ 4.18542147,  1.66243291], dtype=float32))
('Action ', array([ 8.2128448

('Action ', array([ 8.84655857,  9.48729038], dtype=float32))
('Action ', array([ 9.62406158,  9.52375221], dtype=float32))
('Action ', array([ 8.72673893,  9.44739342], dtype=float32))
('Action ', array([ 8.71244812,  8.4275074 ], dtype=float32))
('Action ', array([ 8.44190693,  9.43225002], dtype=float32))
Episode: 676/5000, score: 33
('Action ', array([ 9.31652451,  8.22310066], dtype=float32))
('Action ', array([ 8.542449  ,  9.27246189], dtype=float32))
('Action ', array([ 9.8688221 ,  9.15872574], dtype=float32))
('Action ', array([ 8.542449  ,  9.27246189], dtype=float32))
('Action ', array([ 9.8688221 ,  9.15872574], dtype=float32))
('Action ', array([ 8.542449  ,  9.27246189], dtype=float32))
('Action ', array([ 9.8688221 ,  9.15872574], dtype=float32))
('Action ', array([ 8.542449  ,  9.27246189], dtype=float32))
('Action ', array([ 10.20937634,   8.35809326], dtype=float32))
('Action ', array([ 8.542449  ,  9.27246189], dtype=float32))
('Action ', array([ 10.20937634,   8.35

('Action ', array([ 9.35688591,  8.24810314], dtype=float32))
('Action ', array([  8.6561718 ,  10.03924942], dtype=float32))
('Action ', array([ 10.37860012,   8.39947414], dtype=float32))
('Action ', array([  8.6561718 ,  10.03924942], dtype=float32))
('Action ', array([ 10.37860012,   8.39947414], dtype=float32))
('Action ', array([  8.6561718 ,  10.03924942], dtype=float32))
('Action ', array([  8.6561718 ,  10.03924942], dtype=float32))
('Action ', array([ 10.37747192,   8.25998306], dtype=float32))
('Action ', array([  8.67740631,  10.03507805], dtype=float32))
('Action ', array([ 10.41792107,   8.24245834], dtype=float32))
('Action ', array([  8.67740631,  10.03507805], dtype=float32))
('Action ', array([ 10.45184326,  10.80636692], dtype=float32))
('Action ', array([  8.69414902,  10.16359425], dtype=float32))
('Action ', array([ 10.22374344,  10.12630272], dtype=float32))
('Action ', array([  8.79999352,  10.14585876], dtype=float32))
('Action ', array([ 9.15408516,  7.7706337

('Action ', array([ 9.48807621,  8.19098377], dtype=float32))
('Action ', array([ 10.96303558,  10.4475069 ], dtype=float32))
('Action ', array([ 8.74913025,  9.98795605], dtype=float32))
('Action ', array([ 10.93307781,  10.3428936 ], dtype=float32))
('Action ', array([ 8.74913025,  9.98795605], dtype=float32))
('Action ', array([ 10.93307781,  10.3428936 ], dtype=float32))
('Action ', array([ 8.74913025,  9.98795605], dtype=float32))
('Action ', array([ 10.62513161,   8.37495899], dtype=float32))
('Action ', array([ 8.74913025,  9.98795605], dtype=float32))
('Action ', array([ 10.62513161,   8.37495899], dtype=float32))
('Action ', array([ 8.74913025,  9.98795605], dtype=float32))
('Action ', array([ 10.62513161,   8.37495899], dtype=float32))
('Action ', array([ 8.74913025,  9.98795605], dtype=float32))
('Action ', array([ 10.62513161,   8.37495899], dtype=float32))
('Action ', array([ 8.74913025,  9.98795605], dtype=float32))
('Action ', array([ 11.04377079,   8.2400856 ], dtype=fl

('Action ', array([ 9.52301121,  8.21637249], dtype=float32))
('Action ', array([ 8.861516  ,  9.35421944], dtype=float32))
('Action ', array([ 8.090415  ,  9.42682362], dtype=float32))
('Action ', array([ 8.8720274 ,  9.35604286], dtype=float32))
('Action ', array([ 8.6260128 ,  8.50822353], dtype=float32))
('Action ', array([ 8.95221996,  9.49708939], dtype=float32))
('Action ', array([ 8.6260128 ,  8.50822353], dtype=float32))
('Action ', array([ 8.97877026,  9.47961807], dtype=float32))
('Action ', array([ 8.42560863,  9.66101742], dtype=float32))
('Action ', array([ 8.97677326,  9.48371887], dtype=float32))
('Action ', array([ 9.0164156 ,  8.85730743], dtype=float32))
('Action ', array([ 9.05565834,  9.01532269], dtype=float32))
('Action ', array([ 8.16653156,  8.26516438], dtype=float32))
Episode: 690/5000, score: 13
('Action ', array([ 9.49656296,  8.23113632], dtype=float32))
('Action ', array([  8.81865406,  10.05822754], dtype=float32))
('Action ', array([ 9.49656296,  8.2311

('Action ', array([ 9.48833847,  8.30613327], dtype=float32))
('Action ', array([  9.07192516,  10.18893337], dtype=float32))
('Action ', array([ 10.40122128,   9.95671082], dtype=float32))
('Action ', array([  9.07192516,  10.18893337], dtype=float32))
('Action ', array([ 10.39666843,   9.95735931], dtype=float32))
('Action ', array([ 8.56482792,  9.75169945], dtype=float32))
('Action ', array([ 10.3747282 ,   9.92072487], dtype=float32))
('Action ', array([ 8.56482792,  9.75169945], dtype=float32))
('Action ', array([ 10.46443367,   9.84618378], dtype=float32))
('Action ', array([ 8.56482792,  9.75169945], dtype=float32))
('Action ', array([ 10.46443367,   9.84618378], dtype=float32))
('Action ', array([ 8.56482792,  9.75169945], dtype=float32))
('Action ', array([ 10.27431774,  11.0087471 ], dtype=float32))
('Action ', array([ 8.56482792,  9.75169945], dtype=float32))
('Action ', array([ 10.27431774,  11.0087471 ], dtype=float32))
('Action ', array([ 8.56482792,  9.75169945], dtype=

('Action ', array([ 8.63016224,  4.18742704], dtype=float32))
('Action ', array([ 8.22838974,  8.41406918], dtype=float32))
Episode: 701/5000, score: 31
('Action ', array([ 9.76867485,  8.28109646], dtype=float32))
('Action ', array([  9.41417789,  10.61521435], dtype=float32))
('Action ', array([ 14.04641438,  10.03699493], dtype=float32))
('Action ', array([  9.41417789,  10.61521435], dtype=float32))
('Action ', array([ 14.04641438,  10.03699493], dtype=float32))
('Action ', array([  9.41417789,  10.61521435], dtype=float32))
('Action ', array([ 14.04641438,  10.03699493], dtype=float32))
('Action ', array([ 15.45335102,  10.86622238], dtype=float32))
('Action ', array([  9.41417789,  10.61521435], dtype=float32))
('Action ', array([ 15.45335102,  10.86622238], dtype=float32))
('Action ', array([  9.41417789,  10.61521435], dtype=float32))
('Action ', array([ 15.45335102,  10.86622238], dtype=float32))
('Action ', array([  9.41417789,  10.61521435], dtype=float32))
('Action ', array

('Action ', array([  9.24697113,  10.25160599], dtype=float32))
('Action ', array([ 8.37840843,  8.39397812], dtype=float32))
('Action ', array([  9.20787811,  10.44663334], dtype=float32))
('Action ', array([ 8.44900894,  5.13121033], dtype=float32))
('Action ', array([  9.19955444,  10.35542965], dtype=float32))
('Action ', array([ 8.97088146,  0.02799244], dtype=float32))
('Action ', array([ 8.29963112,  9.25827599], dtype=float32))
('Action ', array([ 7.42301989,  5.10666656], dtype=float32))
('Action ', array([ 8.72865677,  9.76435947], dtype=float32))
('Action ', array([ 6.39611483,  3.71694589], dtype=float32))
('Action ', array([ 9.10938644,  9.88270569], dtype=float32))
('Action ', array([ 6.2912631 ,  3.76244378], dtype=float32))
('Action ', array([ 10.06583023,  10.62495613], dtype=float32))
('Action ', array([ 6.03088713,  2.36222863], dtype=float32))
('Action ', array([  9.61779785,  10.1737175 ], dtype=float32))
('Action ', array([ 5.65844488,  3.02433038], dtype=float32)

('Action ', array([ 9.60003757,  9.85381413], dtype=float32))
('Action ', array([ 3.8624332,  4.8977747], dtype=float32))
('Action ', array([  9.77564144,  10.1238575 ], dtype=float32))
Episode: 712/5000, score: 33
('Action ', array([ 9.65494251,  8.58955574], dtype=float32))
('Action ', array([ 8.8713274,  9.4257803], dtype=float32))
('Action ', array([ 9.65494251,  8.58955574], dtype=float32))
('Action ', array([ 10.6085825 ,   9.47482967], dtype=float32))
('Action ', array([ 8.9703474 ,  9.51175404], dtype=float32))
('Action ', array([ 11.54665756,   9.54962063], dtype=float32))
('Action ', array([  9.15367985,  10.20696545], dtype=float32))
('Action ', array([ 11.33459568,   8.50670147], dtype=float32))
('Action ', array([ 9.18569279,  8.73206234], dtype=float32))
('Action ', array([ 8.63705158,  9.88069439], dtype=float32))
('Action ', array([ 10.14030552,   9.29378796], dtype=float32))
('Action ', array([ 8.15281963,  9.44274426], dtype=float32))
('Action ', array([ 7.7213068 ,  

('Action ', array([ 9.60675144,  8.58503246], dtype=float32))
('Action ', array([  9.10492802,  10.41777515], dtype=float32))
('Action ', array([ 10.85349941,   7.63543272], dtype=float32))
('Action ', array([  9.14174938,  10.47790909], dtype=float32))
('Action ', array([ 10.72259235,   7.42687178], dtype=float32))
('Action ', array([  9.14174938,  10.47790909], dtype=float32))
('Action ', array([ 10.71978474,   7.42747068], dtype=float32))
('Action ', array([  9.14174938,  10.47790909], dtype=float32))
('Action ', array([ 8.95805073,  6.31361914], dtype=float32))
('Action ', array([  9.14174938,  10.47790909], dtype=float32))
('Action ', array([ 8.85532093,  6.21423101], dtype=float32))
('Action ', array([  9.14174938,  10.47790909], dtype=float32))
('Action ', array([ 8.85532093,  6.21423101], dtype=float32))
('Action ', array([  9.14174938,  10.47790909], dtype=float32))
('Action ', array([ 8.85532093,  6.21423101], dtype=float32))
('Action ', array([  9.14174938,  10.47790909], dt

('Action ', array([  9.59410858,  10.9149437 ], dtype=float32))
('Action ', array([ 9.73425674,  6.85814667], dtype=float32))
('Action ', array([ 9.14492226,  9.78966618], dtype=float32))
('Action ', array([ 9.18092918,  6.24925041], dtype=float32))
('Action ', array([  9.34646416,  10.09793472], dtype=float32))
('Action ', array([ 8.3114109,  6.4272747], dtype=float32))
('Action ', array([  9.29761505,  10.01869297], dtype=float32))
('Action ', array([ 7.87763119,  6.85970497], dtype=float32))
('Action ', array([  9.23091316,  10.03489876], dtype=float32))
('Action ', array([ 5.89538336,  5.45447731], dtype=float32))
('Action ', array([ 8.9974041 ,  9.46253395], dtype=float32))
('Action ', array([ 3.79040885,  6.85291481], dtype=float32))
Episode: 723/5000, score: 40
('Action ', array([ 9.64469051,  8.74895287], dtype=float32))
('Action ', array([  8.89385128,  10.31150341], dtype=float32))
('Action ', array([ 9.64469051,  8.74895287], dtype=float32))
('Action ', array([  8.89385128, 

('Action ', array([ 9.75161648,  8.82175827], dtype=float32))
('Action ', array([ 8.93271732,  9.59344006], dtype=float32))
('Action ', array([ 11.10042286,  10.2651577 ], dtype=float32))
('Action ', array([ 8.93271732,  9.59344006], dtype=float32))
('Action ', array([ 11.53677464,  11.66552639], dtype=float32))
('Action ', array([ 8.93271732,  9.59344006], dtype=float32))
('Action ', array([ 10.88750172,  11.32923603], dtype=float32))
('Action ', array([ 8.9124403 ,  9.61066532], dtype=float32))
('Action ', array([ 11.01094913,  11.20235538], dtype=float32))
('Action ', array([ 8.87846279,  9.57330608], dtype=float32))
('Action ', array([ 10.70636845,   9.20492554], dtype=float32))
('Action ', array([ 7.22131777,  7.99590969], dtype=float32))
('Action ', array([ 9.18311596,  7.70221615], dtype=float32))
('Action ', array([ 7.31038904,  8.09341335], dtype=float32))
('Action ', array([ 6.17949629,  6.15448093], dtype=float32))
('Action ', array([ 7.17084742,  7.90193653], dtype=float32)

Episode: 734/5000, score: 29
('Action ', array([ 9.76589394,  8.75950241], dtype=float32))
('Action ', array([  9.28526974,  10.39995956], dtype=float32))
('Action ', array([ 10.94249249,   9.84647274], dtype=float32))
('Action ', array([  9.28526974,  10.39995956], dtype=float32))
('Action ', array([  9.28526974,  10.39995956], dtype=float32))
('Action ', array([ 9.97754097,  9.83700848], dtype=float32))
('Action ', array([  9.30062199,  10.44220638], dtype=float32))
('Action ', array([ 9.06105709,  8.01605129], dtype=float32))
('Action ', array([  9.30616665,  10.41090202], dtype=float32))
('Action ', array([ 9.00331116,  7.70788145], dtype=float32))
('Action ', array([  9.30616665,  10.41090202], dtype=float32))
('Action ', array([ 8.91225529,  7.37596083], dtype=float32))
('Action ', array([  9.32805157,  10.44285965], dtype=float32))
('Action ', array([ 8.46964359,  7.04190016], dtype=float32))
('Action ', array([  9.32805157,  10.44285965], dtype=float32))
('Action ', array([ 8.4

('Action ', array([ 9.31234264,  8.84293747], dtype=float32))
('Action ', array([ 6.54663181,  0.87185907], dtype=float32))
('Action ', array([ 9.3601675 ,  8.78527164], dtype=float32))
('Action ', array([ 9.25034809,  2.90013742], dtype=float32))
('Action ', array([ 9.33684063,  8.99839306], dtype=float32))
('Action ', array([ 7.57495022,  8.74875927], dtype=float32))
('Action ', array([ 8.74262714,  8.25743484], dtype=float32))
('Action ', array([ 4.33885574,  8.54071331], dtype=float32))
('Action ', array([ 9.9759264 ,  9.36187077], dtype=float32))
('Action ', array([ 4.41697693,  1.87411737], dtype=float32))
('Action ', array([ 10.53831196,   9.44991684], dtype=float32))
('Action ', array([ 2.74540901,  2.90943766], dtype=float32))
('Action ', array([ 10.49780178,   9.61095619], dtype=float32))
('Action ', array([  1.25767517,  12.51697826], dtype=float32))
('Action ', array([ 10.4966917 ,   9.86414433], dtype=float32))
('Action ', array([  7.13724709,  16.704813  ], dtype=float32)

('Action ', array([ 9.99620342,  8.83393574], dtype=float32))
('Action ', array([ 9.07893848,  9.50556087], dtype=float32))
('Action ', array([ 10.21175957,   9.49850178], dtype=float32))
('Action ', array([ 9.07893848,  9.50556087], dtype=float32))
('Action ', array([ 10.52855873,  10.63472843], dtype=float32))
('Action ', array([ 9.07893848,  9.50556087], dtype=float32))
('Action ', array([ 10.21175957,   9.49850178], dtype=float32))
('Action ', array([ 9.08913708,  9.51312637], dtype=float32))
('Action ', array([ 10.28616047,   9.94486523], dtype=float32))
('Action ', array([ 9.33585262,  9.44200611], dtype=float32))
('Action ', array([ 10.83674908,  10.62691402], dtype=float32))
('Action ', array([ 8.91823864,  8.77816105], dtype=float32))
('Action ', array([ 10.9730463 ,   9.73512936], dtype=float32))
('Action ', array([ 8.87861156,  8.76944447], dtype=float32))
('Action ', array([ 11.01530743,   9.86643887], dtype=float32))
('Action ', array([ 9.32080173,  9.41717911], dtype=floa

('Action ', array([ 9.99388027,  8.85866642], dtype=float32))
('Action ', array([ 9.12837601,  9.54229164], dtype=float32))
('Action ', array([ 10.75041771,   9.77226734], dtype=float32))
('Action ', array([ 10.75041771,   9.77226734], dtype=float32))
('Action ', array([ 8.73478508,  9.23606586], dtype=float32))
('Action ', array([ 11.12158108,   8.5052557 ], dtype=float32))
('Action ', array([ 8.35655403,  9.00701523], dtype=float32))
('Action ', array([ 10.54561043,   8.97983456], dtype=float32))
('Action ', array([ 8.47813797,  9.10879803], dtype=float32))
('Action ', array([ 10.56483173,   9.29614544], dtype=float32))
('Action ', array([ 8.90275574,  9.27059174], dtype=float32))
('Action ', array([ 10.45494366,   7.1156106 ], dtype=float32))
('Action ', array([ 8.96899796,  9.17204571], dtype=float32))
('Action ', array([ 2.90605903, -0.16124475], dtype=float32))
('Action ', array([ 8.81286812,  9.17222691], dtype=float32))
Episode: 748/5000, score: 15
('Action ', array([ 9.9975748

('Action ', array([ 1.74571943,  1.33749163], dtype=float32))
('Action ', array([ 9.63534069,  9.14349556], dtype=float32))
('Action ', array([ 3.3015933 ,  5.07283545], dtype=float32))
('Action ', array([ 9.5883379 ,  9.11780453], dtype=float32))
('Action ', array([ 1.36956358,  3.23982406], dtype=float32))
('Action ', array([ 7.75851393,  8.00869465], dtype=float32))
('Action ', array([ 3.01420736,  3.75485778], dtype=float32))
('Action ', array([ 7.62050581,  7.96845961], dtype=float32))
('Action ', array([ 3.99189711,  3.98527312], dtype=float32))
('Action ', array([ 7.59275198,  7.97656679], dtype=float32))
('Action ', array([ 3.39740229,  3.16304946], dtype=float32))
('Action ', array([ 8.06322384,  8.27283096], dtype=float32))
('Action ', array([ 4.25452948,  3.1135118 ], dtype=float32))
('Action ', array([ 7.87534857,  8.18526649], dtype=float32))
('Action ', array([ 3.2217803 ,  4.63261938], dtype=float32))
('Action ', array([ 7.94341993,  8.20022678], dtype=float32))
('Action

Episode: 760/5000, score: 29
('Action ', array([ 10.03582478,   8.90364552], dtype=float32))
('Action ', array([  9.26147938,  10.18574047], dtype=float32))
('Action ', array([ 11.4614706 ,   9.83204746], dtype=float32))
('Action ', array([  9.50182819,  10.16810799], dtype=float32))
('Action ', array([ 11.25738525,   9.23191643], dtype=float32))
('Action ', array([  9.53546238,  10.15895748], dtype=float32))
('Action ', array([ 10.80247307,   9.53064346], dtype=float32))
('Action ', array([  9.53546238,  10.15895748], dtype=float32))
('Action ', array([ 10.10921097,  10.08713818], dtype=float32))
('Action ', array([  9.53324032,  10.15977001], dtype=float32))
('Action ', array([ 10.94981575,   9.67540073], dtype=float32))
('Action ', array([  9.57356167,  10.22520351], dtype=float32))
('Action ', array([ 10.7327013,   9.2476778], dtype=float32))
('Action ', array([  9.59277058,  10.23206997], dtype=float32))
('Action ', array([ 10.43996906,  10.36164761], dtype=float32))
('Action ', a

('Action ', array([ 10.09993839,   8.9891758 ], dtype=float32))
('Action ', array([  9.40612888,  10.23878098], dtype=float32))
('Action ', array([ 11.24614429,   8.82355595], dtype=float32))
('Action ', array([  9.40686512,  10.23898315], dtype=float32))
('Action ', array([ 11.65470409,   7.77257013], dtype=float32))
('Action ', array([  9.40686512,  10.23898315], dtype=float32))
('Action ', array([ 11.80972672,   9.55261898], dtype=float32))
('Action ', array([  9.40686512,  10.23898315], dtype=float32))
('Action ', array([ 11.18174648,   8.85105038], dtype=float32))
('Action ', array([  9.40686512,  10.23898315], dtype=float32))
('Action ', array([ 11.34471226,   8.57327175], dtype=float32))
('Action ', array([  9.54394245,  10.35960007], dtype=float32))
('Action ', array([ 11.24360752,   8.0676012 ], dtype=float32))
('Action ', array([  9.54389858,  10.30610466], dtype=float32))
('Action ', array([ 8.0984602 ,  7.07977533], dtype=float32))
('Action ', array([  9.60852528,  10.45085

('Action ', array([ 9.82277775,  9.21500301], dtype=float32))
('Action ', array([  9.1886034 ,  10.26640606], dtype=float32))
('Action ', array([ 10.89397049,  10.29579353], dtype=float32))
('Action ', array([  9.27506161,  10.34864616], dtype=float32))
('Action ', array([ 10.95557404,   9.9914856 ], dtype=float32))
('Action ', array([  9.2937479 ,  10.34509659], dtype=float32))
('Action ', array([ 10.69402981,  10.87798119], dtype=float32))
('Action ', array([  9.29736042,  10.41259575], dtype=float32))
('Action ', array([ 10.24970913,  11.81937027], dtype=float32))
('Action ', array([  9.71630192,  10.70563412], dtype=float32))
('Action ', array([  9.45953083,  11.62659264], dtype=float32))
('Action ', array([  9.53691959,  10.44562149], dtype=float32))
('Action ', array([  9.65497303,  11.54146004], dtype=float32))
('Action ', array([ 9.4142046 ,  9.71898365], dtype=float32))
('Action ', array([ 5.78028488,  5.89832497], dtype=float32))
('Action ', array([ 9.43679714,  9.70951366], 

('Action ', array([ 9.35971546,  9.43352413], dtype=float32))
('Action ', array([ 8.9210453 ,  9.29318905], dtype=float32))
('Action ', array([ 9.35971546,  9.43352413], dtype=float32))
('Action ', array([ 8.92313004,  9.28916454], dtype=float32))
('Action ', array([ 9.90023041,  9.64187145], dtype=float32))
('Action ', array([ 8.60772324,  8.70350742], dtype=float32))
('Action ', array([ 6.57936668,  4.8303113 ], dtype=float32))
('Action ', array([ 6.71651888,  7.39014959], dtype=float32))
('Action ', array([ 6.20839548,  4.59040117], dtype=float32))
('Action ', array([ 6.72322893,  7.36316252], dtype=float32))
('Action ', array([ 4.0904851,  3.7253232], dtype=float32))
('Action ', array([ 6.92041063,  7.41042852], dtype=float32))
('Action ', array([ 1.36786115,  3.95167589], dtype=float32))
('Action ', array([ 6.70095873,  7.12306643], dtype=float32))
Episode: 779/5000, score: 13
('Action ', array([ 9.33242607,  9.45300388], dtype=float32))
('Action ', array([  8.91685009,  10.052365

('Action ', array([ 9.20218945,  9.24478817], dtype=float32))
('Action ', array([ 5.49988031,  6.61561394], dtype=float32))
('Action ', array([ 8.92225361,  9.03208923], dtype=float32))
('Action ', array([ 5.49988031,  6.61561394], dtype=float32))
('Action ', array([ 8.92225361,  9.03208923], dtype=float32))
('Action ', array([ 5.49988031,  6.61561394], dtype=float32))
('Action ', array([ 9.19499683,  9.24218369], dtype=float32))
('Action ', array([ 5.75112009,  5.65636253], dtype=float32))
('Action ', array([ 9.37078571,  9.12905121], dtype=float32))
('Action ', array([ 3.58743739,  3.23803544], dtype=float32))
('Action ', array([ 9.20060825,  9.31811523], dtype=float32))
('Action ', array([ 0.47585356,  2.04115129], dtype=float32))
Episode: 788/5000, score: 40
('Action ', array([ 9.1870203 ,  9.56316376], dtype=float32))
('Action ', array([ 8.70411587,  9.14933586], dtype=float32))
('Action ', array([  9.75101376,  10.04986382], dtype=float32))
('Action ', array([ 8.70527935,  9.1551

('Action ', array([ 9.36105442,  9.57075691], dtype=float32))
('Action ', array([ 8.56656456,  9.76292133], dtype=float32))
('Action ', array([ 9.36105442,  9.57075691], dtype=float32))
('Action ', array([ 8.58311462,  9.83229637], dtype=float32))
('Action ', array([ 8.3399353 ,  9.53995228], dtype=float32))
('Action ', array([ 10.23801804,   7.17461443], dtype=float32))
('Action ', array([ 8.06069565,  9.26255894], dtype=float32))
('Action ', array([ 10.80054092,   7.24598742], dtype=float32))
('Action ', array([ 10.15219116,   6.48928881], dtype=float32))
('Action ', array([ 6.97294283,  8.26317978], dtype=float32))
('Action ', array([ 7.69676638,  1.49796319], dtype=float32))
Episode: 798/5000, score: 12
('Action ', array([ 9.37839031,  9.58584309], dtype=float32))
('Action ', array([ 8.36016464,  8.99453163], dtype=float32))
('Action ', array([ 9.37839031,  9.58584309], dtype=float32))
('Action ', array([ 8.38162613,  9.01090813], dtype=float32))
('Action ', array([ 10.51252079,   

('Action ', array([ 9.3446188,  9.5606842], dtype=float32))
('Action ', array([ 8.427248  ,  9.83849049], dtype=float32))
('Action ', array([ 9.20242119,  8.91860294], dtype=float32))
('Action ', array([ 8.34618568,  9.84119701], dtype=float32))
('Action ', array([ 7.98244858,  8.70818424], dtype=float32))
('Action ', array([  8.65640259,  10.1561203 ], dtype=float32))
('Action ', array([ 6.67332506,  5.01731205], dtype=float32))
('Action ', array([ 7.58050394,  8.7096405 ], dtype=float32))
('Action ', array([ 4.98397875,  3.41207218], dtype=float32))
('Action ', array([ 7.43440294,  8.65410328], dtype=float32))
('Action ', array([ 2.91769457,  1.67458045], dtype=float32))
Episode: 808/5000, score: 10
('Action ', array([ 9.36439419,  9.55639744], dtype=float32))
('Action ', array([ 8.01480675,  8.94623852], dtype=float32))
('Action ', array([ 9.93453503,  9.77203751], dtype=float32))
('Action ', array([ 8.02683067,  8.92909241], dtype=float32))
('Action ', array([ 9.93453503,  9.772037

('Action ', array([ 9.49353218,  9.51240921], dtype=float32))
('Action ', array([  8.43223953,  10.02947903], dtype=float32))
('Action ', array([ 11.4665966 ,  10.44389915], dtype=float32))
('Action ', array([  8.43223953,  10.02947903], dtype=float32))
('Action ', array([ 10.57038689,  10.31364441], dtype=float32))
('Action ', array([ 8.22935486,  9.83859634], dtype=float32))
('Action ', array([ 10.92955208,  10.04451752], dtype=float32))
('Action ', array([ 8.28507042,  9.79524899], dtype=float32))
('Action ', array([ 10.53281021,   9.26906204], dtype=float32))
('Action ', array([ 7.42703867,  8.54994202], dtype=float32))
('Action ', array([ 9.27167988,  9.32260895], dtype=float32))
('Action ', array([ 7.27180529,  8.53342628], dtype=float32))
('Action ', array([ 7.23688936,  5.12363815], dtype=float32))
('Action ', array([ 7.14052057,  8.44640064], dtype=float32))
('Action ', array([ 6.01114511,  5.02403641], dtype=float32))
Episode: 818/5000, score: 14
('Action ', array([ 9.5103464

('Action ', array([ 9.44696331,  9.53970242], dtype=float32))
('Action ', array([ 8.42663288,  9.97103786], dtype=float32))
('Action ', array([ 10.40644455,  11.84070587], dtype=float32))
('Action ', array([  8.75652599,  10.31579399], dtype=float32))
('Action ', array([ 9.38781452,  9.41391182], dtype=float32))
('Action ', array([ 8.23321629,  8.96887016], dtype=float32))
('Action ', array([ 4.85712767,  5.89336061], dtype=float32))
('Action ', array([ 7.68318892,  8.28629494], dtype=float32))
Episode: 826/5000, score: 7
('Action ', array([ 9.48957825,  9.54358387], dtype=float32))
('Action ', array([  8.76887703,  10.23456097], dtype=float32))
('Action ', array([ 7.15673018,  7.66484356], dtype=float32))
('Action ', array([ 8.33974838,  9.32685852], dtype=float32))
('Action ', array([ 8.44660187,  9.4285078 ], dtype=float32))
('Action ', array([ 4.69020081,  8.03635883], dtype=float32))
('Action ', array([ 6.4603405 ,  7.91452599], dtype=float32))
('Action ', array([ 2.05360246,  5.3

('Action ', array([  8.98119545,  10.26601887], dtype=float32))
Episode: 832/5000, score: 29
('Action ', array([ 9.7167902,  9.4477396], dtype=float32))
('Action ', array([  8.60131264,  10.06256485], dtype=float32))
('Action ', array([ 12.21292305,   9.1330061 ], dtype=float32))
('Action ', array([  8.63105774,  10.10374641], dtype=float32))
('Action ', array([ 12.17754269,   9.07856655], dtype=float32))
('Action ', array([  8.63105774,  10.10374641], dtype=float32))
('Action ', array([ 12.78637695,  11.10117626], dtype=float32))
('Action ', array([  8.63105774,  10.10374641], dtype=float32))
('Action ', array([ 12.78637695,  11.10117626], dtype=float32))
('Action ', array([  8.63105774,  10.10374641], dtype=float32))
('Action ', array([  8.63105774,  10.10374641], dtype=float32))
('Action ', array([ 12.88297081,  11.16095638], dtype=float32))
('Action ', array([  8.63105774,  10.10374641], dtype=float32))
('Action ', array([ 12.88297081,  11.16095638], dtype=float32))
('Action ', arr

Episode: 838/5000, score: 29
('Action ', array([ 9.70266914,  9.43690968], dtype=float32))
('Action ', array([ 8.3470459 ,  9.24290466], dtype=float32))
('Action ', array([  9.34275723,  10.12688351], dtype=float32))
('Action ', array([ 8.34041405,  9.32351875], dtype=float32))
('Action ', array([  8.83548927,  10.4809618 ], dtype=float32))
('Action ', array([ 8.36731148,  9.31719208], dtype=float32))
('Action ', array([ 9.02864838,  9.14068127], dtype=float32))
('Action ', array([ 8.3952198 ,  9.34148979], dtype=float32))
('Action ', array([ 8.50720978,  7.96674061], dtype=float32))
('Action ', array([ 6.82766581,  8.24298859], dtype=float32))
('Action ', array([ 4.20154047,  2.94546986], dtype=float32))
Episode: 839/5000, score: 10
('Action ', array([ 9.72655964,  9.46096706], dtype=float32))
('Action ', array([ 8.43060017,  9.1417532 ], dtype=float32))
('Action ', array([ 9.72655964,  9.46096706], dtype=float32))
('Action ', array([ 8.39156818,  9.2090683 ], dtype=float32))
('Action

('Action ', array([ 9.85571861,  9.53412437], dtype=float32))
('Action ', array([ 8.31010914,  9.98983479], dtype=float32))
('Action ', array([ 11.4557476 ,  10.33032894], dtype=float32))
('Action ', array([ 8.31145573,  9.98934841], dtype=float32))
('Action ', array([ 11.44706917,  10.33964252], dtype=float32))
('Action ', array([ 8.3124094 ,  9.95121098], dtype=float32))
('Action ', array([ 8.3124094 ,  9.95121098], dtype=float32))
('Action ', array([ 10.24723816,  10.90279484], dtype=float32))
('Action ', array([ 8.3020525 ,  9.90100098], dtype=float32))
('Action ', array([  7.72233343,  10.53095341], dtype=float32))
('Action ', array([ 8.21309757,  9.80307007], dtype=float32))
('Action ', array([ 6.66669178,  9.13014698], dtype=float32))
('Action ', array([ 8.20965099,  9.80366135], dtype=float32))
('Action ', array([ 6.44463444,  6.18519354], dtype=float32))
('Action ', array([ 8.57813358,  9.46773911], dtype=float32))
('Action ', array([ 3.69863319,  4.7495513 ], dtype=float32))


('Action ', array([ 7.05268097,  7.73535442], dtype=float32))
('Action ', array([ 5.18747997,  3.33162212], dtype=float32))
('Action ', array([ 7.04530144,  7.74050713], dtype=float32))
Episode: 851/5000, score: 33
('Action ', array([ 9.85084438,  9.39066505], dtype=float32))
('Action ', array([ 8.4050827 ,  9.94634724], dtype=float32))
('Action ', array([ 9.85084438,  9.39066505], dtype=float32))
('Action ', array([ 8.4050827 ,  9.94634724], dtype=float32))
('Action ', array([ 9.85084438,  9.39066505], dtype=float32))
('Action ', array([ 8.4050827 ,  9.94634724], dtype=float32))
('Action ', array([ 10.27227402,  10.29864311], dtype=float32))
('Action ', array([ 8.4050827 ,  9.94634724], dtype=float32))
('Action ', array([ 9.85084438,  9.39066505], dtype=float32))
('Action ', array([ 8.4050827 ,  9.94634724], dtype=float32))
('Action ', array([ 9.85084438,  9.39066505], dtype=float32))
('Action ', array([ 8.36803436,  9.90681648], dtype=float32))
('Action ', array([ 10.1868782 ,  10.38

('Action ', array([ 9.9627409 ,  9.49249744], dtype=float32))
('Action ', array([ 8.33881378,  9.18805122], dtype=float32))
('Action ', array([ 11.16562653,  10.78527164], dtype=float32))
('Action ', array([ 8.33881378,  9.18805122], dtype=float32))
('Action ', array([ 11.56134415,  11.73152351], dtype=float32))
('Action ', array([ 8.01638794,  9.01912212], dtype=float32))
('Action ', array([ 11.38121128,  10.71638489], dtype=float32))
('Action ', array([ 7.98216629,  9.03460121], dtype=float32))
('Action ', array([ 11.38121128,  10.71638489], dtype=float32))
('Action ', array([ 8.02122307,  9.02704906], dtype=float32))
('Action ', array([ 11.38121128,  10.71638489], dtype=float32))
('Action ', array([ 7.93360329,  8.94940948], dtype=float32))
('Action ', array([ 11.24082661,  10.49084759], dtype=float32))
('Action ', array([ 7.95874023,  8.96168804], dtype=float32))
('Action ', array([ 11.24082661,  10.49084759], dtype=float32))
('Action ', array([ 7.95874023,  8.96168804], dtype=floa

('Action ', array([ 9.89376926,  9.42898273], dtype=float32))
('Action ', array([ 8.3348093 ,  9.55772305], dtype=float32))
('Action ', array([ 10.43068123,   9.97623062], dtype=float32))
('Action ', array([ 8.35631466,  9.56543922], dtype=float32))
('Action ', array([ 9.92902374,  9.23174953], dtype=float32))
('Action ', array([ 8.33116817,  9.56912994], dtype=float32))
('Action ', array([ 10.77070808,  10.61381149], dtype=float32))
('Action ', array([ 8.33161068,  9.57297897], dtype=float32))
('Action ', array([ 10.46940517,  10.24710274], dtype=float32))
('Action ', array([ 9.59310818,  9.53964424], dtype=float32))
('Action ', array([ 8.29118443,  9.57984066], dtype=float32))
('Action ', array([ 9.1884737 ,  6.84426689], dtype=float32))
('Action ', array([ 8.17711926,  9.40945053], dtype=float32))
('Action ', array([ 7.74829006,  6.42184067], dtype=float32))
('Action ', array([ 6.23949194,  8.1326437 ], dtype=float32))
('Action ', array([ 7.29499483,  4.72640228], dtype=float32))
('

('Action ', array([ 6.5177269 ,  7.05334091], dtype=float32))
('Action ', array([ 8.6092329 ,  9.20091724], dtype=float32))
('Action ', array([ 6.28602791,  6.85129929], dtype=float32))
('Action ', array([ 9.05364895,  9.08515453], dtype=float32))
('Action ', array([ 9.3751936 ,  9.36608124], dtype=float32))
('Action ', array([ 6.0796442 ,  7.24490738], dtype=float32))
('Action ', array([ 8.35990429,  8.72789669], dtype=float32))
('Action ', array([ 5.09573841,  6.80300522], dtype=float32))
('Action ', array([ 8.3563509 ,  8.41749763], dtype=float32))
('Action ', array([ 3.73871922,  5.65176773], dtype=float32))
('Action ', array([ 7.91210079,  7.68589973], dtype=float32))
('Action ', array([ 2.9586556 ,  3.58905387], dtype=float32))
('Action ', array([ 7.87726879,  7.8839426 ], dtype=float32))
('Action ', array([ 4.36650372,  3.1337316 ], dtype=float32))
('Action ', array([ 8.18542957,  8.16648674], dtype=float32))
('Action ', array([ 0.40828815, -3.86495233], dtype=float32))
('Action

('Action ', array([ 9.65313053,  9.55537891], dtype=float32))
('Action ', array([ 8.39318085,  9.20646667], dtype=float32))
('Action ', array([ 7.68610382,  9.54995918], dtype=float32))
('Action ', array([ 8.39318085,  9.20646667], dtype=float32))
('Action ', array([ 9.65313053,  9.55537891], dtype=float32))
('Action ', array([ 8.39318085,  9.20646667], dtype=float32))
('Action ', array([ 9.65313053,  9.55537891], dtype=float32))
('Action ', array([ 8.35645294,  9.1673851 ], dtype=float32))
('Action ', array([ 8.51595688,  9.98740578], dtype=float32))
('Action ', array([ 8.24895096,  9.03731537], dtype=float32))
('Action ', array([ 9.26869774,  9.17852211], dtype=float32))
('Action ', array([ 7.15074158,  7.66233873], dtype=float32))
('Action ', array([ 4.9966464 ,  4.47168398], dtype=float32))
('Action ', array([ 6.92879868,  7.60304308], dtype=float32))
('Action ', array([ 2.93279815,  4.34540606], dtype=float32))
('Action ', array([ 7.73711777,  8.00613785], dtype=float32))
Episode:

('Action ', array([ 7.6100378 ,  7.61838961], dtype=float32))
('Action ', array([ 6.76673985,  6.43475485], dtype=float32))
('Action ', array([ 7.484622  ,  7.61720419], dtype=float32))
('Action ', array([ 6.63364029,  6.15153646], dtype=float32))
('Action ', array([ 7.87502575,  8.0402832 ], dtype=float32))
('Action ', array([ 6.18806171,  6.71962881], dtype=float32))
('Action ', array([ 7.84370518,  7.99735975], dtype=float32))
('Action ', array([ 4.66267872,  5.52593374], dtype=float32))
('Action ', array([ 4.74833965,  5.72029257], dtype=float32))
('Action ', array([ 7.83257771,  8.05544281], dtype=float32))
('Action ', array([ 6.7642374 ,  5.36047888], dtype=float32))
('Action ', array([ 7.63785458,  7.84814119], dtype=float32))
('Action ', array([ 6.48074722,  6.17656088], dtype=float32))
('Action ', array([ 8.19271946,  8.07002926], dtype=float32))
('Action ', array([ 6.32124805,  6.85554266], dtype=float32))
('Action ', array([ 7.42086887,  7.08329725], dtype=float32))
('Action

('Action ', array([ 9.46835995,  9.45998478], dtype=float32))
('Action ', array([ 8.21327782,  8.13285065], dtype=float32))
('Action ', array([ 7.68377018,  8.34157372], dtype=float32))
('Action ', array([ 8.24393845,  8.11222458], dtype=float32))
('Action ', array([ 7.70322418,  8.33898163], dtype=float32))
('Action ', array([ 8.17397213,  8.18430614], dtype=float32))
('Action ', array([ 6.51700401,  8.33590412], dtype=float32))
('Action ', array([ 8.13964939,  8.15633774], dtype=float32))
('Action ', array([ 6.51700401,  8.33590412], dtype=float32))
('Action ', array([ 8.24625874,  8.16309547], dtype=float32))
('Action ', array([ 6.13018608,  8.365798  ], dtype=float32))
('Action ', array([ 8.2219038 ,  8.15857029], dtype=float32))
('Action ', array([ 7.61386967,  8.48486805], dtype=float32))
('Action ', array([ 8.303545  ,  7.46444607], dtype=float32))
('Action ', array([ 6.33111   ,  6.91388035], dtype=float32))
('Action ', array([ 7.31512642,  8.0970583 ], dtype=float32))
('Action

('Action ', array([ 9.43097305,  9.53388882], dtype=float32))
('Action ', array([ 8.48196507,  8.87912369], dtype=float32))
('Action ', array([ 10.91725826,   8.38667583], dtype=float32))
('Action ', array([ 8.17195225,  8.08257675], dtype=float32))
('Action ', array([ 10.09686756,  10.25773907], dtype=float32))
('Action ', array([ 8.17195225,  8.08257675], dtype=float32))
('Action ', array([ 10.11186314,   9.4071207 ], dtype=float32))
('Action ', array([ 8.17195225,  8.08257675], dtype=float32))
('Action ', array([ 10.13096333,   9.99104786], dtype=float32))
('Action ', array([ 8.10062408,  8.06108952], dtype=float32))
('Action ', array([ 9.96444416,  8.29711437], dtype=float32))
('Action ', array([ 7.26762915,  7.4237566 ], dtype=float32))
('Action ', array([ 10.15111542,   7.94115353], dtype=float32))
('Action ', array([ 7.49152327,  7.41441631], dtype=float32))
('Action ', array([ 9.79744339,  7.49234295], dtype=float32))
('Action ', array([ 6.00717306,  6.219347  ], dtype=float32)

('Action ', array([ 8.73720837,  7.51150131], dtype=float32))
('Action ', array([-0.42606246,  4.33654022], dtype=float32))
('Action ', array([ 9.13860798,  8.08841228], dtype=float32))
('Action ', array([-2.38535762,  9.25566483], dtype=float32))
Episode: 903/5000, score: 28
('Action ', array([ 9.11751652,  9.5982523 ], dtype=float32))
('Action ', array([ 8.2831192 ,  8.29403782], dtype=float32))
('Action ', array([ 9.11751652,  9.5982523 ], dtype=float32))
('Action ', array([ 8.17828941,  7.68221951], dtype=float32))
('Action ', array([ 8.34522629,  9.9333601 ], dtype=float32))
('Action ', array([ 4.95543575,  3.63893819], dtype=float32))
('Action ', array([ 6.65492678,  6.64319038], dtype=float32))
('Action ', array([ 6.6471467 ,  6.65015411], dtype=float32))
('Action ', array([ 4.20657873,  3.19320226], dtype=float32))
('Action ', array([ 6.54049349,  6.67595863], dtype=float32))
('Action ', array([ 5.58575106,  4.9145155 ], dtype=float32))
('Action ', array([ 6.56710577,  6.670862

('Action ', array([ 9.78159904, -5.07355309], dtype=float32))
('Action ', array([ 5.60371304,  6.36219978], dtype=float32))
('Action ', array([ 6.74885654, -0.3691043 ], dtype=float32))
('Action ', array([ 6.62998581,  7.06130886], dtype=float32))
('Action ', array([ 4.34333134, -4.19551659], dtype=float32))
('Action ', array([ 6.62205696,  7.11175442], dtype=float32))
('Action ', array([ 4.62257195, -3.00165749], dtype=float32))
('Action ', array([ 7.68956566,  7.88468361], dtype=float32))
('Action ', array([ 5.24854088,  3.55065346], dtype=float32))
('Action ', array([ 8.18033028,  7.9049778 ], dtype=float32))
('Action ', array([ 8.93791962,  4.51989937], dtype=float32))
('Action ', array([ 9.29777145,  8.65175724], dtype=float32))
('Action ', array([ 5.46934128,  7.096838  ], dtype=float32))
('Action ', array([ 9.37986755,  8.75996685], dtype=float32))
('Action ', array([ 10.73139286,  11.12294197], dtype=float32))
('Action ', array([ 9.68876266,  8.89184475], dtype=float32))
('Acti

('Action ', array([ 8.8756485 ,  9.55160236], dtype=float32))
('Action ', array([ 8.5848732 ,  9.69725895], dtype=float32))
('Action ', array([ 6.40651894,  7.44722033], dtype=float32))
('Action ', array([ 8.495327  ,  9.54766273], dtype=float32))
('Action ', array([ 4.41850185,  7.99869204], dtype=float32))
('Action ', array([ 8.52000237,  9.60209846], dtype=float32))
('Action ', array([ 4.79839802,  8.03044891], dtype=float32))
('Action ', array([ 8.18208885,  9.14197826], dtype=float32))
('Action ', array([ 4.06377602,  8.40682983], dtype=float32))
Episode: 920/5000, score: 8
('Action ', array([ 8.9120779 ,  9.55375099], dtype=float32))
('Action ', array([ 8.2077055 ,  9.53579044], dtype=float32))
('Action ', array([ 8.9120779 ,  9.55375099], dtype=float32))
('Action ', array([ 8.2036562 ,  9.54308414], dtype=float32))
('Action ', array([  8.23243427,  10.29899025], dtype=float32))
('Action ', array([ 7.79892778,  9.09667301], dtype=float32))
('Action ', array([ 4.35158396,  8.26029

('Action ', array([ 9.08521175,  9.41017342], dtype=float32))
('Action ', array([ 8.17099667,  9.47482777], dtype=float32))
('Action ', array([ 9.08521175,  9.41017342], dtype=float32))
('Action ', array([ 8.1338644,  9.4396944], dtype=float32))
('Action ', array([ 11.19248009,  10.67168331], dtype=float32))
('Action ', array([ 8.22687435,  9.73051548], dtype=float32))
('Action ', array([ 8.43358326,  8.30985928], dtype=float32))
('Action ', array([ 8.22999287,  9.71874905], dtype=float32))
('Action ', array([ 8.16606236,  7.59842587], dtype=float32))
('Action ', array([  8.47258663,  10.02698421], dtype=float32))
('Action ', array([ 8.35195732,  7.22932339], dtype=float32))
('Action ', array([ 8.36680126,  9.45336342], dtype=float32))
('Action ', array([ 7.71294165,  5.56267071], dtype=float32))
('Action ', array([ 8.32636547,  9.34967899], dtype=float32))
Episode: 929/5000, score: 13
('Action ', array([ 9.06036186,  9.39358044], dtype=float32))
('Action ', array([ 8.21644974,  8.7680

('Action ', array([ 9.16917038,  9.42735863], dtype=float32))
('Action ', array([ 8.50467968,  9.79576969], dtype=float32))
('Action ', array([ 7.54212427,  7.33414793], dtype=float32))
('Action ', array([ 7.35574102,  7.94270277], dtype=float32))
('Action ', array([ 8.17772388,  9.09006596], dtype=float32))
('Action ', array([ 7.30520153,  7.90151548], dtype=float32))
('Action ', array([ 8.20020008,  8.9751091 ], dtype=float32))
('Action ', array([ 5.93138695,  6.10412931], dtype=float32))
('Action ', array([ 8.19703197,  8.97495651], dtype=float32))
('Action ', array([ 5.74686813,  6.64762831], dtype=float32))
('Action ', array([ 6.95359516,  8.05724907], dtype=float32))
Episode: 940/5000, score: 11
('Action ', array([ 9.17051315,  9.39750004], dtype=float32))
('Action ', array([ 8.0960207,  9.5396328], dtype=float32))
('Action ', array([ 7.61968946,  7.01583672], dtype=float32))
('Action ', array([ 8.59204388,  9.9352169 ], dtype=float32))
('Action ', array([ 7.11765623,  9.35830498

('Action ', array([ 8.40660191,  9.06955814], dtype=float32))
('Action ', array([ 6.81087971,  9.70875549], dtype=float32))
('Action ', array([ 8.35873318,  8.90410233], dtype=float32))
('Action ', array([ 2.2253449 ,  2.17511344], dtype=float32))
('Action ', array([ 7.98302746,  8.03577709], dtype=float32))
Episode: 948/5000, score: 29
('Action ', array([ 9.2478838 ,  9.45257378], dtype=float32))
('Action ', array([ 8.11936951,  8.87802601], dtype=float32))
('Action ', array([  9.69305706,  11.69769859], dtype=float32))
('Action ', array([ 8.1444912 ,  8.86168766], dtype=float32))
('Action ', array([  7.29044056,  11.2178669 ], dtype=float32))
('Action ', array([ 7.83220291,  8.20503235], dtype=float32))
('Action ', array([  6.64110756,  11.03137398], dtype=float32))
('Action ', array([ 7.8862114 ,  8.20184422], dtype=float32))
('Action ', array([ 3.57212448,  8.95886803], dtype=float32))
('Action ', array([ 8.08400822,  8.36229706], dtype=float32))
Episode: 949/5000, score: 9
('Actio

('Action ', array([ 8.54738712,  9.36708832], dtype=float32))
('Action ', array([ 8.28363514,  7.27575874], dtype=float32))
('Action ', array([ 8.61808681,  9.34619331], dtype=float32))
('Action ', array([ 9.63074875,  7.67559242], dtype=float32))
('Action ', array([ 8.64822865,  9.27872562], dtype=float32))
('Action ', array([ 11.3013525 ,   5.08020973], dtype=float32))
('Action ', array([ 8.58104229,  8.73069954], dtype=float32))
('Action ', array([ 9.43802261,  1.9511013 ], dtype=float32))
('Action ', array([ 8.55575085,  8.92471313], dtype=float32))
('Action ', array([ 11.08841705,   7.80840874], dtype=float32))
('Action ', array([ 8.48805523,  8.63396835], dtype=float32))
('Action ', array([ 12.18681335,   6.84868431], dtype=float32))
('Action ', array([ 8.71515942,  8.86413765], dtype=float32))
('Action ', array([ 14.60683727,   2.15308952], dtype=float32))
('Action ', array([ 9.10200214,  9.11847687], dtype=float32))
('Action ', array([ 13.02711296,   0.18031123], dtype=float32)

('Action ', array([ 9.13415623,  9.38156033], dtype=float32))
('Action ', array([ 8.05478001,  8.83010292], dtype=float32))
('Action ', array([ 8.12916183,  8.9883337 ], dtype=float32))
('Action ', array([ 8.03501701,  8.86640644], dtype=float32))
('Action ', array([ 7.41678095,  7.57256031], dtype=float32))
('Action ', array([ 8.3185873,  9.1300602], dtype=float32))
('Action ', array([ 5.78179026,  6.67966366], dtype=float32))
('Action ', array([ 8.26174259,  8.90394974], dtype=float32))
Episode: 968/5000, score: 7
('Action ', array([ 9.13931751,  9.36347008], dtype=float32))
('Action ', array([ 8.42717361,  8.97367191], dtype=float32))
('Action ', array([ 9.21614075,  9.25545311], dtype=float32))
('Action ', array([ 8.11737156,  8.18340778], dtype=float32))
('Action ', array([ 9.37848282,  9.07839394], dtype=float32))
('Action ', array([ 8.41467571,  8.21008396], dtype=float32))
('Action ', array([ 8.39066315,  7.6076889 ], dtype=float32))
('Action ', array([ 8.23266697,  6.31832695]

('Action ', array([  3.55566192,  12.05875874], dtype=float32))
Episode: 976/5000, score: 26
('Action ', array([ 9.07838821,  9.28570652], dtype=float32))
('Action ', array([ 7.98650312,  8.61784267], dtype=float32))
('Action ', array([ 9.07838821,  9.28570652], dtype=float32))
('Action ', array([ 7.97171545,  8.56216717], dtype=float32))
('Action ', array([ 8.57672882,  6.055511  ], dtype=float32))
('Action ', array([ 7.5392127 ,  7.62213373], dtype=float32))
('Action ', array([ 7.433393  ,  7.52097845], dtype=float32))
('Action ', array([ 9.77472878,  7.63500547], dtype=float32))
('Action ', array([ 7.48845434,  7.62396193], dtype=float32))
('Action ', array([ 7.67039824,  3.7547605 ], dtype=float32))
('Action ', array([ 5.96270323,  6.53421545], dtype=float32))
('Action ', array([ 4.72489214,  0.30145991], dtype=float32))
('Action ', array([ 6.40288401,  6.56818438], dtype=float32))
('Action ', array([ 4.29895067,  0.07555736], dtype=float32))
Episode: 977/5000, score: 14
('Action '

('Action ', array([ 9.01191902,  9.25094509], dtype=float32))
('Action ', array([ 8.42481518,  8.99478912], dtype=float32))
('Action ', array([ 7.86506653,  6.86091137], dtype=float32))
('Action ', array([ 8.45338917,  9.01931763], dtype=float32))
('Action ', array([ 6.8181653,  7.2457571], dtype=float32))
('Action ', array([ 8.11805725,  8.21313858], dtype=float32))
('Action ', array([ 7.54393291,  9.071311  ], dtype=float32))
('Action ', array([ 7.96866131,  7.96017361], dtype=float32))
('Action ', array([ 5.70684814,  6.51041698], dtype=float32))
('Action ', array([ 7.40541172,  7.10660362], dtype=float32))
('Action ', array([ 2.26327991, -2.00401759], dtype=float32))
('Action ', array([ 7.4100914 ,  6.95585442], dtype=float32))
('Action ', array([ 2.14264774, -2.27706599], dtype=float32))
Episode: 984/5000, score: 13
('Action ', array([ 9.00126743,  9.2633934 ], dtype=float32))
('Action ', array([ 8.04548645,  7.80938005], dtype=float32))
('Action ', array([ 8.4671545 ,  9.30999374

('Action ', array([  7.76967621,  11.89573193], dtype=float32))
('Action ', array([ 7.96278954,  7.33016253], dtype=float32))
('Action ', array([ 11.17315865,   7.11131525], dtype=float32))
('Action ', array([ 8.24093151,  7.54159975], dtype=float32))
('Action ', array([ 6.02576733,  6.58243036], dtype=float32))
('Action ', array([ 8.53996754,  7.90268564], dtype=float32))
('Action ', array([ 4.42352772,  3.91424823], dtype=float32))
('Action ', array([ 4.38708782,  0.09308124], dtype=float32))
('Action ', array([ 9.2784338 ,  8.14430809], dtype=float32))
('Action ', array([ 6.80634594,  0.62392306], dtype=float32))
('Action ', array([ 9.091712  ,  7.72631407], dtype=float32))
('Action ', array([ 4.63771152,  7.82731867], dtype=float32))
('Action ', array([ 9.13708591,  7.8041234 ], dtype=float32))
('Action ', array([  0.20974079,  12.51237392], dtype=float32))
('Action ', array([ 9.45519161,  7.61941385], dtype=float32))
('Action ', array([  2.6069634,  12.1347723], dtype=float32))
('

('Action ', array([ 9.02525139,  9.11269951], dtype=float32))
('Action ', array([ 8.14615631,  7.80670691], dtype=float32))
('Action ', array([ 9.02525139,  9.11269951], dtype=float32))
('Action ', array([ 8.14615631,  7.80670691], dtype=float32))
('Action ', array([ 9.02525139,  9.11269951], dtype=float32))
('Action ', array([ 8.14615631,  7.80670691], dtype=float32))
('Action ', array([ 8.33893681,  7.90112925], dtype=float32))
('Action ', array([ 8.14615631,  7.80670691], dtype=float32))
('Action ', array([ 9.02525139,  9.11269951], dtype=float32))
('Action ', array([ 8.14615631,  7.80670691], dtype=float32))
('Action ', array([ 9.02525139,  9.11269951], dtype=float32))
('Action ', array([ 8.11342716,  7.78063726], dtype=float32))
('Action ', array([ 9.02525139,  9.11269951], dtype=float32))
('Action ', array([ 8.13289833,  7.80881071], dtype=float32))
('Action ', array([ 9.02525139,  9.11269951], dtype=float32))
('Action ', array([ 8.14615631,  7.80670691], dtype=float32))
('Action

('Action ', array([ 8.92146015,  9.09078217], dtype=float32))
('Action ', array([ 8.06755733,  8.31204796], dtype=float32))
('Action ', array([ 7.97375107,  9.41399574], dtype=float32))
('Action ', array([ 8.17135429,  8.30400085], dtype=float32))
('Action ', array([ 6.90459394,  6.72995234], dtype=float32))
('Action ', array([ 5.86454201,  7.12644529], dtype=float32))
('Action ', array([ 6.85469294,  6.76912546], dtype=float32))
('Action ', array([ 3.38717437,  4.89616728], dtype=float32))
Episode: 1001/5000, score: 8
('Action ', array([ 8.92604446,  9.08840084], dtype=float32))
('Action ', array([ 8.36805916,  8.40826035], dtype=float32))
('Action ', array([ 8.10809994,  8.93706226], dtype=float32))
('Action ', array([ 8.33990669,  8.21922016], dtype=float32))
('Action ', array([  8.37033653,  10.31963444], dtype=float32))
('Action ', array([ 8.29520988,  8.28304863], dtype=float32))
('Action ', array([ 8.30704975,  9.59871387], dtype=float32))
('Action ', array([ 8.30907631,  7.6814

('Action ', array([  9.64614201,  11.14312363], dtype=float32))
('Action ', array([ 8.9789381 ,  9.04821873], dtype=float32))
('Action ', array([ 8.03994179,  7.50326538], dtype=float32))
('Action ', array([ 8.9789381 ,  9.04821873], dtype=float32))
('Action ', array([ 8.03994179,  7.50326538], dtype=float32))
('Action ', array([ 9.18649673,  8.34328747], dtype=float32))
('Action ', array([ 8.1114645 ,  7.57229519], dtype=float32))
('Action ', array([ 9.18649673,  8.34328747], dtype=float32))
('Action ', array([ 8.1114645 ,  7.57229519], dtype=float32))
('Action ', array([ 9.19726944,  8.38675594], dtype=float32))
('Action ', array([ 7.8037219 ,  7.27849483], dtype=float32))
('Action ', array([ 10.37539959,   8.52113724], dtype=float32))
('Action ', array([ 7.72746801,  7.32871628], dtype=float32))
('Action ', array([ 9.75104713,  5.76667786], dtype=float32))
Episode: 1007/5000, score: 12
('Action ', array([ 8.95504665,  9.04794216], dtype=float32))
('Action ', array([ 8.01642799,  7.4

('Action ', array([ 7.72793531,  7.65857267], dtype=float32))
('Action ', array([ 7.07726717,  6.80279684], dtype=float32))
('Action ', array([ 7.66298056,  7.47738791], dtype=float32))
Episode: 1013/5000, score: 27
('Action ', array([ 8.77100849,  8.97676945], dtype=float32))
('Action ', array([ 7.76200914,  7.35878801], dtype=float32))
('Action ', array([ 8.77100849,  8.97676945], dtype=float32))
('Action ', array([ 7.76200914,  7.35878801], dtype=float32))
('Action ', array([ 8.77100849,  8.97676945], dtype=float32))
('Action ', array([ 7.76200914,  7.35878801], dtype=float32))
('Action ', array([ 9.20949364,  9.61653709], dtype=float32))
('Action ', array([ 7.84946489,  7.31762457], dtype=float32))
('Action ', array([ 9.00167465,  9.1761055 ], dtype=float32))
('Action ', array([ 7.85071707,  7.34572649], dtype=float32))
('Action ', array([ 8.98539925,  7.78527308], dtype=float32))
('Action ', array([ 7.82071257,  7.38271666], dtype=float32))
('Action ', array([ 8.27582264,  7.75578

('Action ', array([ 8.02365589,  8.81741619], dtype=float32))
('Action ', array([ 8.15118027,  5.14149475], dtype=float32))
('Action ', array([ 7.6575551 ,  7.72878361], dtype=float32))
('Action ', array([ 7.0286088,  4.8515358], dtype=float32))
('Action ', array([ 7.65873766,  7.75571156], dtype=float32))
('Action ', array([ 8.82790852,  5.73881531], dtype=float32))
('Action ', array([ 7.64962816,  7.6759758 ], dtype=float32))
('Action ', array([ 9.49545574,  6.83270645], dtype=float32))
('Action ', array([ 7.4486928 ,  7.41049671], dtype=float32))
('Action ', array([ 11.10725498,   0.76142478], dtype=float32))
('Action ', array([ 7.79140425,  7.53530502], dtype=float32))
('Action ', array([ 10.61009789,   3.38821006], dtype=float32))
('Action ', array([ 7.86010599,  7.70207405], dtype=float32))
Episode: 1020/5000, score: 37
('Action ', array([ 8.78667068,  8.92281055], dtype=float32))
('Action ', array([ 7.67455721,  7.53746462], dtype=float32))
('Action ', array([ 7.67455721,  7.537

('Action ', array([ 8.62600422,  8.96938992], dtype=float32))
('Action ', array([ 7.47269583,  7.54343414], dtype=float32))
('Action ', array([ 9.3410759 ,  9.40278721], dtype=float32))
('Action ', array([ 7.47269583,  7.54343414], dtype=float32))
('Action ', array([ 8.77282238,  9.18200111], dtype=float32))
('Action ', array([ 7.36153078,  7.0993309 ], dtype=float32))
('Action ', array([ 5.88873816,  7.66054344], dtype=float32))
('Action ', array([ 7.22249651,  6.9354887 ], dtype=float32))
('Action ', array([ 1.76197016,  6.32551765], dtype=float32))
('Action ', array([ 7.01867628,  6.75511265], dtype=float32))
('Action ', array([-3.22766161,  1.74200618], dtype=float32))
Episode: 1027/5000, score: 10
('Action ', array([ 8.61267281,  8.97363949], dtype=float32))
('Action ', array([ 7.4544425 ,  7.55422831], dtype=float32))
('Action ', array([ 8.61267281,  8.97363949], dtype=float32))
('Action ', array([ 7.4544425 ,  7.55422831], dtype=float32))
('Action ', array([ 9.098876  ,  9.59695

('Action ', array([ 8.08765602,  8.02090073], dtype=float32))
('Action ', array([ 4.67984295, -2.10068774], dtype=float32))
('Action ', array([ 8.22455692,  7.88573933], dtype=float32))
('Action ', array([ 0.88999659, -4.27120113], dtype=float32))
Episode: 1035/5000, score: 28
('Action ', array([ 8.69491959,  8.68879414], dtype=float32))
('Action ', array([ 7.30415154,  7.5604248 ], dtype=float32))
('Action ', array([ 8.22377682,  8.25388336], dtype=float32))
('Action ', array([ 7.30577469,  7.559062  ], dtype=float32))
('Action ', array([ 8.0810318 ,  8.20960426], dtype=float32))
('Action ', array([ 7.34713459,  7.59866524], dtype=float32))
('Action ', array([ 10.62857151,   6.10757065], dtype=float32))
('Action ', array([ 5.63909721,  6.36308098], dtype=float32))
('Action ', array([ 10.512537  ,   4.93592072], dtype=float32))
('Action ', array([ 5.57635021,  6.28889751], dtype=float32))
('Action ', array([ 11.82384872,   4.95284271], dtype=float32))
('Action ', array([ 7.10406399,  7

('Action ', array([ 8.66240215,  8.52910805], dtype=float32))
('Action ', array([ 7.27735186,  7.64248037], dtype=float32))
('Action ', array([ 7.82523251,  8.15441608], dtype=float32))
('Action ', array([ 7.2890811 ,  7.63425875], dtype=float32))
('Action ', array([ 7.88941002,  7.79076815], dtype=float32))
('Action ', array([ 7.60677958,  7.62719393], dtype=float32))
('Action ', array([ 7.80724764,  7.25820017], dtype=float32))
('Action ', array([ 7.68734789,  7.64783716], dtype=float32))
('Action ', array([ 8.10365868,  7.52009821], dtype=float32))
('Action ', array([ 7.68898153,  7.61853552], dtype=float32))
('Action ', array([ 7.87963963,  7.78208399], dtype=float32))
('Action ', array([ 7.61403704,  7.59660482], dtype=float32))
('Action ', array([ 7.96894455,  7.77421808], dtype=float32))
('Action ', array([ 7.83625841,  8.54424286], dtype=float32))
('Action ', array([ 8.60988045,  8.73742199], dtype=float32))
('Action ', array([ 7.28451967,  8.17195511], dtype=float32))
('Action

('Action ', array([ 8.67609024,  8.39919662], dtype=float32))
('Action ', array([ 7.39083958,  7.85689306], dtype=float32))
('Action ', array([ 9.45167446,  9.39812565], dtype=float32))
('Action ', array([ 7.44993687,  7.911551  ], dtype=float32))
('Action ', array([ 9.96199799,  9.64812946], dtype=float32))
('Action ', array([ 7.44993687,  7.911551  ], dtype=float32))
('Action ', array([ 9.96199799,  9.64812946], dtype=float32))
('Action ', array([ 7.44993687,  7.911551  ], dtype=float32))
('Action ', array([ 9.96199799,  9.64812946], dtype=float32))
('Action ', array([ 7.44993687,  7.911551  ], dtype=float32))
('Action ', array([ 9.96199799,  9.64812946], dtype=float32))
('Action ', array([ 7.44993687,  7.911551  ], dtype=float32))
('Action ', array([ 9.96199799,  9.64812946], dtype=float32))
('Action ', array([ 7.44993687,  7.911551  ], dtype=float32))
('Action ', array([ 9.96199799,  9.64812946], dtype=float32))
('Action ', array([ 7.44993687,  7.911551  ], dtype=float32))
('Action

('Action ', array([ 8.66383266,  8.24538803], dtype=float32))
('Action ', array([ 8.66383266,  8.24538803], dtype=float32))
('Action ', array([ 7.31165123,  8.05209541], dtype=float32))
('Action ', array([ 8.85008144,  8.08896255], dtype=float32))
('Action ', array([ 7.28389645,  8.06659985], dtype=float32))
('Action ', array([ 8.81153774,  8.56788731], dtype=float32))
('Action ', array([ 6.89045429,  7.74271727], dtype=float32))
('Action ', array([ 8.51336861,  7.35826349], dtype=float32))
('Action ', array([ 6.64398098,  7.60839701], dtype=float32))
('Action ', array([ 9.10730839,  8.72501278], dtype=float32))
('Action ', array([ 6.70196629,  7.65818071], dtype=float32))
('Action ', array([ 9.38739109,  9.59047604], dtype=float32))
('Action ', array([ 6.70196915,  7.66294432], dtype=float32))
('Action ', array([ 9.25890541,  8.98707104], dtype=float32))
('Action ', array([ 6.70196629,  7.65818071], dtype=float32))
('Action ', array([ 9.06100178,  8.77488613], dtype=float32))
('Action

('Action ', array([ 8.72311592,  8.33289051], dtype=float32))
('Action ', array([ 7.2408638 ,  8.71338081], dtype=float32))
('Action ', array([ 9.48401165,  8.72078609], dtype=float32))
('Action ', array([ 7.2408638 ,  8.71338081], dtype=float32))
('Action ', array([ 9.48401165,  8.72078609], dtype=float32))
('Action ', array([ 7.2408638 ,  8.71338081], dtype=float32))
('Action ', array([ 9.06009483,  7.75543261], dtype=float32))
('Action ', array([ 7.2408638 ,  8.71338081], dtype=float32))
('Action ', array([ 8.93217659,  8.82226086], dtype=float32))
('Action ', array([ 7.2408638 ,  8.71338081], dtype=float32))
('Action ', array([ 8.9325285 ,  8.85204792], dtype=float32))
('Action ', array([ 7.2408638 ,  8.71338081], dtype=float32))
('Action ', array([ 7.2408638 ,  8.71338081], dtype=float32))
('Action ', array([ 8.9384737 ,  8.79210186], dtype=float32))
('Action ', array([ 7.24575138,  8.7309103 ], dtype=float32))
('Action ', array([ 8.59972   ,  8.98722553], dtype=float32))
('Action

('Action ', array([ 8.69774055,  8.45692348], dtype=float32))
('Action ', array([ 7.18251276,  8.77788353], dtype=float32))
('Action ', array([ 9.66306591,  9.44359779], dtype=float32))
('Action ', array([ 7.18251276,  8.77788353], dtype=float32))
('Action ', array([ 7.18016863,  8.76406479], dtype=float32))
('Action ', array([ 7.64062452,  9.23258114], dtype=float32))
('Action ', array([ 7.1479249,  8.7843008], dtype=float32))
('Action ', array([ 7.51636887,  8.88708973], dtype=float32))
('Action ', array([ 7.65855265,  9.10736179], dtype=float32))
('Action ', array([  5.49657869,  10.96665478], dtype=float32))
('Action ', array([ 7.59453058,  8.80722427], dtype=float32))
('Action ', array([  5.49091768,  10.06790447], dtype=float32))
('Action ', array([ 6.0824542 ,  7.29796457], dtype=float32))
('Action ', array([ 3.94379306,  8.0318861 ], dtype=float32))
Episode: 1068/5000, score: 14
('Action ', array([ 8.70735359,  8.43733883], dtype=float32))
('Action ', array([ 6.94255352,  7.948

('Action ', array([ 3.05029917,  3.01826262], dtype=float32))
('Action ', array([ 7.1832366,  8.227561 ], dtype=float32))
Episode: 1074/5000, score: 27
('Action ', array([ 8.79361629,  8.39190006], dtype=float32))
('Action ', array([ 7.26808929,  8.27841854], dtype=float32))
('Action ', array([ 9.33705997,  9.56916428], dtype=float32))
('Action ', array([ 7.26808929,  8.27841854], dtype=float32))
('Action ', array([ 10.58708477,   7.09561777], dtype=float32))
('Action ', array([ 7.38446045,  8.34707546], dtype=float32))
('Action ', array([ 9.94704342,  8.74470234], dtype=float32))
('Action ', array([ 7.39954472,  8.3374033 ], dtype=float32))
('Action ', array([ 9.25023842,  8.17922211], dtype=float32))
('Action ', array([ 7.39774418,  8.34123993], dtype=float32))
('Action ', array([ 9.63995838,  9.06401253], dtype=float32))
('Action ', array([ 7.42189693,  8.31794739], dtype=float32))
('Action ', array([ 9.9744463 ,  9.64789772], dtype=float32))
('Action ', array([ 7.11147213,  7.89540

('Action ', array([ 8.77421093,  8.57077789], dtype=float32))
('Action ', array([ 7.33793449,  8.32173634], dtype=float32))
('Action ', array([ 8.77421093,  8.57077789], dtype=float32))
('Action ', array([ 7.33793449,  8.32173634], dtype=float32))
('Action ', array([ 9.30744076,  8.92068863], dtype=float32))
('Action ', array([ 7.33793449,  8.32173634], dtype=float32))
('Action ', array([ 7.88913536,  8.62065792], dtype=float32))
('Action ', array([ 7.33793449,  8.32173634], dtype=float32))
('Action ', array([ 9.30744076,  8.92068863], dtype=float32))
('Action ', array([ 7.33793449,  8.32173634], dtype=float32))
('Action ', array([ 9.30744076,  8.92068863], dtype=float32))
('Action ', array([ 7.3378458 ,  8.31559467], dtype=float32))
('Action ', array([ 9.30744076,  8.92068863], dtype=float32))
('Action ', array([ 7.33542442,  8.32196999], dtype=float32))
('Action ', array([ 9.30744076,  8.92068863], dtype=float32))
('Action ', array([ 7.33542442,  8.32196999], dtype=float32))
('Action

('Action ', array([ 7.83407021,  9.48148727], dtype=float32))
('Action ', array([ 10.31283951,   8.29242229], dtype=float32))
('Action ', array([ 7.82649422,  9.46575928], dtype=float32))
('Action ', array([ 9.762146  ,  8.25552654], dtype=float32))
('Action ', array([ 7.83288193,  9.47029018], dtype=float32))
('Action ', array([ 9.91422462,  7.34457302], dtype=float32))
('Action ', array([ 7.77810287,  9.48352814], dtype=float32))
('Action ', array([ 8.6050663 ,  6.43601513], dtype=float32))
('Action ', array([ 7.77189827,  9.42919827], dtype=float32))
('Action ', array([ 7.51695061,  5.86915493], dtype=float32))
('Action ', array([ 7.73196602,  9.39165211], dtype=float32))
('Action ', array([ 5.84363651,  4.51062679], dtype=float32))
Episode: 1087/5000, score: 36
('Action ', array([ 8.94562912,  8.55480766], dtype=float32))
('Action ', array([ 7.4294343 ,  8.83108425], dtype=float32))
('Action ', array([ 9.66481018,  8.5458231 ], dtype=float32))
('Action ', array([ 7.4294343 ,  8.831

('Action ', array([ 8.87721825,  8.62793827], dtype=float32))
('Action ', array([ 7.68946505,  8.83570099], dtype=float32))
('Action ', array([ 9.65933132,  9.21765327], dtype=float32))
('Action ', array([ 7.68946505,  8.83570099], dtype=float32))
('Action ', array([ 9.65858555,  9.22385597], dtype=float32))
('Action ', array([ 7.68946505,  8.83570099], dtype=float32))
('Action ', array([ 7.68946505,  8.83570099], dtype=float32))
('Action ', array([ 8.91725063,  9.3298378 ], dtype=float32))
('Action ', array([ 7.68946505,  8.83570099], dtype=float32))
('Action ', array([ 9.9810648 ,  9.87713432], dtype=float32))
('Action ', array([ 7.55439043,  8.69965267], dtype=float32))
('Action ', array([ 9.98072147,  9.8768692 ], dtype=float32))
('Action ', array([ 7.77586508,  8.82299423], dtype=float32))
('Action ', array([ 8.24712753,  8.56640625], dtype=float32))
('Action ', array([ 7.97565126,  8.32181931], dtype=float32))
('Action ', array([ 8.1019907 ,  7.95119095], dtype=float32))
('Action

('Action ', array([ 8.4833231 ,  8.53899574], dtype=float32))
('Action ', array([ 6.93879557,  9.38021088], dtype=float32))
('Action ', array([ 8.44613171,  8.66403008], dtype=float32))
('Action ', array([ 6.76094675,  2.4908905 ], dtype=float32))
('Action ', array([ 8.57323933,  8.99265862], dtype=float32))
('Action ', array([ 7.29218721,  8.02735901], dtype=float32))
('Action ', array([ 7.31006765,  8.17464447], dtype=float32))
('Action ', array([ 8.72702312,  9.03076172], dtype=float32))
('Action ', array([ 8.53944206,  5.53387451], dtype=float32))
('Action ', array([ 8.63390064,  8.34158993], dtype=float32))
('Action ', array([ 9.28505707, -3.50282669], dtype=float32))
('Action ', array([ 8.45863438,  7.77963448], dtype=float32))
Episode: 1099/5000, score: 37
('Action ', array([ 8.94453335,  8.58320713], dtype=float32))
('Action ', array([ 7.59550714,  8.47494411], dtype=float32))
('Action ', array([ 9.29179764,  5.70882845], dtype=float32))
('Action ', array([ 7.59039068,  8.47946

('Action ', array([ 8.92518997,  8.62612629], dtype=float32))
('Action ', array([ 7.4534688,  7.5513854], dtype=float32))
('Action ', array([ 9.61873627,  8.40649414], dtype=float32))
('Action ', array([ 7.4534688,  7.5513854], dtype=float32))
('Action ', array([ 9.56139946,  8.44983959], dtype=float32))
('Action ', array([ 7.46852922,  7.54208899], dtype=float32))
('Action ', array([ 9.56139946,  8.44983959], dtype=float32))
('Action ', array([ 7.5187068 ,  7.49905539], dtype=float32))
('Action ', array([ 9.56139946,  8.44983959], dtype=float32))
('Action ', array([ 7.47674131,  7.48756456], dtype=float32))
('Action ', array([ 10.91218376,   8.86863995], dtype=float32))
('Action ', array([ 7.45895529,  7.46017122], dtype=float32))
('Action ', array([ 10.00425911,   7.07415628], dtype=float32))
('Action ', array([ 7.14775705,  7.29601145], dtype=float32))
('Action ', array([ 10.87646675,   8.24709988], dtype=float32))
('Action ', array([ 7.14775896,  7.30187654], dtype=float32))
('Acti

Episode: 1109/5000, score: 24
('Action ', array([ 8.73793697,  8.86347198], dtype=float32))
('Action ', array([ 8.01733112,  8.46497726], dtype=float32))
('Action ', array([ 8.82038116,  8.94628525], dtype=float32))
('Action ', array([ 7.37049532,  7.4858079 ], dtype=float32))
('Action ', array([ 9.57960129,  8.9577179 ], dtype=float32))
('Action ', array([ 7.44023085,  7.5413928 ], dtype=float32))
('Action ', array([ 7.49272394,  6.80026674], dtype=float32))
('Action ', array([ 8.43699837,  7.07173491], dtype=float32))
('Action ', array([ 6.11980772,  5.81800508], dtype=float32))
('Action ', array([ 6.14067221,  5.90662813], dtype=float32))
('Action ', array([ 8.68719769,  6.15853071], dtype=float32))
('Action ', array([ 7.51285028,  6.90490103], dtype=float32))
('Action ', array([ 9.16004753,  7.21805143], dtype=float32))
('Action ', array([ 7.46059465,  7.39493322], dtype=float32))
('Action ', array([ 9.65531635,  9.25395966], dtype=float32))
('Action ', array([ 7.74936247,  7.77982

('Action ', array([ 7.21973515,  6.83177662], dtype=float32))
('Action ', array([ 7.03055763,  5.0465498 ], dtype=float32))
('Action ', array([ 7.20280457,  6.96458149], dtype=float32))
('Action ', array([ 6.26433182,  4.30768108], dtype=float32))
('Action ', array([ 7.23939323,  6.92500114], dtype=float32))
('Action ', array([ 6.06282234,  5.41403103], dtype=float32))
('Action ', array([ 7.38226509,  7.00523281], dtype=float32))
('Action ', array([ 8.64636898,  6.97646618], dtype=float32))
('Action ', array([ 6.86798668,  7.12455654], dtype=float32))
('Action ', array([ 8.57146072,  7.02198696], dtype=float32))
('Action ', array([ 7.79274368,  7.54506969], dtype=float32))
('Action ', array([ 3.62741089, -0.23019505], dtype=float32))
('Action ', array([ 8.12824535,  7.62152672], dtype=float32))
('Action ', array([-6.10326958, -5.30621052], dtype=float32))
Episode: 1117/5000, score: 38
('Action ', array([ 8.57019997,  8.86946583], dtype=float32))
('Action ', array([ 8.08552456,  8.82743

('Action ', array([ 8.50481224,  8.85359287], dtype=float32))
('Action ', array([ 7.59171247,  7.87616873], dtype=float32))
('Action ', array([ 9.24738216,  9.08995724], dtype=float32))
('Action ', array([ 7.59171247,  7.87616873], dtype=float32))
('Action ', array([ 9.24738216,  9.08995724], dtype=float32))
('Action ', array([ 7.6118083 ,  7.27161169], dtype=float32))
('Action ', array([ 9.0590086 ,  8.68096733], dtype=float32))
('Action ', array([ 9.24738216,  9.08995724], dtype=float32))
('Action ', array([ 7.59422731,  7.8759408 ], dtype=float32))
('Action ', array([ 8.60464191,  8.94901943], dtype=float32))
('Action ', array([ 7.58593416,  7.85438585], dtype=float32))
('Action ', array([ 8.50481224,  8.85359287], dtype=float32))
('Action ', array([ 7.66260099,  7.78901052], dtype=float32))
('Action ', array([ 8.44841003,  7.83458567], dtype=float32))
('Action ', array([ 7.63915014,  7.84473372], dtype=float32))
('Action ', array([ 8.58309555,  8.21515179], dtype=float32))
('Action

('Action ', array([ 7.76750278,  8.10882664], dtype=float32))
('Action ', array([ 3.31730175,  3.96127629], dtype=float32))
Episode: 1132/5000, score: 26
('Action ', array([ 8.47604942,  8.86243725], dtype=float32))
('Action ', array([ 7.59223652,  7.97628593], dtype=float32))
('Action ', array([ 8.47604942,  8.86243725], dtype=float32))
('Action ', array([ 7.59411812,  7.97276592], dtype=float32))
('Action ', array([ 8.85998154,  8.76021481], dtype=float32))
('Action ', array([ 7.55273628,  7.45316601], dtype=float32))
('Action ', array([ 4.56800175,  3.58263874], dtype=float32))
('Action ', array([ 6.18259525,  6.51528454], dtype=float32))
('Action ', array([ 4.65902901,  3.49120045], dtype=float32))
('Action ', array([ 6.11728859,  6.46635723], dtype=float32))
('Action ', array([ 4.97893715,  3.55809498], dtype=float32))
('Action ', array([ 6.13650322,  6.46088791], dtype=float32))
('Action ', array([ 4.97893715,  3.55809498], dtype=float32))
('Action ', array([ 4.94104385,  3.54016

('Action ', array([ 8.57737732,  8.84712601], dtype=float32))
('Action ', array([ 7.62109518,  8.09134007], dtype=float32))
('Action ', array([ 8.5666256 ,  8.89685726], dtype=float32))
('Action ', array([ 7.60185099,  8.06515598], dtype=float32))
('Action ', array([ 7.59390306,  7.43783236], dtype=float32))
('Action ', array([ 5.20410013,  1.65916407], dtype=float32))
('Action ', array([ 6.457726  ,  6.50274992], dtype=float32))
('Action ', array([ 6.07560349,  2.34276152], dtype=float32))
('Action ', array([ 6.35175562,  6.41696405], dtype=float32))
('Action ', array([ 3.22993541,  1.23444331], dtype=float32))
('Action ', array([ 5.84256124,  5.92548895], dtype=float32))
('Action ', array([-0.48995528, -0.77942693], dtype=float32))
Episode: 1141/5000, score: 12
('Action ', array([ 8.65062428,  8.81701756], dtype=float32))
('Action ', array([ 8.08340645,  9.22218609], dtype=float32))
('Action ', array([ 10.84795094,  10.3307724 ], dtype=float32))
('Action ', array([ 7.81207514,  8.844

('Action ', array([ 8.64678097,  8.77846909], dtype=float32))
('Action ', array([ 7.6660018 ,  8.00724506], dtype=float32))
('Action ', array([ 8.64678097,  8.77846909], dtype=float32))
('Action ', array([ 7.64423704,  7.98143005], dtype=float32))
('Action ', array([ 7.63693857,  7.35090542], dtype=float32))
('Action ', array([ 7.65214825,  4.00576973], dtype=float32))
('Action ', array([ 6.373631  ,  6.31175137], dtype=float32))
('Action ', array([ 7.39274549,  4.05433083], dtype=float32))
('Action ', array([ 6.373631  ,  6.31175137], dtype=float32))
('Action ', array([ 7.2062273 ,  4.04292488], dtype=float32))
('Action ', array([ 7.8152318 ,  7.24100876], dtype=float32))
('Action ', array([ 9.26607513,  6.29948235], dtype=float32))
('Action ', array([ 7.81322908,  7.86747265], dtype=float32))
('Action ', array([ 9.49008083,  5.9420948 ], dtype=float32))
('Action ', array([ 7.79417562,  7.8776226 ], dtype=float32))
('Action ', array([ 8.90773773,  5.67806435], dtype=float32))
('Action

('Action ', array([ 8.79266644,  8.83721638], dtype=float32))
('Action ', array([ 7.68914747,  7.73253632], dtype=float32))
('Action ', array([ 8.79266644,  8.83721638], dtype=float32))
('Action ', array([ 7.68663549,  7.73276329], dtype=float32))
('Action ', array([ 9.91859531,  9.29322433], dtype=float32))
('Action ', array([ 7.77280283,  7.79676151], dtype=float32))
('Action ', array([ 9.3944416 ,  8.63075638], dtype=float32))
('Action ', array([ 7.52291727,  7.41312122], dtype=float32))
('Action ', array([ 7.48254824,  8.71458435], dtype=float32))
('Action ', array([ 7.52471399,  7.45322037], dtype=float32))
('Action ', array([ 7.03949881,  7.34009552], dtype=float32))
('Action ', array([ 7.43767595,  7.3992157 ], dtype=float32))
('Action ', array([ 7.13677645,  7.20842743], dtype=float32))
('Action ', array([ 7.51136923,  7.41613483], dtype=float32))
('Action ', array([ 5.79243422,  7.919487  ], dtype=float32))
('Action ', array([ 1.59279323,  1.5029372 ], dtype=float32))
Episode:

('Action ', array([ 9.08521366,  7.08491373], dtype=float32))
('Action ', array([ 7.99199629,  7.89350939], dtype=float32))
('Action ', array([ 10.34211826,   7.57491922], dtype=float32))
('Action ', array([ 8.06210327,  8.04109192], dtype=float32))
('Action ', array([ 9.61726761,  9.51136303], dtype=float32))
('Action ', array([ 8.63727951,  8.04523087], dtype=float32))
('Action ', array([ 7.68638277,  8.10222149], dtype=float32))
('Action ', array([ 8.29486465,  7.84333086], dtype=float32))
('Action ', array([  8.61063766,  11.44479656], dtype=float32))
('Action ', array([ 8.29662323,  7.84430933], dtype=float32))
('Action ', array([  8.9166441 ,  10.89770031], dtype=float32))
('Action ', array([ 8.32109642,  7.82054663], dtype=float32))
('Action ', array([ 9.29575062,  7.09254694], dtype=float32))
('Action ', array([ 8.27175236,  7.81537867], dtype=float32))
('Action ', array([ 7.46190882,  8.41548443], dtype=float32))
('Action ', array([ 8.06335354,  7.58743906], dtype=float32))
('

('Action ', array([ 8.66961956,  8.63495636], dtype=float32))
('Action ', array([ 7.56640816,  8.26405334], dtype=float32))
('Action ', array([ 10.09783745,   9.02684593], dtype=float32))
('Action ', array([ 7.55261898,  8.24245167], dtype=float32))
('Action ', array([  9.08488464,  10.16363049], dtype=float32))
('Action ', array([ 7.55261898,  8.24245167], dtype=float32))
('Action ', array([ 9.04232788,  8.54714966], dtype=float32))
('Action ', array([ 7.5571146 ,  8.24182129], dtype=float32))
('Action ', array([ 9.04232788,  8.54714966], dtype=float32))
('Action ', array([ 7.52134228,  8.2066555 ], dtype=float32))
('Action ', array([ 9.02891922,  9.13052845], dtype=float32))
('Action ', array([ 7.94828796,  8.67494011], dtype=float32))
('Action ', array([ 6.74451065,  7.44242954], dtype=float32))
('Action ', array([ 7.46500683,  7.64322948], dtype=float32))
('Action ', array([ 5.66844654,  7.2560854 ], dtype=float32))
('Action ', array([ 7.38575935,  7.00108528], dtype=float32))
('Ac

('Action ', array([ 5.01787424,  2.37358594], dtype=float32))
('Action ', array([ 5.64648962,  3.20802045], dtype=float32))
('Action ', array([ 7.90746737,  7.58368397], dtype=float32))
('Action ', array([ 4.94330931,  3.04175305], dtype=float32))
('Action ', array([ 8.1200037 ,  7.60190964], dtype=float32))
('Action ', array([ 5.91368818,  3.74719739], dtype=float32))
('Action ', array([ 8.31026173,  7.36215115], dtype=float32))
('Action ', array([ 4.7436986,  3.2756474], dtype=float32))
('Action ', array([ 7.78462172,  7.36564445], dtype=float32))
('Action ', array([ 4.73494768,  3.30932355], dtype=float32))
('Action ', array([ 7.29460859,  7.28711033], dtype=float32))
('Action ', array([ 5.17211866,  6.57563496], dtype=float32))
('Action ', array([ 7.42025423,  6.94831848], dtype=float32))
('Action ', array([ 5.17211866,  6.57563496], dtype=float32))
('Action ', array([ 8.11098003,  7.13958645], dtype=float32))
('Action ', array([ 8.55085373,  8.70885563], dtype=float32))
('Action '

('Action ', array([ 8.5460453 ,  8.57287979], dtype=float32))
('Action ', array([ 7.75760555,  8.78522301], dtype=float32))
('Action ', array([ 7.26749706,  5.09156513], dtype=float32))
('Action ', array([ 7.49616623,  7.94818211], dtype=float32))
('Action ', array([ 7.12562752,  5.02284336], dtype=float32))
('Action ', array([ 7.51054668,  7.93511868], dtype=float32))
('Action ', array([ 6.96002388,  4.97803211], dtype=float32))
('Action ', array([ 7.49082279,  7.89898682], dtype=float32))
('Action ', array([ 6.96002388,  4.97803211], dtype=float32))
('Action ', array([ 7.49938297,  7.91952419], dtype=float32))
('Action ', array([ 6.60994911,  5.11577511], dtype=float32))
('Action ', array([ 7.31276989,  7.16906071], dtype=float32))
('Action ', array([ 5.15672684,  4.9956255 ], dtype=float32))
('Action ', array([ 7.27292442,  7.08599758], dtype=float32))
('Action ', array([ 6.49506378,  6.32697773], dtype=float32))
('Action ', array([ 7.28306007,  7.20456219], dtype=float32))
('Action

('Action ', array([ 6.18508053,  6.91346455], dtype=float32))
('Action ', array([ 10.02253246,   6.77530861], dtype=float32))
('Action ', array([ 6.44191647,  7.15624619], dtype=float32))
('Action ', array([ 12.34918308,   8.42465401], dtype=float32))
('Action ', array([ 7.18156052,  7.6478548 ], dtype=float32))
('Action ', array([ 13.79038334,   0.51764858], dtype=float32))
Episode: 1191/5000, score: 30
('Action ', array([ 8.64971066,  8.59575939], dtype=float32))
('Action ', array([ 7.37971592,  8.60488605], dtype=float32))
('Action ', array([ 10.01321793,   7.47851658], dtype=float32))
('Action ', array([ 7.3730135 ,  8.65534019], dtype=float32))
('Action ', array([ 9.70440292,  6.83374119], dtype=float32))
('Action ', array([ 7.38425255,  8.65182018], dtype=float32))
('Action ', array([ 7.36125183,  8.64169407], dtype=float32))
('Action ', array([ 7.33073902,  8.6148634 ], dtype=float32))
('Action ', array([ 8.69980431,  5.27138805], dtype=float32))
('Action ', array([ 7.17594242, 

('Action ', array([ 6.48740959,  7.16706419], dtype=float32))
('Action ', array([ 7.13279438,  4.24276781], dtype=float32))
('Action ', array([ 6.59711075,  7.06090498], dtype=float32))
('Action ', array([ 5.67579937,  4.22912264], dtype=float32))
('Action ', array([ 7.33021259,  7.29598188], dtype=float32))
('Action ', array([ 3.64478588,  3.80438662], dtype=float32))
('Action ', array([ 7.25556469,  7.23388529], dtype=float32))
('Action ', array([ 4.06384945,  2.40263414], dtype=float32))
('Action ', array([ 7.47473621,  7.46526289], dtype=float32))
('Action ', array([ 4.02199268,  2.34400988], dtype=float32))
('Action ', array([ 7.6300869 ,  7.54904318], dtype=float32))
('Action ', array([ 3.73499203,  3.2205472 ], dtype=float32))
('Action ', array([ 8.37022305,  7.49402094], dtype=float32))
Episode: 1197/5000, score: 39
('Action ', array([ 8.63962936,  8.70890331], dtype=float32))
('Action ', array([ 7.40355253,  8.65163994], dtype=float32))
('Action ', array([ 9.94064999,  8.98193

('Action ', array([ 7.51400757,  8.83032894], dtype=float32))
('Action ', array([ 7.1272254 ,  7.27686596], dtype=float32))
('Action ', array([ 7.46428585,  8.8686161 ], dtype=float32))
('Action ', array([ 6.79041433,  3.96890235], dtype=float32))
('Action ', array([ 7.85528755,  9.31946087], dtype=float32))
('Action ', array([ 6.60441208,  5.17001629], dtype=float32))
('Action ', array([ 7.34346104,  8.15237999], dtype=float32))
('Action ', array([ 5.14377117,  1.66291511], dtype=float32))
('Action ', array([ 7.28689575,  8.11987591], dtype=float32))
('Action ', array([-1.9706403 , -8.18592739], dtype=float32))
Episode: 1204/5000, score: 10
('Action ', array([ 8.60552597,  8.73441505], dtype=float32))
('Action ', array([ 7.50456762,  8.25455379], dtype=float32))
('Action ', array([ 8.36714935,  8.45023155], dtype=float32))
('Action ', array([ 7.54657793,  8.24493885], dtype=float32))
('Action ', array([ 7.1112628 ,  6.78825808], dtype=float32))
('Action ', array([ 5.64563799,  6.70921

('Action ', array([ 8.75011826,  8.81297016], dtype=float32))
('Action ', array([ 7.62214231,  8.83558559], dtype=float32))
('Action ', array([ 7.60990667,  8.82989311], dtype=float32))
('Action ', array([ 10.15351772,  10.21121407], dtype=float32))
('Action ', array([ 7.91965723,  9.145154  ], dtype=float32))
('Action ', array([ 8.41109467,  7.93491602], dtype=float32))
('Action ', array([ 9.28153801,  9.26595116], dtype=float32))
('Action ', array([ 7.20154142,  7.90661669], dtype=float32))
('Action ', array([  9.25848579,  10.55723381], dtype=float32))
('Action ', array([ 7.18802786,  7.92204237], dtype=float32))
('Action ', array([ 7.98334932,  8.62368584], dtype=float32))
('Action ', array([ 6.62969923,  7.17412901], dtype=float32))
('Action ', array([ 3.98525286, -0.36372146], dtype=float32))
('Action ', array([ 6.6645112 ,  7.08088636], dtype=float32))
Episode: 1213/5000, score: 15
('Action ', array([ 8.73626995,  8.79606724], dtype=float32))
('Action ', array([ 7.99715662,  9.1

('Action ', array([ 8.64388275,  8.8353548 ], dtype=float32))
('Action ', array([ 7.50096416,  8.57793903], dtype=float32))
('Action ', array([ 9.38807583,  9.25334263], dtype=float32))
('Action ', array([ 7.49447346,  8.62788868], dtype=float32))
('Action ', array([ 9.32480907,  9.07822895], dtype=float32))
('Action ', array([ 9.38799191,  9.0584383 ], dtype=float32))
('Action ', array([ 7.44878292,  8.59449959], dtype=float32))
('Action ', array([ 9.38799191,  9.0584383 ], dtype=float32))
('Action ', array([ 7.44878292,  8.59449959], dtype=float32))
('Action ', array([ 9.44419956,  9.15498734], dtype=float32))
('Action ', array([ 7.41709614,  8.57134247], dtype=float32))
('Action ', array([ 9.34241772,  8.99727917], dtype=float32))
('Action ', array([ 7.4247694 ,  8.54708481], dtype=float32))
('Action ', array([ 7.37477303,  5.50133467], dtype=float32))
('Action ', array([ 7.36232853,  5.49726343], dtype=float32))
('Action ', array([ 7.39096355,  8.57966137], dtype=float32))
('Action

('Action ', array([ 8.66060925,  8.86927795], dtype=float32))
('Action ', array([ 7.50954723,  8.66187   ], dtype=float32))
('Action ', array([ 8.52025414,  6.87532568], dtype=float32))
('Action ', array([ 7.46579933,  8.59931946], dtype=float32))
('Action ', array([ 7.85328817,  6.65995073], dtype=float32))
('Action ', array([ 7.91825676,  9.195755  ], dtype=float32))
('Action ', array([ 8.04321098,  7.45063829], dtype=float32))
('Action ', array([ 7.88222408,  8.98053455], dtype=float32))
('Action ', array([ 7.85548353,  7.37092257], dtype=float32))
('Action ', array([ 7.24278164,  7.90315771], dtype=float32))
('Action ', array([ 7.1095314 ,  5.38254595], dtype=float32))
('Action ', array([ 7.29284191,  7.86441851], dtype=float32))
('Action ', array([ 5.60592461,  6.56641054], dtype=float32))
('Action ', array([ 7.29144955,  7.83850336], dtype=float32))
('Action ', array([ 6.04995346,  6.04267168], dtype=float32))
('Action ', array([ 7.28883743,  7.8139596 ], dtype=float32))
('Action

('Action ', array([ 5.55658579,  1.76228619], dtype=float32))
('Action ', array([ 9.24885464,  8.74849415], dtype=float32))
('Action ', array([ 2.85649371, -1.74079227], dtype=float32))
Episode: 1239/5000, score: 28
('Action ', array([ 8.68700981,  8.82555389], dtype=float32))
('Action ', array([ 7.23072052,  7.59007215], dtype=float32))
('Action ', array([ 8.68700981,  8.82555389], dtype=float32))
('Action ', array([ 7.25141144,  7.60455847], dtype=float32))
('Action ', array([ 8.68700981,  8.82555389], dtype=float32))
('Action ', array([ 7.29551125,  6.78704596], dtype=float32))
('Action ', array([ 9.21207237,  4.82035971], dtype=float32))
('Action ', array([ 5.95736408,  5.72668409], dtype=float32))
('Action ', array([ 5.88949013,  2.03105307], dtype=float32))
('Action ', array([ 5.91712189,  5.78821135], dtype=float32))
('Action ', array([ 6.1344986,  1.8592391], dtype=float32))
('Action ', array([ 5.94211674,  5.85010767], dtype=float32))
('Action ', array([ 7.23740482,  2.6456847

('Action ', array([ 8.52904797,  8.86892414], dtype=float32))
('Action ', array([ 7.71427584,  8.42510605], dtype=float32))
('Action ', array([ 8.25215149,  8.20236874], dtype=float32))
('Action ', array([ 7.72691965,  8.40883541], dtype=float32))
('Action ', array([  7.60143661,  10.79858971], dtype=float32))
('Action ', array([ 8.01587105,  8.72293282], dtype=float32))
('Action ', array([ 6.54927874,  6.86018896], dtype=float32))
('Action ', array([ 6.89317274,  7.23498487], dtype=float32))
('Action ', array([ 3.99615455,  3.64010787], dtype=float32))
Episode: 1249/5000, score: 10
('Action ', array([ 8.56488419,  8.85028362], dtype=float32))
('Action ', array([ 7.72374153,  8.42916203], dtype=float32))
('Action ', array([ 9.24297523,  9.79049015], dtype=float32))
('Action ', array([ 7.72030258,  8.44658184], dtype=float32))
('Action ', array([ 9.27595425,  9.88487339], dtype=float32))
('Action ', array([ 8.00219917,  8.71451187], dtype=float32))
('Action ', array([ 8.2237711 ,  7.693

('Action ', array([ 1.72324145,  0.86752307], dtype=float32))
('Action ', array([ 7.97770262,  7.83140659], dtype=float32))
('Action ', array([ 2.39080977,  1.8890456 ], dtype=float32))
('Action ', array([ 9.2170105 ,  7.38622856], dtype=float32))
('Action ', array([ 0.59611475, -4.45187759], dtype=float32))
('Action ', array([ 10.09861755,   8.25967216], dtype=float32))
('Action ', array([-0.50200307, -6.82271194], dtype=float32))
('Action ', array([ 10.16304398,   8.35955143], dtype=float32))
Episode: 1255/5000, score: 31
('Action ', array([ 8.52019978,  8.70857716], dtype=float32))
('Action ', array([ 7.45562935,  7.71630907], dtype=float32))
('Action ', array([ 8.52019978,  8.70857716], dtype=float32))
('Action ', array([ 7.50614834,  7.73594809], dtype=float32))
('Action ', array([ 8.780756  ,  8.68965149], dtype=float32))
('Action ', array([ 7.78089333,  7.07549429], dtype=float32))
('Action ', array([ 8.15866375,  7.04226351], dtype=float32))
('Action ', array([ 6.266119  ,  5.8

('Action ', array([ 8.59236813,  8.88418865], dtype=float32))
('Action ', array([ 7.60533905,  8.53428841], dtype=float32))
('Action ', array([ 9.24159527,  8.73902798], dtype=float32))
('Action ', array([ 7.59410191,  8.54658794], dtype=float32))
('Action ', array([ 9.00156784,  8.99672318], dtype=float32))
('Action ', array([ 7.59221649,  8.55007935], dtype=float32))
('Action ', array([ 10.64573288,  10.36666965], dtype=float32))
('Action ', array([ 7.55594921,  8.51443386], dtype=float32))
('Action ', array([ 10.42172432,  10.31446266], dtype=float32))
('Action ', array([ 7.83137608,  8.84641743], dtype=float32))
('Action ', array([ 12.04581451,  14.23517227], dtype=float32))
('Action ', array([ 8.0210886 ,  8.97966003], dtype=float32))
('Action ', array([  5.74923897,  10.21735191], dtype=float32))
Episode: 1265/5000, score: 12
('Action ', array([ 8.63269234,  8.86871815], dtype=float32))
('Action ', array([ 7.64127445,  8.00948143], dtype=float32))
('Action ', array([ 8.32598209, 

('Action ', array([ 8.60741234,  8.7337141 ], dtype=float32))
('Action ', array([ 7.53670359,  7.99479866], dtype=float32))
('Action ', array([ 8.60741234,  8.7337141 ], dtype=float32))
('Action ', array([ 7.48054171,  7.94994926], dtype=float32))
('Action ', array([ 8.71936512,  8.53056717], dtype=float32))
('Action ', array([ 7.24126482,  7.14308262], dtype=float32))
('Action ', array([ 8.07091045,  6.0833931 ], dtype=float32))
('Action ', array([ 7.10324526,  7.10942268], dtype=float32))
('Action ', array([ 7.02646637,  4.36986351], dtype=float32))
('Action ', array([ 6.06091928,  6.35621834], dtype=float32))
('Action ', array([ 6.10613394,  6.31157017], dtype=float32))
('Action ', array([ 6.82450247,  5.43330574], dtype=float32))
('Action ', array([ 6.09016085,  6.28557301], dtype=float32))
('Action ', array([ 5.34849691,  4.15136147], dtype=float32))
('Action ', array([ 6.12445211,  6.24090481], dtype=float32))
('Action ', array([ 5.09495592,  3.85396385], dtype=float32))
('Action

('Action ', array([ 8.74389458,  8.9584713 ], dtype=float32))
('Action ', array([ 7.58460808,  8.02443695], dtype=float32))
('Action ', array([ 9.5212822 ,  9.81306171], dtype=float32))
('Action ', array([ 7.56033897,  8.0303278 ], dtype=float32))
('Action ', array([  9.15707302,  10.35464287], dtype=float32))
('Action ', array([ 6.84129143,  7.16072893], dtype=float32))
('Action ', array([ 4.99337006,  3.18810868], dtype=float32))
('Action ', array([ 6.83879948,  7.03474665], dtype=float32))
('Action ', array([ 3.41491032,  2.03354478], dtype=float32))
Episode: 1284/5000, score: 8
('Action ', array([ 8.721035  ,  8.94586563], dtype=float32))
('Action ', array([ 7.52987957,  8.05333805], dtype=float32))
('Action ', array([ 8.721035  ,  8.94586563], dtype=float32))
('Action ', array([ 7.53787327,  8.07213593], dtype=float32))
('Action ', array([ 9.45809269,  9.40204811], dtype=float32))
('Action ', array([ 7.39059448,  7.30335665], dtype=float32))
('Action ', array([ 7.11847019,  6.7077

('Action ', array([ 8.77755833,  8.8651104 ], dtype=float32))
('Action ', array([ 7.69795465,  8.14834118], dtype=float32))
('Action ', array([ 9.12650108,  8.70747185], dtype=float32))
('Action ', array([ 7.69447279,  8.15245914], dtype=float32))
('Action ', array([ 9.12650108,  8.70747185], dtype=float32))
('Action ', array([ 7.69447279,  8.15245914], dtype=float32))
('Action ', array([ 8.72394085,  8.19880199], dtype=float32))
('Action ', array([ 7.18859625,  7.40770006], dtype=float32))
('Action ', array([ 9.05854416,  6.39257765], dtype=float32))
('Action ', array([ 7.58526754,  7.57757139], dtype=float32))
('Action ', array([ 10.0199461 ,   7.02205992], dtype=float32))
('Action ', array([ 7.59667158,  7.57664633], dtype=float32))
('Action ', array([ 7.38078547,  5.7513938 ], dtype=float32))
('Action ', array([ 7.25255537,  7.47194338], dtype=float32))
('Action ', array([ 9.26202488,  4.87389517], dtype=float32))
('Action ', array([ 9.11981297,  5.05425406], dtype=float32))
('Acti

('Action ', array([ 8.84355068,  8.92989922], dtype=float32))
('Action ', array([ 9.57097054,  9.24809361], dtype=float32))
('Action ', array([ 7.8299365 ,  8.87617016], dtype=float32))
('Action ', array([ 9.57097054,  9.24809361], dtype=float32))
('Action ', array([ 7.8299365 ,  8.87617016], dtype=float32))
('Action ', array([ 8.84355068,  8.92989922], dtype=float32))
('Action ', array([ 7.8299365 ,  8.87617016], dtype=float32))
('Action ', array([ 9.57097054,  9.24809361], dtype=float32))
('Action ', array([ 7.8299365 ,  8.87617016], dtype=float32))
('Action ', array([ 9.36007214,  8.57399559], dtype=float32))
('Action ', array([ 8.14718914,  9.20239544], dtype=float32))
('Action ', array([ 10.0935154,   8.0981884], dtype=float32))
('Action ', array([ 7.94100332,  8.91681004], dtype=float32))
('Action ', array([ 9.39121437,  7.39975595], dtype=float32))
('Action ', array([ 7.55161905,  6.12601328], dtype=float32))
('Action ', array([ 7.62116671,  7.98305368], dtype=float32))
('Action

('Action ', array([ 8.79663086,  9.03559875], dtype=float32))
('Action ', array([ 8.03392887,  8.29699802], dtype=float32))
('Action ', array([ 8.79663086,  9.03559875], dtype=float32))
('Action ', array([ 8.00920868,  8.29172134], dtype=float32))
('Action ', array([ 9.23904324,  9.50048828], dtype=float32))
('Action ', array([ 8.01411438,  7.62195253], dtype=float32))
('Action ', array([ 7.08058357,  6.11013842], dtype=float32))
('Action ', array([ 6.36985302,  6.23793173], dtype=float32))
('Action ', array([ 5.95183754,  7.12819338], dtype=float32))
('Action ', array([ 6.38642979,  6.20883322], dtype=float32))
('Action ', array([ 3.21911144,  5.26673174], dtype=float32))
('Action ', array([ 6.31674099,  6.10664511], dtype=float32))
('Action ', array([ 0.53490454,  4.58393908], dtype=float32))
('Action ', array([ 5.4261322 ,  5.35757303], dtype=float32))
Episode: 1304/5000, score: 13
('Action ', array([ 8.79001808,  9.01948929], dtype=float32))
('Action ', array([ 8.05648327,  8.91709

('Action ', array([ 7.13533926,  7.12108755], dtype=float32))
('Action ', array([  9.4802599 ,  10.74674225], dtype=float32))
('Action ', array([ 7.12076998,  7.12698889], dtype=float32))
('Action ', array([  9.55889988,  10.69670868], dtype=float32))
('Action ', array([ 7.12076998,  7.12698889], dtype=float32))
('Action ', array([ 10.43557549,   9.71324158], dtype=float32))
('Action ', array([ 7.03654909,  7.16418409], dtype=float32))
('Action ', array([  9.89435863,  13.44695663], dtype=float32))
('Action ', array([ 7.27053118,  7.56624842], dtype=float32))
('Action ', array([ 9.04886913,  9.61598206], dtype=float32))
('Action ', array([ 7.3643384 ,  7.97312593], dtype=float32))
Episode: 1312/5000, score: 35
('Action ', array([ 8.84798813,  9.00274086], dtype=float32))
('Action ', array([ 8.296422  ,  8.25602436], dtype=float32))
('Action ', array([ 7.76152611,  8.18057346], dtype=float32))
('Action ', array([ 8.29245567,  8.2597332 ], dtype=float32))
('Action ', array([ 8.04756355, 

('Action ', array([ 9.32398987,  7.85479355], dtype=float32))
('Action ', array([ 8.23496246,  8.78330803], dtype=float32))
('Action ', array([ 9.26060486,  7.73441315], dtype=float32))
('Action ', array([ 8.23496246,  8.78330803], dtype=float32))
('Action ', array([ 9.23287392,  7.74412918], dtype=float32))
('Action ', array([ 7.76894474,  8.24847698], dtype=float32))
('Action ', array([ 9.5445118 ,  8.02960587], dtype=float32))
('Action ', array([ 7.76894474,  8.24847698], dtype=float32))
('Action ', array([ 7.76894474,  8.24847698], dtype=float32))
('Action ', array([ 9.5445118 ,  8.02960587], dtype=float32))
('Action ', array([ 7.76894474,  8.24847698], dtype=float32))
('Action ', array([ 9.5445118 ,  8.02960587], dtype=float32))
('Action ', array([ 7.76894474,  8.24847698], dtype=float32))
('Action ', array([ 9.5445118 ,  8.02960587], dtype=float32))
('Action ', array([ 7.9713335 ,  8.17527103], dtype=float32))
('Action ', array([ 9.80760574,  8.43778229], dtype=float32))
('Action

('Action ', array([  9.43373203,  10.51142597], dtype=float32))
('Action ', array([ 7.56411791,  8.03389072], dtype=float32))
('Action ', array([ 7.968575  ,  5.98361874], dtype=float32))
('Action ', array([ 7.16398001,  7.80198956], dtype=float32))
('Action ', array([ 4.06217527, -1.3088541 ], dtype=float32))
('Action ', array([ 7.49675131,  7.96248055], dtype=float32))
Episode: 1325/5000, score: 17
('Action ', array([ 8.82956028,  8.83315468], dtype=float32))
('Action ', array([ 7.85403967,  7.66416931], dtype=float32))
('Action ', array([ 8.94922352,  7.51704788], dtype=float32))
('Action ', array([ 7.85419893,  7.66318607], dtype=float32))
('Action ', array([ 8.25241661,  8.05220795], dtype=float32))
('Action ', array([ 7.90152311,  7.74003124], dtype=float32))
('Action ', array([  9.79080963,  11.07846642], dtype=float32))
('Action ', array([ 8.1444521 ,  7.55965614], dtype=float32))
('Action ', array([ 10.14174938,  12.72855568], dtype=float32))
('Action ', array([ 8.17201424,  7

('Action ', array([ 5.35400772,  5.310956  ], dtype=float32))
('Action ', array([ 6.77488995,  6.77764225], dtype=float32))
('Action ', array([ 5.12055874,  5.0509119 ], dtype=float32))
('Action ', array([ 7.34032631,  7.13263512], dtype=float32))
('Action ', array([ 4.33760738,  5.98668003], dtype=float32))
('Action ', array([ 7.3744297 ,  7.33405209], dtype=float32))
('Action ', array([ 3.44908786,  3.46356273], dtype=float32))
('Action ', array([ 7.48818588,  7.45386314], dtype=float32))
('Action ', array([ 0.07547078, -2.7493546 ], dtype=float32))
('Action ', array([ 7.48122311,  7.46733284], dtype=float32))
('Action ', array([-0.5161792, -1.2947799], dtype=float32))
('Action ', array([ 6.43465805,  6.41217804], dtype=float32))
('Action ', array([-1.20649064,  0.91522682], dtype=float32))
('Action ', array([ 6.32445812,  6.30067158], dtype=float32))
('Action ', array([-1.4049865 , -3.30456853], dtype=float32))
('Action ', array([ 6.36728573,  6.27192974], dtype=float32))
('Action '

('Action ', array([ 6.89510727,  6.96526766], dtype=float32))
('Action ', array([ 6.81531143,  6.91531515], dtype=float32))
('Action ', array([ 7.67871189,  6.23218012], dtype=float32))
('Action ', array([ 6.75482273,  6.86480856], dtype=float32))
('Action ', array([ 4.55925179,  1.51459742], dtype=float32))
('Action ', array([ 6.71895599,  6.78763151], dtype=float32))
('Action ', array([ 4.82419395,  3.70318079], dtype=float32))
('Action ', array([ 6.63003635,  6.75803804], dtype=float32))
('Action ', array([ 7.27525425,  5.98691034], dtype=float32))
('Action ', array([ 7.02777576,  6.86318636], dtype=float32))
('Action ', array([ 9.18974495, -0.11971813], dtype=float32))
('Action ', array([ 7.213871  ,  6.91839647], dtype=float32))
('Action ', array([ 9.40529823,  4.13797998], dtype=float32))
('Action ', array([ 8.43148518,  7.75358629], dtype=float32))
('Action ', array([ 9.59055614,  4.96806574], dtype=float32))
('Action ', array([ 8.31536007,  8.01553249], dtype=float32))
('Action

('Action ', array([ 6.01748705,  5.50320911], dtype=float32))
('Action ', array([ 5.21807051,  3.46502399], dtype=float32))
('Action ', array([ 7.51354837,  6.07053661], dtype=float32))
('Action ', array([ 7.2575016 ,  6.63287067], dtype=float32))
('Action ', array([ 7.59515047,  6.59222126], dtype=float32))
('Action ', array([ 6.16716623,  7.20971775], dtype=float32))
('Action ', array([ 7.45640516,  7.11846924], dtype=float32))
('Action ', array([ 4.66481638,  5.0083704 ], dtype=float32))
('Action ', array([ 8.02233028,  7.64782333], dtype=float32))
Episode: 1345/5000, score: 22
('Action ', array([ 7.90285397,  8.75617313], dtype=float32))
('Action ', array([ 7.14148378,  7.17290878], dtype=float32))
('Action ', array([ 7.90285397,  8.75617313], dtype=float32))
('Action ', array([ 7.1386714 ,  7.16779327], dtype=float32))
('Action ', array([ 8.82093048,  9.32358456], dtype=float32))
('Action ', array([ 6.86794043,  6.3211813 ], dtype=float32))
('Action ', array([ 8.4882555 ,  5.23303

('Action ', array([ 7.92925644,  8.41074562], dtype=float32))
('Action ', array([ 11.00730419,   5.31605721], dtype=float32))
('Action ', array([ 7.92925644,  8.41074562], dtype=float32))
('Action ', array([ 10.91674232,   5.34184074], dtype=float32))
('Action ', array([ 10.91674232,   5.34184074], dtype=float32))
('Action ', array([ 8.42696857,  8.68283176], dtype=float32))
('Action ', array([ 10.91674232,   5.34184074], dtype=float32))
('Action ', array([ 8.20508957,  8.2167635 ], dtype=float32))
('Action ', array([ 8.60563183,  3.2185266 ], dtype=float32))
('Action ', array([ 7.66323948,  7.30211258], dtype=float32))
('Action ', array([ 5.82434273, -1.05020738], dtype=float32))
('Action ', array([ 7.62623501,  7.23090363], dtype=float32))
('Action ', array([-0.93326354, -2.22279954], dtype=float32))
('Action ', array([ 7.31116676,  6.50755978], dtype=float32))
('Action ', array([-4.13151932, -0.62315583], dtype=float32))
('Action ', array([ 8.24459553,  6.97519779], dtype=float32))


('Action ', array([ 5.19266987,  4.99687719], dtype=float32))
('Action ', array([ 4.35256958,  5.12516356], dtype=float32))
('Action ', array([ 5.09461308,  4.94539404], dtype=float32))
('Action ', array([ 1.84737408,  1.60450721], dtype=float32))
('Action ', array([ 5.04249954,  4.93772364], dtype=float32))
('Action ', array([-1.23049152, -0.57283813], dtype=float32))
('Action ', array([ 5.05155468,  4.9583354 ], dtype=float32))
Episode: 1355/5000, score: 19
('Action ', array([ 7.90823317,  8.45948982], dtype=float32))
('Action ', array([ 7.23514986,  7.17864656], dtype=float32))
('Action ', array([ 7.90823317,  8.45948982], dtype=float32))
('Action ', array([ 7.23514986,  7.17864656], dtype=float32))
('Action ', array([ 7.90823317,  8.45948982], dtype=float32))
('Action ', array([ 7.23514986,  7.17864656], dtype=float32))
('Action ', array([ 8.20892048,  8.78496647], dtype=float32))
('Action ', array([ 7.23514986,  7.17864656], dtype=float32))
('Action ', array([ 8.22507572,  8.66386

('Action ', array([ 8.04798031,  8.3006382 ], dtype=float32))
('Action ', array([ 7.95028925,  8.49920559], dtype=float32))
('Action ', array([ 7.23649359,  8.21856308], dtype=float32))
('Action ', array([ 8.08068657,  8.29120827], dtype=float32))
('Action ', array([ 7.37731409,  7.50237656], dtype=float32))
('Action ', array([ 8.01005077,  8.06499481], dtype=float32))
('Action ', array([ 7.34300756,  6.13630295], dtype=float32))
('Action ', array([ 8.10098362,  7.31053352], dtype=float32))
('Action ', array([ 4.36111403,  5.10301971], dtype=float32))
('Action ', array([ 8.14639091,  6.76883411], dtype=float32))
Episode: 1363/5000, score: 9
('Action ', array([ 7.60743189,  7.9526124 ], dtype=float32))
('Action ', array([ 8.90751648,  8.96280766], dtype=float32))
('Action ', array([ 8.02970982,  8.38691998], dtype=float32))
('Action ', array([ 7.19928026,  8.00319099], dtype=float32))
('Action ', array([ 7.64618731,  7.19725657], dtype=float32))
('Action ', array([ 7.50423384,  8.862691

('Action ', array([ 5.63175726,  6.03377676], dtype=float32))
('Action ', array([ 8.42269516,  7.06672907], dtype=float32))
('Action ', array([ 5.63175726,  6.03377676], dtype=float32))
('Action ', array([ 8.39163876,  7.01341486], dtype=float32))
('Action ', array([ 5.63175726,  6.03377676], dtype=float32))
('Action ', array([ 8.39163876,  7.01341486], dtype=float32))
('Action ', array([ 5.63175726,  6.03377676], dtype=float32))
('Action ', array([ 8.23549271,  7.2034936 ], dtype=float32))
('Action ', array([ 5.63175726,  6.03377676], dtype=float32))
('Action ', array([ 5.63175726,  6.03377676], dtype=float32))
('Action ', array([ 8.23549271,  7.2034936 ], dtype=float32))
('Action ', array([ 5.63175726,  6.03377676], dtype=float32))
('Action ', array([ 8.10483837,  7.3458848 ], dtype=float32))
('Action ', array([ 5.63175726,  6.03377676], dtype=float32))
('Action ', array([ 0.31893036,  5.71474314], dtype=float32))
('Action ', array([ 5.63175726,  6.03377676], dtype=float32))
('Action

('Action ', array([ 8.10518742,  8.27847004], dtype=float32))
('Action ', array([ 7.90421772,  8.31229591], dtype=float32))
('Action ', array([ 6.6017642 ,  8.09946728], dtype=float32))
('Action ', array([ 7.82179928,  8.18433857], dtype=float32))
('Action ', array([ 7.00008678,  7.63953352], dtype=float32))
('Action ', array([ 7.82544994,  8.19622707], dtype=float32))
('Action ', array([ 7.82764912,  7.90652418], dtype=float32))
('Action ', array([ 7.12883759,  7.29219484], dtype=float32))
Episode: 1377/5000, score: 7
('Action ', array([ 8.08175659,  8.30641937], dtype=float32))
('Action ', array([ 7.20094299,  7.32536459], dtype=float32))
('Action ', array([ 7.93367767,  9.59900475], dtype=float32))
('Action ', array([ 7.23195267,  7.3256669 ], dtype=float32))
('Action ', array([ 7.74644375,  9.45905972], dtype=float32))
('Action ', array([ 4.38537312,  7.96836996], dtype=float32))
('Action ', array([ 7.00437927,  6.09444571], dtype=float32))
('Action ', array([ 5.2066555 ,  8.213006

('Action ', array([ 8.07537937,  8.14861679], dtype=float32))
('Action ', array([ 7.01270294,  7.40816069], dtype=float32))
('Action ', array([ 8.54624176,  8.88020992], dtype=float32))
('Action ', array([ 7.01270294,  7.40816069], dtype=float32))
('Action ', array([ 7.82957649,  7.3027606 ], dtype=float32))
('Action ', array([ 7.44503689,  7.54968119], dtype=float32))
('Action ', array([ 7.21504021,  6.34527731], dtype=float32))
('Action ', array([ 6.47334957,  6.43487692], dtype=float32))
('Action ', array([ 8.12497234,  8.00586796], dtype=float32))
('Action ', array([ 6.51126862,  6.48653364], dtype=float32))
('Action ', array([ 8.30855179,  7.61979437], dtype=float32))
('Action ', array([ 6.51126862,  6.48653364], dtype=float32))
('Action ', array([ 6.48486042,  6.43475008], dtype=float32))
('Action ', array([ 7.23278666,  6.30313253], dtype=float32))
('Action ', array([ 7.1871376 ,  7.06024885], dtype=float32))
('Action ', array([ 7.53532267,  6.81209517], dtype=float32))
('Action

('Action ', array([ 5.57933474,  6.4732585 ], dtype=float32))
('Action ', array([ 6.17690659,  5.90415335], dtype=float32))
('Action ', array([ 5.76642084,  6.56058455], dtype=float32))
Episode: 1398/5000, score: 15
('Action ', array([ 8.27461052,  8.13934231], dtype=float32))
('Action ', array([ 6.80160427,  7.59462166], dtype=float32))
('Action ', array([ 8.27461052,  8.13934231], dtype=float32))
('Action ', array([ 6.80160427,  7.59462166], dtype=float32))
('Action ', array([ 8.95965004,  7.79557228], dtype=float32))
('Action ', array([ 6.80160427,  7.59462166], dtype=float32))
('Action ', array([ 8.95965004,  7.79557228], dtype=float32))
('Action ', array([ 6.80160427,  7.59462166], dtype=float32))
('Action ', array([ 9.19989109,  9.42879105], dtype=float32))
('Action ', array([ 6.80160427,  7.59462166], dtype=float32))
('Action ', array([ 8.95965004,  7.79557228], dtype=float32))
('Action ', array([ 6.77588749,  7.60487938], dtype=float32))
('Action ', array([ 6.77588749,  7.60487

('Action ', array([ 6.80052519,  6.53877974], dtype=float32))
('Action ', array([ 2.71104479,  0.20489839], dtype=float32))
('Action ', array([ 6.01444006,  6.51248598], dtype=float32))
('Action ', array([ 1.07141733, -2.42759752], dtype=float32))
('Action ', array([ 6.25404215,  6.5014329 ], dtype=float32))
('Action ', array([ 1.87299585, -1.73912859], dtype=float32))
('Action ', array([ 7.78092718,  8.10448265], dtype=float32))
('Action ', array([ 0.25931215,  0.33395341], dtype=float32))
('Action ', array([ 7.92511702,  7.98638201], dtype=float32))
('Action ', array([-1.7610774 ,  0.47315934], dtype=float32))
('Action ', array([ 7.81026697,  8.00388813], dtype=float32))
('Action ', array([-5.2794795 ,  1.68702269], dtype=float32))
('Action ', array([ 7.88913679,  8.36446571], dtype=float32))
Episode: 1403/5000, score: 39
('Action ', array([ 8.25992393,  8.07196903], dtype=float32))
('Action ', array([ 6.94774151,  8.34488869], dtype=float32))
('Action ', array([ 8.7827301 ,  6.40775

('Action ', array([ 8.44760227,  8.15311241], dtype=float32))
('Action ', array([ 6.67253733,  7.55571699], dtype=float32))
('Action ', array([ 8.44760227,  8.15311241], dtype=float32))
('Action ', array([ 6.67253733,  7.55571699], dtype=float32))
('Action ', array([ 8.44760227,  8.15311241], dtype=float32))
('Action ', array([ 6.63210821,  7.55935907], dtype=float32))
('Action ', array([ 8.44760227,  8.15311241], dtype=float32))
('Action ', array([ 6.63210821,  7.55935907], dtype=float32))
('Action ', array([ 8.96516323,  8.22643852], dtype=float32))
('Action ', array([ 6.63210821,  7.55935907], dtype=float32))
('Action ', array([ 8.93018627,  9.53223228], dtype=float32))
('Action ', array([ 6.32818842,  7.34398031], dtype=float32))
('Action ', array([ 8.70367336,  8.48833084], dtype=float32))
('Action ', array([ 6.47570086,  7.27591944], dtype=float32))
('Action ', array([ 8.75335312,  8.44702148], dtype=float32))
('Action ', array([ 6.4647727,  7.2351594], dtype=float32))
('Action '

('Action ', array([ 8.51345539,  8.11855984], dtype=float32))
('Action ', array([ 7.10707664,  8.31954861], dtype=float32))
('Action ', array([ 8.51345539,  8.11855984], dtype=float32))
('Action ', array([ 7.10707664,  8.31954861], dtype=float32))
('Action ', array([ 8.95999527,  8.6986351 ], dtype=float32))
('Action ', array([ 7.10707664,  8.31954861], dtype=float32))
('Action ', array([ 8.95999527,  8.6986351 ], dtype=float32))
('Action ', array([ 7.10707664,  8.31954861], dtype=float32))
('Action ', array([ 8.9910059 ,  8.64182758], dtype=float32))
('Action ', array([ 7.10707664,  8.31954861], dtype=float32))
('Action ', array([ 8.9910059 ,  8.64182758], dtype=float32))
('Action ', array([ 7.10707664,  8.31954861], dtype=float32))
('Action ', array([ 9.03861046,  8.55185986], dtype=float32))
('Action ', array([ 7.10459328,  8.32632256], dtype=float32))
('Action ', array([ 9.23658371,  8.7221384 ], dtype=float32))
('Action ', array([ 7.10070801,  8.36394405], dtype=float32))
('Action

('Action ', array([ 5.91036415,  3.7252419 ], dtype=float32))
('Action ', array([ 7.77141666,  7.90910482], dtype=float32))
('Action ', array([ 4.76768303,  2.70082784], dtype=float32))
('Action ', array([ 7.4940443 ,  7.44664526], dtype=float32))
('Action ', array([ 4.7281971 ,  3.39327168], dtype=float32))
('Action ', array([ 7.77636337,  7.73214674], dtype=float32))
('Action ', array([ 0.63167763,  3.02599263], dtype=float32))
('Action ', array([ 7.2770834 ,  7.39049673], dtype=float32))
Episode: 1418/5000, score: 31
('Action ', array([ 8.42781162,  8.12814045], dtype=float32))
('Action ', array([ 6.83026361,  7.72299623], dtype=float32))
('Action ', array([ 8.21364975,  7.7378583 ], dtype=float32))
('Action ', array([ 6.83026361,  7.72299623], dtype=float32))
('Action ', array([ 8.21364975,  7.7378583 ], dtype=float32))
('Action ', array([ 6.83026361,  7.72299623], dtype=float32))
('Action ', array([ 8.21364975,  7.7378583 ], dtype=float32))
('Action ', array([ 6.83026361,  7.72299

('Action ', array([ 8.51624489,  8.36029053], dtype=float32))
('Action ', array([ 6.96190691,  7.94609547], dtype=float32))
('Action ', array([ 7.66203451,  8.02013493], dtype=float32))
('Action ', array([ 6.94967222,  7.99593735], dtype=float32))
('Action ', array([ 7.97009087,  9.14770412], dtype=float32))
('Action ', array([ 7.09993696,  8.04828167], dtype=float32))
('Action ', array([ 7.15606928,  8.07136536], dtype=float32))
('Action ', array([  8.2316227 ,  10.60417843], dtype=float32))
('Action ', array([ 5.58913851,  6.66266346], dtype=float32))
Episode: 1426/5000, score: 9
('Action ', array([ 8.53712559,  8.37308121], dtype=float32))
('Action ', array([ 6.95271492,  8.59351349], dtype=float32))
('Action ', array([ 8.36405659,  7.3344121 ], dtype=float32))
('Action ', array([ 6.95422745,  8.63479137], dtype=float32))
('Action ', array([ 8.36405659,  7.3344121 ], dtype=float32))
('Action ', array([ 6.95422745,  8.63479137], dtype=float32))
('Action ', array([ 7.23814726,  8.5527

('Action ', array([ 8.61194992,  8.28927708], dtype=float32))
('Action ', array([ 6.93085527,  7.91078186], dtype=float32))
('Action ', array([ 7.22152948,  8.03984261], dtype=float32))
('Action ', array([ 6.92715788,  7.90365219], dtype=float32))
('Action ', array([ 8.45802402,  6.24600124], dtype=float32))
('Action ', array([ 7.01871729,  8.00669098], dtype=float32))
('Action ', array([ 8.52631283,  6.09020996], dtype=float32))
('Action ', array([ 7.02681494,  8.02346802], dtype=float32))
('Action ', array([ 8.52631283,  6.09020996], dtype=float32))
('Action ', array([ 7.0275569 ,  8.01787663], dtype=float32))
('Action ', array([ 8.27239704,  8.04058838], dtype=float32))
('Action ', array([ 7.02863169,  8.02609158], dtype=float32))
('Action ', array([ 8.34315491,  6.31994247], dtype=float32))
('Action ', array([ 6.49655294,  7.22555542], dtype=float32))
('Action ', array([ 8.81481838,  7.03305054], dtype=float32))
('Action ', array([ 8.0525465 ,  2.78478622], dtype=float32))
('Action

('Action ', array([ 6.55596113,  6.12690401], dtype=float32))
Episode: 1436/5000, score: 29
('Action ', array([ 8.52069378,  8.27216339], dtype=float32))
('Action ', array([ 7.2744565 ,  8.89812469], dtype=float32))
('Action ', array([ 7.4728775 ,  6.53695059], dtype=float32))
('Action ', array([ 7.28101778,  8.85653877], dtype=float32))
('Action ', array([ 6.75338268,  6.62204885], dtype=float32))
('Action ', array([ 7.28101778,  8.85653877], dtype=float32))
('Action ', array([ 6.27991009,  5.87020254], dtype=float32))
('Action ', array([ 7.28101778,  8.85653877], dtype=float32))
('Action ', array([ 6.33714628,  5.80641699], dtype=float32))
('Action ', array([ 7.28101778,  8.85653877], dtype=float32))
('Action ', array([ 6.46262312,  6.23508215], dtype=float32))
('Action ', array([ 7.28101778,  8.85653877], dtype=float32))
('Action ', array([ 6.46262312,  6.23508215], dtype=float32))
('Action ', array([ 7.28894091,  8.87550163], dtype=float32))
('Action ', array([ 6.30345869,  5.96484

('Action ', array([ 8.49359131,  8.52245331], dtype=float32))
('Action ', array([ 6.96214056,  8.50195885], dtype=float32))
('Action ', array([ 8.77813911,  9.53751278], dtype=float32))
('Action ', array([ 7.26165533,  8.83422661], dtype=float32))
('Action ', array([ 9.00532532,  9.31149197], dtype=float32))
('Action ', array([ 6.67457914,  7.54534912], dtype=float32))
('Action ', array([ 6.84376526,  7.69740009], dtype=float32))
('Action ', array([ 6.3100667 ,  6.65832329], dtype=float32))
('Action ', array([ 2.33433008,  1.01318467], dtype=float32))
Episode: 1443/5000, score: 8
('Action ', array([ 8.49330235,  8.55707932], dtype=float32))
('Action ', array([ 6.92229605,  7.89470577], dtype=float32))
('Action ', array([ 9.57097054,  9.27185917], dtype=float32))
('Action ', array([ 6.9496932 ,  7.92273903], dtype=float32))
('Action ', array([ 9.35462189,  9.264781  ], dtype=float32))
('Action ', array([ 6.92952013,  7.91627789], dtype=float32))
('Action ', array([ 9.35462189,  9.264781

('Action ', array([ 8.38925076,  8.48259163], dtype=float32))
('Action ', array([ 6.99248838,  8.11062527], dtype=float32))
('Action ', array([ 8.0464468 ,  3.67872739], dtype=float32))
('Action ', array([ 6.95997286,  8.17685699], dtype=float32))
('Action ', array([ 7.15459204,  4.09046555], dtype=float32))
('Action ', array([ 6.92211199,  8.15836334], dtype=float32))
('Action ', array([ 7.09975004,  4.56261349], dtype=float32))
('Action ', array([ 6.87955046,  8.116786  ], dtype=float32))
('Action ', array([ 7.30071688,  4.46809101], dtype=float32))
('Action ', array([ 6.78359556,  7.96315002], dtype=float32))
('Action ', array([ 6.68681431,  4.61467457], dtype=float32))
('Action ', array([ 6.38795424,  7.55788708], dtype=float32))
('Action ', array([ 7.10090542,  6.01319218], dtype=float32))
('Action ', array([ 5.37465143,  6.38673687], dtype=float32))
('Action ', array([ 2.56751966,  1.7911694 ], dtype=float32))
('Action ', array([ 5.66515493,  6.26238346], dtype=float32))
Episode:

('Action ', array([ 4.78728533,  3.62361741], dtype=float32))
('Action ', array([ 3.0191071 ,  2.68521714], dtype=float32))
Episode: 1461/5000, score: 14
('Action ', array([ 8.44404316,  8.60265064], dtype=float32))
('Action ', array([ 6.98834705,  7.94837379], dtype=float32))
('Action ', array([ 6.95309448,  7.91319466], dtype=float32))
('Action ', array([ 10.19659805,   9.89129543], dtype=float32))
('Action ', array([ 7.04030609,  8.1583519 ], dtype=float32))
('Action ', array([ 8.10489368,  7.36473179], dtype=float32))
('Action ', array([ 7.03051281,  8.1603632 ], dtype=float32))
('Action ', array([ 8.1322937 ,  7.32677555], dtype=float32))
('Action ', array([ 7.09122849,  8.17055798], dtype=float32))
('Action ', array([ 8.21236801,  4.90804386], dtype=float32))
('Action ', array([ 6.85052013,  7.37668896], dtype=float32))
('Action ', array([ 4.2020874 ,  2.41867948], dtype=float32))
Episode: 1462/5000, score: 12
('Action ', array([ 8.455019 ,  8.6036377], dtype=float32))
('Action '

('Action ', array([ 5.91759586,  3.12092185], dtype=float32))
('Action ', array([ 5.37947941,  5.51240444], dtype=float32))
Episode: 1468/5000, score: 13
('Action ', array([ 8.3872776 ,  8.61586857], dtype=float32))
('Action ', array([ 6.92610359,  8.00500393], dtype=float32))
('Action ', array([ 8.96642876,  9.15754414], dtype=float32))
('Action ', array([ 6.92610359,  8.00500393], dtype=float32))
('Action ', array([ 8.71499825,  9.97145367], dtype=float32))
('Action ', array([ 7.21558475,  8.21830177], dtype=float32))
('Action ', array([ 8.29817104,  8.61777592], dtype=float32))
('Action ', array([ 7.22302914,  8.11538792], dtype=float32))
('Action ', array([ 5.75274467,  4.53648472], dtype=float32))
Episode: 1469/5000, score: 8
('Action ', array([ 8.34683609,  8.62543583], dtype=float32))
('Action ', array([ 7.88717747,  7.96904612], dtype=float32))
('Action ', array([ 6.85688448,  7.47919512], dtype=float32))
('Action ', array([ 5.62399244,  6.71094656], dtype=float32))
('Action ',

Episode: 1477/5000, score: 12
('Action ', array([ 8.35462475,  8.51226997], dtype=float32))
('Action ', array([ 6.75723076,  7.95481873], dtype=float32))
('Action ', array([ 8.68315697,  8.58764553], dtype=float32))
('Action ', array([ 7.05213451,  8.27344704], dtype=float32))
('Action ', array([ 8.78720474,  8.58652592], dtype=float32))
('Action ', array([ 7.04463959,  8.26267815], dtype=float32))
('Action ', array([ 6.77959538,  7.44996929], dtype=float32))
('Action ', array([ 9.54801083,  7.17796612], dtype=float32))
('Action ', array([ 6.79459476,  7.4012785 ], dtype=float32))
('Action ', array([ 7.42587185,  5.73876858], dtype=float32))
('Action ', array([ 6.79934406,  7.4144783 ], dtype=float32))
('Action ', array([ 7.42587185,  5.73876858], dtype=float32))
('Action ', array([ 6.82181454,  7.40413094], dtype=float32))
('Action ', array([ 7.42587185,  5.73876858], dtype=float32))
('Action ', array([ 6.44904327,  6.52636528], dtype=float32))
('Action ', array([ 4.68276405, -2.34832

('Action ', array([ 8.24916553,  8.55068493], dtype=float32))
('Action ', array([ 6.4752183 ,  8.00557995], dtype=float32))
('Action ', array([ 8.90465164,  9.00421524], dtype=float32))
('Action ', array([ 6.44100332,  7.96591568], dtype=float32))
('Action ', array([ 8.11011124,  9.25187206], dtype=float32))
('Action ', array([ 5.97913027,  7.53477287], dtype=float32))
('Action ', array([ 5.34143782,  4.10225964], dtype=float32))
('Action ', array([ 5.91117144,  7.53578568], dtype=float32))
('Action ', array([ 0.0535225 ,  0.14742163], dtype=float32))
Episode: 1486/5000, score: 8
('Action ', array([ 8.26518917,  8.53505135], dtype=float32))
('Action ', array([ 6.16354752,  7.29650545], dtype=float32))
('Action ', array([ 8.48153973,  8.71610069], dtype=float32))
('Action ', array([ 6.16822243,  7.30284262], dtype=float32))
('Action ', array([ 8.00483418,  8.22400951], dtype=float32))
('Action ', array([ 5.89026546,  6.57859659], dtype=float32))
('Action ', array([ 7.40776205,  5.214991

('Action ', array([ 8.33083725,  8.52741814], dtype=float32))
('Action ', array([ 6.54405212,  8.10301018], dtype=float32))
('Action ', array([ 8.33083725,  8.52741814], dtype=float32))
('Action ', array([ 6.55469704,  8.10290909], dtype=float32))
('Action ', array([ 8.89317513,  9.79007626], dtype=float32))
('Action ', array([ 6.25528812,  7.75918818], dtype=float32))
('Action ', array([ 9.47236443,  8.72361183], dtype=float32))
('Action ', array([ 6.31529331,  7.82095003], dtype=float32))
('Action ', array([ 5.0059824 ,  4.36636209], dtype=float32))
('Action ', array([ 5.62295818,  6.98530626], dtype=float32))
Episode: 1497/5000, score: 9
('Action ', array([ 8.32260036,  8.53184223], dtype=float32))
('Action ', array([ 6.43958139,  7.55685997], dtype=float32))
('Action ', array([ 7.78957319,  9.24030113], dtype=float32))
('Action ', array([ 6.2344079 ,  6.61650944], dtype=float32))
('Action ', array([ 7.28412867,  6.30303478], dtype=float32))
('Action ', array([ 4.61565638,  5.502451

('Action ', array([ 6.53604507,  4.13311243], dtype=float32))
('Action ', array([ 6.71862411,  7.48840761], dtype=float32))
('Action ', array([ 5.58860493,  3.43162394], dtype=float32))
('Action ', array([ 5.15716171,  5.75390577], dtype=float32))
('Action ', array([ 4.90930748,  0.5599122 ], dtype=float32))
('Action ', array([ 5.25421047,  5.90941095], dtype=float32))
('Action ', array([ 5.83351707,  1.23658609], dtype=float32))
Episode: 1506/5000, score: 18
('Action ', array([ 8.37115479,  8.39754772], dtype=float32))
('Action ', array([ 9.15925217,  9.44246006], dtype=float32))
('Action ', array([ 6.69361162,  7.97647333], dtype=float32))
('Action ', array([ 9.15925217,  9.44246006], dtype=float32))
('Action ', array([ 6.69361162,  7.97647333], dtype=float32))
('Action ', array([ 6.84146643,  8.358078  ], dtype=float32))
('Action ', array([ 8.31333733,  5.32412291], dtype=float32))
('Action ', array([ 6.87677717,  8.32374191], dtype=float32))
('Action ', array([ 8.22886944,  4.66403

('Action ', array([ 5.10150051,  0.03513704], dtype=float32))
('Action ', array([ 6.69506836,  7.31086922], dtype=float32))
('Action ', array([ 4.85201168, -2.86127114], dtype=float32))
('Action ', array([ 6.2277832 ,  6.47745132], dtype=float32))
Episode: 1511/5000, score: 15
('Action ', array([ 8.34000015,  8.36992455], dtype=float32))
('Action ', array([ 6.94783783,  8.17511272], dtype=float32))
('Action ', array([ 8.13472939,  7.51750803], dtype=float32))
('Action ', array([ 6.83770847,  8.04471207], dtype=float32))
('Action ', array([ 8.13472939,  7.51750803], dtype=float32))
('Action ', array([ 6.83812523,  8.04997349], dtype=float32))
('Action ', array([ 8.13472939,  7.51750803], dtype=float32))
('Action ', array([ 6.848423  ,  8.05583572], dtype=float32))
('Action ', array([ 8.13472939,  7.51750803], dtype=float32))
('Action ', array([ 6.87478352,  7.29273081], dtype=float32))
('Action ', array([ 8.48265839,  7.36521959], dtype=float32))
('Action ', array([ 6.87333775,  7.02628

Episode: 1521/5000, score: 11
('Action ', array([ 8.33771133,  8.3027153 ], dtype=float32))
('Action ', array([ 6.56805706,  7.9590497 ], dtype=float32))
('Action ', array([ 8.18852901,  7.60096121], dtype=float32))
('Action ', array([ 8.18852901,  7.60096121], dtype=float32))
('Action ', array([ 6.56805706,  7.9590497 ], dtype=float32))
('Action ', array([ 8.18852901,  7.60096121], dtype=float32))
('Action ', array([ 6.56042194,  7.92037821], dtype=float32))
('Action ', array([ 8.18852901,  7.60096121], dtype=float32))
('Action ', array([ 8.23691463,  8.28294277], dtype=float32))
('Action ', array([ 6.51265144,  7.90586042], dtype=float32))
('Action ', array([ 7.12730932,  4.82588625], dtype=float32))
('Action ', array([ 6.75345993,  7.78766489], dtype=float32))
('Action ', array([ 7.2128706 ,  6.11640596], dtype=float32))
('Action ', array([ 6.75582504,  7.80137491], dtype=float32))
('Action ', array([ 9.15850735,  6.95209932], dtype=float32))
('Action ', array([ 6.7126379 ,  7.75927

('Action ', array([ 4.14359093, -1.13292205], dtype=float32))
('Action ', array([ 5.32527256,  5.81996632], dtype=float32))
Episode: 1527/5000, score: 13
('Action ', array([ 8.35639381,  8.20018578], dtype=float32))
('Action ', array([ 9.43181992,  7.54323339], dtype=float32))
('Action ', array([ 6.72865582,  8.01077747], dtype=float32))
('Action ', array([ 9.06347466,  7.16769171], dtype=float32))
('Action ', array([ 6.26163864,  7.39796209], dtype=float32))
('Action ', array([ 9.80515194,  6.03723669], dtype=float32))
('Action ', array([ 9.78471756,  7.73936987], dtype=float32))
('Action ', array([ 6.03278923,  7.2122941 ], dtype=float32))
('Action ', array([ 7.92396164,  3.42545843], dtype=float32))
('Action ', array([ 4.10112953,  5.15996408], dtype=float32))
('Action ', array([ 4.84250736,  1.63359606], dtype=float32))
('Action ', array([ 4.44568729,  5.30724096], dtype=float32))
Episode: 1528/5000, score: 13
('Action ', array([ 8.35187244,  8.21021652], dtype=float32))
('Action '

('Action ', array([ 5.07662344,  5.7028656 ], dtype=float32))
('Action ', array([ 4.96329641,  5.66692162], dtype=float32))
Episode: 1533/5000, score: 25
('Action ', array([ 8.29507732,  8.18279266], dtype=float32))
('Action ', array([ 5.93341446,  6.94891977], dtype=float32))
('Action ', array([ 8.13780689,  7.90224981], dtype=float32))
('Action ', array([ 5.93341446,  6.94891977], dtype=float32))
('Action ', array([ 8.13780689,  7.90224981], dtype=float32))
('Action ', array([ 5.93341446,  6.94891977], dtype=float32))
('Action ', array([ 7.99404144,  9.14583683], dtype=float32))
('Action ', array([ 5.95649242,  6.96219587], dtype=float32))
('Action ', array([ 8.1535387 ,  7.93801832], dtype=float32))
('Action ', array([ 5.93221664,  6.97121859], dtype=float32))
('Action ', array([ 8.2933569 ,  7.94080496], dtype=float32))
('Action ', array([ 5.93221664,  6.97121859], dtype=float32))
('Action ', array([ 7.63110924,  8.33359051], dtype=float32))
('Action ', array([ 6.38998699,  7.18521

('Action ', array([ 9.06321144,  7.93036747], dtype=float32))
('Action ', array([ 5.84944201,  6.85811424], dtype=float32))
('Action ', array([ 9.05136299,  7.95172787], dtype=float32))
('Action ', array([ 5.84944963,  6.8593092 ], dtype=float32))
('Action ', array([ 8.36686134,  8.3231554 ], dtype=float32))
('Action ', array([ 5.84944963,  6.8593092 ], dtype=float32))
('Action ', array([ 7.6799016 ,  8.37696552], dtype=float32))
('Action ', array([ 5.84944963,  6.8593092 ], dtype=float32))
('Action ', array([ 8.36686134,  8.3231554 ], dtype=float32))
('Action ', array([ 5.85312891,  6.86443996], dtype=float32))
('Action ', array([ 8.51911259,  8.34201908], dtype=float32))
('Action ', array([ 5.85312891,  6.86443996], dtype=float32))
('Action ', array([ 8.32115746,  8.22272205], dtype=float32))
('Action ', array([ 5.84240484,  6.86168575], dtype=float32))
('Action ', array([ 8.32115746,  8.22272205], dtype=float32))
('Action ', array([ 5.83518267,  6.86003208], dtype=float32))
('Action

('Action ', array([ 6.92389917,  7.52517748], dtype=float32))
('Action ', array([ 9.47601795,  8.02316952], dtype=float32))
('Action ', array([ 6.78632307,  7.55756617], dtype=float32))
('Action ', array([ 9.57324314,  7.94704103], dtype=float32))
('Action ', array([ 6.80660963,  7.56718683], dtype=float32))
('Action ', array([ 9.57324314,  7.94704103], dtype=float32))
('Action ', array([ 6.80660963,  7.56718683], dtype=float32))
('Action ', array([ 9.51484776,  8.05384922], dtype=float32))
('Action ', array([ 6.87654734,  6.87569952], dtype=float32))
('Action ', array([ 9.35398006,  7.52662325], dtype=float32))
('Action ', array([ 6.79159117,  6.49694014], dtype=float32))
('Action ', array([ 9.35398006,  7.52662325], dtype=float32))
('Action ', array([ 6.75049353,  7.15782499], dtype=float32))
('Action ', array([ 8.72092152,  8.56003284], dtype=float32))
('Action ', array([ 6.7802825 ,  7.09225035], dtype=float32))
('Action ', array([ 7.9065299,  7.2000165], dtype=float32))
('Action '

('Action ', array([ 6.94460201,  4.57969904], dtype=float32))
('Action ', array([ 3.87816119,  4.13490725], dtype=float32))
('Action ', array([ 6.0152483 ,  5.06162119], dtype=float32))
('Action ', array([ 4.03847027,  4.18847513], dtype=float32))
('Action ', array([ 5.9475565,  4.8527627], dtype=float32))
('Action ', array([ 4.0946846 ,  4.18358946], dtype=float32))
('Action ', array([ 6.06149006,  4.79484415], dtype=float32))
('Action ', array([ 4.12926769,  4.22855616], dtype=float32))
('Action ', array([ 6.06149006,  4.79484415], dtype=float32))
('Action ', array([ 4.07252884,  4.25118208], dtype=float32))
('Action ', array([ 6.01962757,  4.76806498], dtype=float32))
('Action ', array([ 4.81118488,  4.23745584], dtype=float32))
('Action ', array([ 6.16887474,  5.11718988], dtype=float32))
('Action ', array([ 4.82057285,  4.21941042], dtype=float32))
('Action ', array([ 5.39926434,  5.7378602 ], dtype=float32))
('Action ', array([ 4.18108749,  4.28215551], dtype=float32))
('Action '

('Action ', array([ 8.13182545,  7.88156652], dtype=float32))
('Action ', array([ 6.27930355,  7.4648509 ], dtype=float32))
('Action ', array([ 8.13182545,  7.88156652], dtype=float32))
('Action ', array([ 6.27930355,  7.4648509 ], dtype=float32))
('Action ', array([ 8.42737579,  8.27655029], dtype=float32))
('Action ', array([ 6.27930355,  7.4648509 ], dtype=float32))
('Action ', array([ 8.88499165,  7.77075052], dtype=float32))
('Action ', array([ 6.27930355,  7.4648509 ], dtype=float32))
('Action ', array([ 8.88499165,  7.77075052], dtype=float32))
('Action ', array([ 6.27930355,  7.4648509 ], dtype=float32))
('Action ', array([ 8.17334557,  8.18769073], dtype=float32))
('Action ', array([ 6.27930355,  7.4648509 ], dtype=float32))
('Action ', array([ 8.88499165,  7.77075052], dtype=float32))
('Action ', array([ 6.11537743,  7.35861444], dtype=float32))
('Action ', array([ 8.72391987,  8.53131485], dtype=float32))
('Action ', array([ 6.11537743,  7.35861444], dtype=float32))
('Action

('Action ', array([ 7.32442188,  5.52569151], dtype=float32))
('Action ', array([ 5.01156187,  4.0502429 ], dtype=float32))
('Action ', array([ 4.10609388,  5.84728575], dtype=float32))
('Action ', array([ 6.39145899,  7.71773767], dtype=float32))
('Action ', array([ 4.88360929,  6.78166914], dtype=float32))
('Action ', array([ 6.13124418,  7.11630678], dtype=float32))
Episode: 1565/5000, score: 19
('Action ', array([ 8.08657265,  7.91687489], dtype=float32))
('Action ', array([ 6.86195993,  8.24915695], dtype=float32))
('Action ', array([ 8.97685432,  9.84500599], dtype=float32))
('Action ', array([ 6.86195993,  8.24915695], dtype=float32))
('Action ', array([ 8.08657265,  7.91687489], dtype=float32))
('Action ', array([ 6.68986368,  8.01978493], dtype=float32))
('Action ', array([ 8.93987942,  8.98550129], dtype=float32))
('Action ', array([ 6.67980337,  7.99559164], dtype=float32))
('Action ', array([ 9.03682137,  7.27380037], dtype=float32))
('Action ', array([ 6.6286788 ,  7.80676

('Action ', array([ 4.17570114,  1.2242322 ], dtype=float32))
('Action ', array([ 4.58635235,  5.21533537], dtype=float32))
Episode: 1572/5000, score: 13
('Action ', array([ 8.07794094,  7.86136293], dtype=float32))
('Action ', array([ 6.63120461,  7.95336294], dtype=float32))
('Action ', array([ 7.4338336 ,  8.42128563], dtype=float32))
('Action ', array([ 8.07794094,  7.86136293], dtype=float32))
('Action ', array([ 6.63120461,  7.95336294], dtype=float32))
('Action ', array([ 7.4338336 ,  8.42128563], dtype=float32))
('Action ', array([ 6.63120461,  7.95336294], dtype=float32))
('Action ', array([ 8.07794094,  7.86136293], dtype=float32))
('Action ', array([ 6.74809933,  8.13375282], dtype=float32))
('Action ', array([ 7.06782436,  5.56174135], dtype=float32))
('Action ', array([ 6.71335316,  8.01075268], dtype=float32))
('Action ', array([ 6.5052166 ,  3.80803347], dtype=float32))
('Action ', array([ 6.72560501,  8.01461124], dtype=float32))
('Action ', array([ 6.61215115,  3.64004

('Action ', array([ 6.77925396,  7.91927099], dtype=float32))
('Action ', array([ 6.54649448,  9.59285259], dtype=float32))
('Action ', array([ 6.30516434,  6.6469779 ], dtype=float32))
('Action ', array([ 6.50322819,  8.82667446], dtype=float32))
('Action ', array([ 5.74851227,  5.62884569], dtype=float32))
('Action ', array([ 2.61695027,  2.10761499], dtype=float32))
('Action ', array([ 6.73276901,  6.41488695], dtype=float32))
('Action ', array([ 3.07994771,  3.57975626], dtype=float32))
Episode: 1581/5000, score: 20
('Action ', array([ 8.13577366,  7.94908714], dtype=float32))
('Action ', array([ 6.34514904,  7.69832706], dtype=float32))
('Action ', array([ 8.41153145,  8.40948963], dtype=float32))
('Action ', array([ 6.34514904,  7.69832706], dtype=float32))
('Action ', array([ 8.41153145,  8.40948963], dtype=float32))
('Action ', array([ 6.34514904,  7.69832706], dtype=float32))
('Action ', array([ 8.41278648,  8.35515499], dtype=float32))
('Action ', array([ 6.34514904,  7.69832

('Action ', array([ 6.38937235,  7.22426558], dtype=float32))
('Action ', array([ 8.98431778,  5.07862806], dtype=float32))
('Action ', array([ 5.69684458,  6.2750144 ], dtype=float32))
('Action ', array([ 8.17626667,  4.70787001], dtype=float32))
('Action ', array([ 5.66941214,  6.18174791], dtype=float32))
('Action ', array([ 9.63298607,  5.39106321], dtype=float32))
('Action ', array([ 4.31962729,  5.04532194], dtype=float32))
('Action ', array([ 6.75564337,  3.97823691], dtype=float32))
('Action ', array([ 4.31516981,  5.04473639], dtype=float32))
('Action ', array([ 7.35391474, -4.07658434], dtype=float32))
('Action ', array([ 4.26520967,  4.96370173], dtype=float32))
('Action ', array([ 7.409163  ,  2.85161948], dtype=float32))
('Action ', array([ 4.13750124,  5.00147486], dtype=float32))
('Action ', array([ 6.15894938,  1.40839744], dtype=float32))
('Action ', array([ 5.24221754,  5.40217829], dtype=float32))
('Action ', array([ 6.03962564,  1.87751746], dtype=float32))
('Action

('Action ', array([ 8.07463169,  8.08069611], dtype=float32))
('Action ', array([ 6.23904324,  8.01291943], dtype=float32))
('Action ', array([ 6.16409445,  7.89893961], dtype=float32))
('Action ', array([ 6.69890785,  8.52688408], dtype=float32))
('Action ', array([ 5.13038445,  7.49972582], dtype=float32))
('Action ', array([ 5.12498569,  6.14778566], dtype=float32))
('Action ', array([ 6.28060818,  7.25192118], dtype=float32))
('Action ', array([ 4.95708752,  7.15878725], dtype=float32))
('Action ', array([ 4.34939003,  5.60113764], dtype=float32))
('Action ', array([ 1.59213996,  4.36320162], dtype=float32))
Episode: 1591/5000, score: 10
('Action ', array([ 6.3773284 ,  7.89499331], dtype=float32))
('Action ', array([ 8.27748013,  8.67170048], dtype=float32))
('Action ', array([ 6.3773284 ,  7.89499331], dtype=float32))
('Action ', array([ 6.3773284 ,  7.89499331], dtype=float32))
('Action ', array([ 6.35597849,  7.91227198], dtype=float32))
('Action ', array([ 7.61976528,  9.92253

Episode: 1599/5000, score: 11
('Action ', array([ 8.22734261,  8.01393795], dtype=float32))
('Action ', array([ 6.49331284,  7.61018753], dtype=float32))
('Action ', array([ 8.22734261,  8.01393795], dtype=float32))
('Action ', array([ 6.49331284,  7.61018753], dtype=float32))
('Action ', array([ 8.22734261,  8.01393795], dtype=float32))
('Action ', array([ 6.50654888,  7.60779762], dtype=float32))
('Action ', array([ 8.22688103,  7.76756954], dtype=float32))
('Action ', array([ 6.50654888,  7.60779762], dtype=float32))
('Action ', array([ 8.22688103,  7.76756954], dtype=float32))
('Action ', array([ 6.50654888,  7.60779762], dtype=float32))
('Action ', array([ 8.53890228,  7.72982693], dtype=float32))
('Action ', array([ 6.50614262,  7.6074419 ], dtype=float32))
('Action ', array([ 8.96208477,  8.66109085], dtype=float32))
('Action ', array([ 6.50614262,  7.6074419 ], dtype=float32))
('Action ', array([ 8.61581993,  8.55548096], dtype=float32))
('Action ', array([ 6.50573349,  7.60708

('Action ', array([ 6.93250561,  6.51375294], dtype=float32))
('Action ', array([ 6.30632687,  8.03458214], dtype=float32))
('Action ', array([ 5.60131359,  6.21335316], dtype=float32))
('Action ', array([ 6.30548   ,  7.99073315], dtype=float32))
('Action ', array([ 1.72956574,  4.53016758], dtype=float32))
('Action ', array([ 5.16816711,  6.78334904], dtype=float32))
Episode: 1608/5000, score: 17
('Action ', array([ 8.35169983,  8.09828186], dtype=float32))
('Action ', array([ 6.65934753,  8.46430588], dtype=float32))
('Action ', array([ 8.35169983,  8.09828186], dtype=float32))
('Action ', array([ 6.65934753,  8.46430588], dtype=float32))
('Action ', array([ 8.35169983,  8.09828186], dtype=float32))
('Action ', array([ 6.65934753,  8.46430588], dtype=float32))
('Action ', array([ 9.2686348,  9.56917  ], dtype=float32))
('Action ', array([ 6.65934753,  8.46430588], dtype=float32))
('Action ', array([ 9.00122452,  9.34747219], dtype=float32))
('Action ', array([ 6.66039467,  8.4691505

('Action ', array([ 6.71024752,  8.01100826], dtype=float32))
('Action ', array([ 10.50651169,   5.72237253], dtype=float32))
('Action ', array([ 6.71024752,  8.01100826], dtype=float32))
('Action ', array([ 10.54593086,   5.48893976], dtype=float32))
('Action ', array([ 6.71024752,  8.01100826], dtype=float32))
('Action ', array([ 10.44705963,   5.5546937 ], dtype=float32))
('Action ', array([ 6.79363298,  8.2017231 ], dtype=float32))
('Action ', array([ 10.29020405,   5.11308527], dtype=float32))
('Action ', array([ 6.79363298,  8.2017231 ], dtype=float32))
('Action ', array([ 10.29020405,   5.11308527], dtype=float32))
('Action ', array([ 6.86825991,  8.37369728], dtype=float32))
('Action ', array([ 10.37692547,   5.24311686], dtype=float32))
('Action ', array([ 6.83441782,  8.30965519], dtype=float32))
('Action ', array([ 9.23170471,  3.70060945], dtype=float32))
('Action ', array([ 6.85568666,  8.35681343], dtype=float32))
('Action ', array([ 9.92901516,  3.64904618], dtype=float3

('Action ', array([ 6.65119791,  7.68784523], dtype=float32))
('Action ', array([ 7.28700113,  5.63757038], dtype=float32))
('Action ', array([ 5.83727789,  6.35946751], dtype=float32))
('Action ', array([ 6.59052229,  7.6662941 ], dtype=float32))
('Action ', array([ 5.8900733 ,  6.71854115], dtype=float32))
('Action ', array([ 6.50089121,  7.61510754], dtype=float32))
('Action ', array([ 3.38794565,  2.56263804], dtype=float32))
Episode: 1617/5000, score: 20
('Action ', array([ 8.21795273,  8.30646992], dtype=float32))
('Action ', array([ 6.96711969,  8.96714401], dtype=float32))
('Action ', array([  9.85981083,  10.10341167], dtype=float32))
('Action ', array([ 7.47389269,  9.19245148], dtype=float32))
('Action ', array([  9.5375309,  11.3308382], dtype=float32))
('Action ', array([ 7.70830297,  9.11419296], dtype=float32))
('Action ', array([  9.19898701,  11.42086887], dtype=float32))
('Action ', array([ 6.6408143 ,  7.37232018], dtype=float32))
('Action ', array([ 3.66152167,  6.4

('Action ', array([ 9.77446842,  8.4923954 ], dtype=float32))
('Action ', array([ 6.79919529,  7.42989016], dtype=float32))
('Action ', array([ 9.23680592,  6.93680906], dtype=float32))
('Action ', array([ 7.42888641,  7.51380873], dtype=float32))
('Action ', array([ 9.34930134,  7.36792326], dtype=float32))
('Action ', array([ 5.99172115,  6.26283312], dtype=float32))
('Action ', array([ 8.93923855,  7.30157423], dtype=float32))
('Action ', array([ 6.02607155,  6.13336039], dtype=float32))
('Action ', array([ 8.93923855,  7.30157423], dtype=float32))
('Action ', array([ 6.0707016 ,  6.16717768], dtype=float32))
('Action ', array([ 7.28321505,  6.7541728 ], dtype=float32))
Episode: 1626/5000, score: 34
('Action ', array([ 8.4810276 ,  8.37413788], dtype=float32))
('Action ', array([ 7.11886978,  8.54733849], dtype=float32))
('Action ', array([ 9.62126732,  7.95039415], dtype=float32))
('Action ', array([ 7.11886978,  8.54733849], dtype=float32))
('Action ', array([ 10.60175514,   8.170

('Action ', array([ 6.90864325,  7.06434011], dtype=float32))
('Action ', array([ 5.64414692,  5.90747213], dtype=float32))
('Action ', array([ 4.1826086 ,  5.84254217], dtype=float32))
('Action ', array([ 5.44173908,  5.53987837], dtype=float32))
('Action ', array([ 0.01968305,  2.08213949], dtype=float32))
('Action ', array([ 5.3643837 ,  5.53382444], dtype=float32))
Episode: 1631/5000, score: 17
('Action ', array([ 8.48949146,  8.51850319], dtype=float32))
('Action ', array([ 7.14573479,  8.52567005], dtype=float32))
('Action ', array([ 7.19274902,  8.54620552], dtype=float32))
('Action ', array([ 9.23735619,  9.57305336], dtype=float32))
('Action ', array([ 7.34673786,  7.42669487], dtype=float32))
('Action ', array([ 6.75065708,  6.40763855], dtype=float32))
('Action ', array([ 6.01926231,  6.05108166], dtype=float32))
('Action ', array([ 4.50806427,  6.60520172], dtype=float32))
('Action ', array([ 6.38116264,  5.78567123], dtype=float32))
Episode: 1632/5000, score: 9
('Action ',

('Action ', array([ 6.91358471,  3.71253157], dtype=float32))
('Action ', array([ 5.6248312 ,  6.14750814], dtype=float32))
('Action ', array([ 5.50705433,  6.06745672], dtype=float32))
('Action ', array([ 1.90959811, -1.21643126], dtype=float32))
Episode: 1639/5000, score: 16
('Action ', array([ 8.72993946,  8.77823162], dtype=float32))
('Action ', array([ 7.95376635,  9.69829655], dtype=float32))
('Action ', array([ 11.23330212,  11.77245426], dtype=float32))
('Action ', array([ 7.65561247,  9.31315231], dtype=float32))
('Action ', array([ 8.19881821,  7.3241291 ], dtype=float32))
('Action ', array([ 7.58497858,  9.14408112], dtype=float32))
('Action ', array([ 7.53702784,  7.90879631], dtype=float32))
('Action ', array([ 7.57492495,  9.18198299], dtype=float32))
('Action ', array([ 5.46074438,  6.05827522], dtype=float32))
('Action ', array([ 6.40285635,  7.8532486 ], dtype=float32))
Episode: 1640/5000, score: 9
('Action ', array([ 8.78168106,  8.81299591], dtype=float32))
('Action 

('Action ', array([ 9.50150108,  8.86214352], dtype=float32))
('Action ', array([ 7.62415361,  8.64774227], dtype=float32))
('Action ', array([ 9.79808903,  9.06039143], dtype=float32))
('Action ', array([ 7.62321997,  8.64530945], dtype=float32))
('Action ', array([ 8.42819023,  9.12685871], dtype=float32))
('Action ', array([ 7.90575838,  8.66111374], dtype=float32))
('Action ', array([ 6.03845263,  4.85263586], dtype=float32))
Episode: 1646/5000, score: 20
('Action ', array([ 8.88277149,  8.88395596], dtype=float32))
('Action ', array([ 7.49617243,  8.7460556 ], dtype=float32))
('Action ', array([ 8.88277149,  8.88395596], dtype=float32))
('Action ', array([ 7.51561213,  8.75862885], dtype=float32))
('Action ', array([ 9.52479267,  9.08143139], dtype=float32))
('Action ', array([ 7.18659258,  7.40718174], dtype=float32))
('Action ', array([ 8.97267628,  6.80343628], dtype=float32))
('Action ', array([ 6.22333002,  6.41545963], dtype=float32))
('Action ', array([ 5.90056562,  1.29716

('Action ', array([ 3.5762291 ,  5.54955959], dtype=float32))
Episode: 1654/5000, score: 12
('Action ', array([ 9.0126009 ,  9.06809998], dtype=float32))
('Action ', array([ 7.37601137,  8.64217186], dtype=float32))
('Action ', array([ 9.0126009 ,  9.06809998], dtype=float32))
('Action ', array([ 7.39539862,  8.6546917 ], dtype=float32))
('Action ', array([ 8.98228836,  8.64357567], dtype=float32))
('Action ', array([ 6.3724494 ,  7.45579529], dtype=float32))
('Action ', array([ 7.52772951,  5.08124352], dtype=float32))
('Action ', array([ 5.00679827,  6.17644405], dtype=float32))
('Action ', array([ 4.65655851,  3.31133294], dtype=float32))
('Action ', array([ 4.99324369,  6.10932636], dtype=float32))
('Action ', array([ 3.54199362,  3.78459573], dtype=float32))
('Action ', array([ 4.8791213 ,  5.73985672], dtype=float32))
Episode: 1655/5000, score: 11
('Action ', array([ 9.03675079,  9.10011482], dtype=float32))
('Action ', array([ 7.30592585,  8.55556965], dtype=float32))
('Action '

('Action ', array([ 8.97599697,  9.01519489], dtype=float32))
('Action ', array([ 8.05384922,  9.27704906], dtype=float32))
('Action ', array([ 10.23753643,   9.74570465], dtype=float32))
('Action ', array([ 7.82618713,  8.99063969], dtype=float32))
('Action ', array([ 9.37858486,  6.62114334], dtype=float32))
('Action ', array([ 7.38728905,  7.99127197], dtype=float32))
('Action ', array([ 9.12654018,  5.67678452], dtype=float32))
('Action ', array([ 8.95933819,  5.94717026], dtype=float32))
('Action ', array([ 7.18208313,  7.86767864], dtype=float32))
('Action ', array([ 6.2128191 ,  4.87202454], dtype=float32))
('Action ', array([ 7.10416889,  7.88739681], dtype=float32))
('Action ', array([ 6.31833982,  5.18115234], dtype=float32))
('Action ', array([ 7.03107452,  7.80075264], dtype=float32))
('Action ', array([ 4.59947205,  3.58563209], dtype=float32))
('Action ', array([ 6.60224152,  7.1473093 ], dtype=float32))
Episode: 1664/5000, score: 15
('Action ', array([ 8.99446106,  9.032

('Action ', array([ 0.76134247,  4.83577156], dtype=float32))
('Action ', array([ 8.40798283,  7.98204136], dtype=float32))
('Action ', array([ 0.53340667, -8.21731758], dtype=float32))
('Action ', array([ 8.42994213,  7.9766264 ], dtype=float32))
('Action ', array([ 8.37063217, -8.72924614], dtype=float32))
('Action ', array([ 9.21165371,  8.22937298], dtype=float32))
('Action ', array([ 4.17786169, -3.12560844], dtype=float32))
('Action ', array([ 9.63035679,  8.53520489], dtype=float32))
('Action ', array([-2.65001154, -4.8198452 ], dtype=float32))
('Action ', array([ 9.89867306,  8.74834633], dtype=float32))
('Action ', array([ 7.44617319,  1.48552501], dtype=float32))
('Action ', array([ 8.92226696,  9.22616196], dtype=float32))
('Action ', array([ 8.1016264,  9.1537199], dtype=float32))
('Action ', array([ 8.8258791,  9.7083416], dtype=float32))
('Action ', array([ 8.06779766,  9.00412369], dtype=float32))
('Action ', array([ 7.24764585,  8.57622528], dtype=float32))
('Action ', 

('Action ', array([ 8.74370098,  8.83067322], dtype=float32))
('Action ', array([ 8.25710869,  7.71419191], dtype=float32))
('Action ', array([ 8.9245882 ,  8.55607128], dtype=float32))
('Action ', array([ 6.91795063,  5.29380083], dtype=float32))
('Action ', array([ 8.22520924,  7.51319265], dtype=float32))
('Action ', array([ 5.36701584,  1.80524099], dtype=float32))
('Action ', array([ 8.13774967,  7.32735491], dtype=float32))
('Action ', array([ 0.13378061,  0.09991109], dtype=float32))
Episode: 1680/5000, score: 20
('Action ', array([ 8.80277729,  9.11836243], dtype=float32))
('Action ', array([ 7.82882977,  8.38864803], dtype=float32))
('Action ', array([ 9.20285416,  9.38362408], dtype=float32))
('Action ', array([ 7.66243362,  8.21292877], dtype=float32))
('Action ', array([ 8.41506195,  7.9494071 ], dtype=float32))
('Action ', array([ 6.28148937,  6.58687353], dtype=float32))
('Action ', array([ 8.06401634,  7.98311949], dtype=float32))
('Action ', array([ 6.41241932,  6.55495

('Action ', array([ 10.01618958,   9.10955048], dtype=float32))
('Action ', array([ 8.21757698,  8.60166168], dtype=float32))
('Action ', array([ 9.82825851,  9.11593246], dtype=float32))
('Action ', array([ 8.21757698,  8.60166168], dtype=float32))
('Action ', array([ 10.2254715 ,   9.35984421], dtype=float32))
('Action ', array([ 8.21757698,  8.60166168], dtype=float32))
('Action ', array([ 10.2254715 ,   9.35984421], dtype=float32))
('Action ', array([ 8.21757698,  8.60166168], dtype=float32))
('Action ', array([ 10.30284595,   9.34766388], dtype=float32))
('Action ', array([ 8.30836487,  8.76928902], dtype=float32))
('Action ', array([ 10.32349396,   9.34563828], dtype=float32))
('Action ', array([ 8.32098484,  8.77228069], dtype=float32))
('Action ', array([ 8.63870811,  8.93997574], dtype=float32))
('Action ', array([ 8.30637646,  8.88108921], dtype=float32))
('Action ', array([ 8.62043953,  8.61188507], dtype=float32))
('Action ', array([ 8.32441139,  8.90414238], dtype=float32)

('Action ', array([ 7.05099535,  6.41188431], dtype=float32))
('Action ', array([ 8.89953995,  5.27876949], dtype=float32))
('Action ', array([ 7.62538481,  7.19049644], dtype=float32))
('Action ', array([ 6.41548204,  4.43979549], dtype=float32))
('Action ', array([ 7.38525629,  7.00708008], dtype=float32))
Episode: 1692/5000, score: 17
('Action ', array([ 8.73191929,  9.02269745], dtype=float32))
('Action ', array([ 7.84548903,  8.24746513], dtype=float32))
('Action ', array([ 8.73191929,  9.02269745], dtype=float32))
('Action ', array([ 7.85440111,  8.26095963], dtype=float32))
('Action ', array([ 9.35617447,  8.99931431], dtype=float32))
('Action ', array([ 8.29297352,  8.78171349], dtype=float32))
('Action ', array([ 8.02460003,  8.08744907], dtype=float32))
('Action ', array([ 7.43449259,  7.38451099], dtype=float32))
('Action ', array([ 5.57241869,  5.0556879 ], dtype=float32))
('Action ', array([ 7.27856398,  7.25429726], dtype=float32))
('Action ', array([ 5.0226779 ,  2.88934

Episode: 1701/5000, score: 11
('Action ', array([ 8.61854362,  8.9608736 ], dtype=float32))
('Action ', array([ 8.15385723,  8.78138256], dtype=float32))
('Action ', array([ 9.49817657,  8.32097912], dtype=float32))
('Action ', array([ 8.16216087,  8.75272369], dtype=float32))
('Action ', array([ 8.98271656,  8.49322033], dtype=float32))
('Action ', array([ 7.33219528,  7.5078373 ], dtype=float32))
('Action ', array([ 8.98271656,  8.49322033], dtype=float32))
('Action ', array([ 7.36539841,  7.50508499], dtype=float32))
('Action ', array([ 8.98271656,  8.49322033], dtype=float32))
('Action ', array([ 7.36539841,  7.50508499], dtype=float32))
('Action ', array([ 9.13677692,  8.41182995], dtype=float32))
('Action ', array([ 7.34933853,  7.4925127 ], dtype=float32))
('Action ', array([ 9.13677692,  8.41182995], dtype=float32))
('Action ', array([ 7.34933853,  7.4925127 ], dtype=float32))
('Action ', array([ 9.13677692,  8.41182995], dtype=float32))
('Action ', array([ 7.05366039,  6.53580

('Action ', array([ 6.31580067,  4.06318474], dtype=float32))
('Action ', array([ 8.18142128,  8.67990303], dtype=float32))
('Action ', array([ 6.44995022,  6.23710442], dtype=float32))
('Action ', array([ 7.89926624,  8.2059927 ], dtype=float32))
('Action ', array([ 2.46679235,  5.77993584], dtype=float32))
Episode: 1707/5000, score: 30
('Action ', array([ 8.60264683,  8.89594746], dtype=float32))
('Action ', array([ 7.73195982,  8.11294079], dtype=float32))
('Action ', array([ 8.60264683,  8.89594746], dtype=float32))
('Action ', array([ 7.75103807,  8.12528229], dtype=float32))
('Action ', array([ 7.84754848,  8.19614506], dtype=float32))
('Action ', array([ 6.77513075,  6.74040794], dtype=float32))
('Action ', array([ 4.68287039,  5.58203983], dtype=float32))
('Action ', array([ 6.83880377,  6.59438229], dtype=float32))
('Action ', array([ 1.95654523,  6.53405476], dtype=float32))
('Action ', array([ 7.22712278,  6.65710735], dtype=float32))
Episode: 1708/5000, score: 9
('Action ',

('Action ', array([ 6.96026087,  7.46100616], dtype=float32))
('Action ', array([ 2.78003359,  0.83595288], dtype=float32))
Episode: 1716/5000, score: 14
('Action ', array([ 8.65926647,  8.75455856], dtype=float32))
('Action ', array([ 7.15809441,  7.78160954], dtype=float32))
('Action ', array([ 9.49945259,  8.00176907], dtype=float32))
('Action ', array([ 7.3014555 ,  7.88249016], dtype=float32))
('Action ', array([ 9.49945259,  8.00176907], dtype=float32))
('Action ', array([ 7.56018066,  7.95981979], dtype=float32))
('Action ', array([ 9.49945259,  8.00176907], dtype=float32))
('Action ', array([ 7.54453754,  7.94813061], dtype=float32))
('Action ', array([ 8.88664436,  7.77733135], dtype=float32))
('Action ', array([ 6.86595058,  6.96127796], dtype=float32))
('Action ', array([ 8.74621391,  6.87625217], dtype=float32))
('Action ', array([ 6.42595768,  6.5775671 ], dtype=float32))
('Action ', array([ 8.43851471,  7.31929493], dtype=float32))
('Action ', array([ 5.17804146,  5.31728

('Action ', array([ 8.6618557 ,  8.82289791], dtype=float32))
('Action ', array([ 6.87474632,  8.08229351], dtype=float32))
('Action ', array([ 8.6618557 ,  8.82289791], dtype=float32))
('Action ', array([ 6.82403183,  8.01109791], dtype=float32))
('Action ', array([ 10.22045326,   9.61199856], dtype=float32))
('Action ', array([ 7.19064522,  8.32695293], dtype=float32))
('Action ', array([ 9.24030495,  8.69157696], dtype=float32))
('Action ', array([ 5.98190117,  6.8111062 ], dtype=float32))
('Action ', array([ 7.37012291,  7.49914122], dtype=float32))
('Action ', array([ 6.04119205,  6.87590742], dtype=float32))
('Action ', array([ 3.73633933,  6.1530261 ], dtype=float32))
('Action ', array([ 3.56734252,  4.20309591], dtype=float32))
Episode: 1725/5000, score: 11
('Action ', array([ 6.5375638 ,  7.44872904], dtype=float32))
('Action ', array([ 8.65292072,  8.8146143 ], dtype=float32))
('Action ', array([ 6.5375638 ,  7.44872904], dtype=float32))
('Action ', array([ 8.65292072,  8.814

('Action ', array([ 7.70323515,  5.41648531], dtype=float32))
('Action ', array([ 6.69943047,  7.69522524], dtype=float32))
('Action ', array([ 8.32846451,  5.97858858], dtype=float32))
('Action ', array([ 6.68148613,  7.68487883], dtype=float32))
('Action ', array([ 8.31954956,  5.13361025], dtype=float32))
('Action ', array([ 6.74418354,  7.77386808], dtype=float32))
('Action ', array([ 8.93950748,  5.32349825], dtype=float32))
('Action ', array([ 6.73426533,  7.77195215], dtype=float32))
('Action ', array([ 8.1933136 ,  5.76051188], dtype=float32))
('Action ', array([ 6.71171761,  7.78053045], dtype=float32))
('Action ', array([ 6.34077835,  4.46989679], dtype=float32))
('Action ', array([ 6.60822105,  7.69440222], dtype=float32))
('Action ', array([ 5.13768196,  2.12542176], dtype=float32))
('Action ', array([ 6.42026901,  7.55077219], dtype=float32))
('Action ', array([ 4.50219822,  3.51355577], dtype=float32))
('Action ', array([ 6.34770012,  7.42398691], dtype=float32))
('Action

('Action ', array([ 8.48496628,  8.71796417], dtype=float32))
('Action ', array([ 6.8404727 ,  8.18471718], dtype=float32))
('Action ', array([ 9.08477497,  8.58228683], dtype=float32))
('Action ', array([ 7.69064569,  8.99349689], dtype=float32))
('Action ', array([ 8.04719639,  9.17476368], dtype=float32))
('Action ', array([ 8.25502491,  6.88204622], dtype=float32))
('Action ', array([ 7.17408705,  7.46370745], dtype=float32))
('Action ', array([ 8.64323235,  6.1110425 ], dtype=float32))
('Action ', array([ 7.17218637,  7.42381716], dtype=float32))
('Action ', array([ 8.71514034,  6.14990664], dtype=float32))
('Action ', array([ 7.00898981,  7.32920122], dtype=float32))
('Action ', array([ 8.73258495,  6.0977025 ], dtype=float32))
('Action ', array([ 7.00898981,  7.32920122], dtype=float32))
('Action ', array([ 8.73258495,  6.0977025 ], dtype=float32))
('Action ', array([ 6.65480375,  6.37056971], dtype=float32))
('Action ', array([ 7.34539795,  4.72079134], dtype=float32))
('Action

('Action ', array([ 6.65032053,  5.14570427], dtype=float32))
('Action ', array([ 5.06212902,  5.61823845], dtype=float32))
('Action ', array([ 6.87496328,  5.24638557], dtype=float32))
('Action ', array([ 4.98981857,  5.65860844], dtype=float32))
('Action ', array([ 9.1700058,  7.9336834], dtype=float32))
('Action ', array([ 4.87183762,  5.55724049], dtype=float32))
('Action ', array([ 8.72116661,  7.63986397], dtype=float32))
('Action ', array([ 4.90368748,  5.55798912], dtype=float32))
('Action ', array([ 9.14989948,  8.5973835 ], dtype=float32))
('Action ', array([ 5.24276638,  5.65404701], dtype=float32))
('Action ', array([ 5.47056961,  6.06278229], dtype=float32))
('Action ', array([ 5.35997581,  2.41827965], dtype=float32))
('Action ', array([ 5.56073856,  6.18383312], dtype=float32))
('Action ', array([ 3.89001489,  2.39260292], dtype=float32))
('Action ', array([ 6.02186775,  6.76722813], dtype=float32))
('Action ', array([-0.58278441,  2.09778404], dtype=float32))
('Action '

('Action ', array([ 8.37251377,  8.85283661], dtype=float32))
('Action ', array([ 7.23219824,  9.07058048], dtype=float32))
('Action ', array([ 8.37251377,  8.85283661], dtype=float32))
('Action ', array([ 7.69018698,  9.6243515 ], dtype=float32))
('Action ', array([ 9.74208546,  9.55957413], dtype=float32))
('Action ', array([ 7.38093519,  8.35934925], dtype=float32))
('Action ', array([ 6.00531483,  6.62408304], dtype=float32))
('Action ', array([ 2.70125365,  4.52294779], dtype=float32))
('Action ', array([ 6.31119776,  6.9651227 ], dtype=float32))
Episode: 1756/5000, score: 9
('Action ', array([ 8.37871933,  8.86862659], dtype=float32))
('Action ', array([ 7.2301569 ,  9.11191177], dtype=float32))
('Action ', array([ 8.37871933,  8.86862659], dtype=float32))
('Action ', array([ 7.52709484,  9.45142174], dtype=float32))
('Action ', array([ 9.19352436,  9.99650383], dtype=float32))
('Action ', array([ 7.15430069,  8.36654377], dtype=float32))
('Action ', array([ 4.63101387,  6.180075

('Action ', array([ 8.50925922,  8.83733273], dtype=float32))
('Action ', array([ 7.37252665,  9.17151833], dtype=float32))
('Action ', array([ 6.55897856,  6.7934866 ], dtype=float32))
('Action ', array([ 7.67912912,  9.42070007], dtype=float32))
('Action ', array([ 5.69619608,  5.32910633], dtype=float32))
('Action ', array([ 7.24503946,  8.26828766], dtype=float32))
('Action ', array([ 4.43572092,  4.70182514], dtype=float32))
('Action ', array([ 6.81562281,  7.91501617], dtype=float32))
('Action ', array([ 3.91341996,  4.64213276], dtype=float32))
('Action ', array([ 4.25329161,  5.17253494], dtype=float32))
('Action ', array([-0.14409032, -2.59533978], dtype=float32))
Episode: 1767/5000, score: 10
('Action ', array([ 8.49115276,  8.87654877], dtype=float32))
('Action ', array([ 7.92496204,  9.51682949], dtype=float32))
('Action ', array([  9.30368328,  10.02111149], dtype=float32))
('Action ', array([ 7.74891376,  9.26563358], dtype=float32))
('Action ', array([ 7.67240334,  9.036

('Action ', array([ 8.82592297,  8.93884945], dtype=float32))
('Action ', array([ 7.51150942,  8.87100029], dtype=float32))
('Action ', array([ 8.82592297,  8.93884945], dtype=float32))
('Action ', array([ 7.49618864,  8.84943295], dtype=float32))
('Action ', array([ 10.47198296,   9.67790031], dtype=float32))
('Action ', array([ 7.56602335,  8.94055367], dtype=float32))
('Action ', array([ 10.54205608,   9.36672878], dtype=float32))
('Action ', array([ 5.98600245,  7.01585245], dtype=float32))
('Action ', array([ 9.98191738,  5.82840395], dtype=float32))
('Action ', array([ 5.96806765,  6.99792624], dtype=float32))
('Action ', array([ 9.49818611,  4.92225885], dtype=float32))
('Action ', array([ 6.18329   ,  7.03188944], dtype=float32))
('Action ', array([ 7.46115637,  0.42160267], dtype=float32))
('Action ', array([ 5.05860186, -2.35339117], dtype=float32))
Episode: 1777/5000, score: 14
('Action ', array([ 7.46982718,  8.76686287], dtype=float32))
('Action ', array([ 9.31843853,  8.5

('Action ', array([ 8.80925941,  9.12094879], dtype=float32))
('Action ', array([ 7.22286844,  8.54779053], dtype=float32))
('Action ', array([ 9.58797455,  9.41852188], dtype=float32))
('Action ', array([ 7.27283621,  8.62076664], dtype=float32))
('Action ', array([ 9.58797455,  9.41852188], dtype=float32))
('Action ', array([ 7.19181585,  8.55022812], dtype=float32))
('Action ', array([ 9.58797455,  9.41852188], dtype=float32))
('Action ', array([ 7.88060999,  9.14541054], dtype=float32))
('Action ', array([ 10.82020092,  10.7870903 ], dtype=float32))
('Action ', array([ 8.23299503,  9.35933971], dtype=float32))
('Action ', array([ 7.76107645,  9.02695274], dtype=float32))
('Action ', array([ 8.19508934,  9.15679741], dtype=float32))
('Action ', array([ 6.80547857,  8.13116264], dtype=float32))
('Action ', array([ 8.14336395,  9.11594009], dtype=float32))
('Action ', array([ 2.9512887 ,  2.76976585], dtype=float32))
Episode: 1786/5000, score: 14
('Action ', array([ 6.88793373,  7.905

('Action ', array([ 8.58243465,  8.99836922], dtype=float32))
('Action ', array([ 6.39751768,  7.833745  ], dtype=float32))
('Action ', array([ 8.27966881,  9.5742321 ], dtype=float32))
('Action ', array([ 5.86844397,  7.33195782], dtype=float32))
('Action ', array([ 4.7378149 ,  7.95417213], dtype=float32))
('Action ', array([ 4.72468328,  5.63463879], dtype=float32))
('Action ', array([ 5.53979111,  8.44956779], dtype=float32))
('Action ', array([ 5.23255682,  5.72492599], dtype=float32))
('Action ', array([ 3.12368822,  2.34284043], dtype=float32))
('Action ', array([ 5.6306777 ,  5.83176899], dtype=float32))
Episode: 1795/5000, score: 9
('Action ', array([ 8.58315849,  8.98731709], dtype=float32))
('Action ', array([ 6.24907064,  7.26276636], dtype=float32))
('Action ', array([ 8.65177727,  9.20627975], dtype=float32))
('Action ', array([ 6.24772501,  7.23712873], dtype=float32))
('Action ', array([ 7.54828215,  8.14816189], dtype=float32))
('Action ', array([ 6.2440629 ,  7.252191

('Action ', array([ 8.59026718,  8.83298874], dtype=float32))
('Action ', array([ 5.82171679,  7.5667696 ], dtype=float32))
('Action ', array([ 8.59026718,  8.83298874], dtype=float32))
('Action ', array([ 5.74330664,  7.49795532], dtype=float32))
('Action ', array([ 7.61580038,  7.55831528], dtype=float32))
('Action ', array([ 4.20743704,  5.7210474 ], dtype=float32))
('Action ', array([ 5.4394331,  4.2479496], dtype=float32))
('Action ', array([ 4.57643747,  3.2022531 ], dtype=float32))
('Action ', array([ 5.07308531,  3.11011291], dtype=float32))
('Action ', array([ 4.29502535,  5.51746941], dtype=float32))
Episode: 1802/5000, score: 12
('Action ', array([ 8.55579758,  8.79963684], dtype=float32))
('Action ', array([ 5.48134947,  6.93860674], dtype=float32))
('Action ', array([ 8.55579758,  8.79963684], dtype=float32))
('Action ', array([ 5.52137804,  6.93871355], dtype=float32))
('Action ', array([ 7.15660667,  7.22482443], dtype=float32))
('Action ', array([ 5.74080992,  6.9886994

('Action ', array([ 8.34374523,  8.58410931], dtype=float32))
('Action ', array([ 5.14453411,  6.70652914], dtype=float32))
('Action ', array([ 8.47092056,  8.20992851], dtype=float32))
('Action ', array([ 5.14833355,  6.71138239], dtype=float32))
('Action ', array([ 8.41285896,  8.14976025], dtype=float32))
('Action ', array([ 4.77364349,  5.55467749], dtype=float32))
('Action ', array([ 8.18124294,  7.92841768], dtype=float32))
('Action ', array([ 5.17668533,  5.40729094], dtype=float32))
('Action ', array([ 6.45145988,  4.88250589], dtype=float32))
('Action ', array([ 3.55290151,  3.77096605], dtype=float32))
('Action ', array([ 6.37870693,  5.00316858], dtype=float32))
('Action ', array([ 3.71740746,  3.68821383], dtype=float32))
('Action ', array([ 5.92766762,  3.24744654], dtype=float32))
('Action ', array([ 3.92056966,  3.72804499], dtype=float32))
('Action ', array([ 6.03133154,  3.54474115], dtype=float32))
('Action ', array([ 3.82189202,  3.73187685], dtype=float32))
('Action

('Action ', array([ 8.20206451,  8.46861649], dtype=float32))
('Action ', array([ 5.90710545,  7.88260651], dtype=float32))
('Action ', array([ 8.20206451,  8.46861649], dtype=float32))
('Action ', array([ 5.98362637,  7.9756794 ], dtype=float32))
('Action ', array([ 8.35151005,  8.37991142], dtype=float32))
('Action ', array([ 5.16009426,  7.20068169], dtype=float32))
('Action ', array([ 8.20708275,  7.75086975], dtype=float32))
('Action ', array([ 5.15002728,  7.15789795], dtype=float32))
('Action ', array([ 6.11717224,  5.70907593], dtype=float32))
('Action ', array([ 3.75811601,  5.53315353], dtype=float32))
Episode: 1822/5000, score: 10
('Action ', array([ 5.71536827,  7.41662407], dtype=float32))
('Action ', array([ 8.02105045,  8.75957108], dtype=float32))
('Action ', array([ 5.71219158,  7.4122591 ], dtype=float32))
('Action ', array([  8.85182667,  10.17052841], dtype=float32))
('Action ', array([ 5.7769165 ,  7.45655537], dtype=float32))
('Action ', array([ 7.75980568,  7.344

('Action ', array([ 8.23843098,  8.26737213], dtype=float32))
('Action ', array([ 6.21960306,  7.78165436], dtype=float32))
('Action ', array([ 7.10019779,  8.03039455], dtype=float32))
('Action ', array([ 6.4321847 ,  7.81953907], dtype=float32))
('Action ', array([ 7.05665541,  8.01977825], dtype=float32))
('Action ', array([ 6.02750254,  6.2589922 ], dtype=float32))
('Action ', array([ 5.8887105 ,  6.06336975], dtype=float32))
('Action ', array([ 4.7624898 ,  5.22093201], dtype=float32))
('Action ', array([ 5.74702311,  5.60834122], dtype=float32))
Episode: 1834/5000, score: 9
('Action ', array([ 8.25770283,  8.25444317], dtype=float32))
('Action ', array([ 6.15650177,  7.8242383 ], dtype=float32))
('Action ', array([ 8.64579296,  8.11790562], dtype=float32))
('Action ', array([ 6.16456032,  7.82837057], dtype=float32))
('Action ', array([ 8.76150227,  8.08662033], dtype=float32))
('Action ', array([ 6.16456032,  7.82837057], dtype=float32))
('Action ', array([ 8.93693542,  9.839039

('Action ', array([ 8.25706482,  8.36736107], dtype=float32))
('Action ', array([ 6.17056227,  8.18292236], dtype=float32))
('Action ', array([ 6.16698217,  8.18245411], dtype=float32))
('Action ', array([ 8.67434502,  8.60002422], dtype=float32))
('Action ', array([ 6.33209658,  8.28264713], dtype=float32))
('Action ', array([ 7.62399626,  7.96314573], dtype=float32))
('Action ', array([ 5.27977419,  6.86381006], dtype=float32))
('Action ', array([ 5.92379618,  5.69720411], dtype=float32))
('Action ', array([ 5.03197527,  6.58539343], dtype=float32))
('Action ', array([ 5.6146245 ,  4.96684599], dtype=float32))
('Action ', array([ 5.18144369,  6.16889238], dtype=float32))
('Action ', array([ 1.72594225, -1.03151751], dtype=float32))
Episode: 1843/5000, score: 12
('Action ', array([ 8.31524849,  8.38500023], dtype=float32))
('Action ', array([ 7.61125612,  9.80687618], dtype=float32))
('Action ', array([ 9.62211037,  9.51941967], dtype=float32))
('Action ', array([ 7.36223841,  9.59704

('Action ', array([ 8.25846291,  8.55408287], dtype=float32))
('Action ', array([ 6.8997016 ,  8.46315479], dtype=float32))
('Action ', array([ 7.38513088,  9.09359264], dtype=float32))
('Action ', array([ 6.94066477,  8.46400642], dtype=float32))
('Action ', array([ 7.38513088,  9.09359264], dtype=float32))
('Action ', array([ 7.14424276,  8.50311089], dtype=float32))
('Action ', array([ 6.85573626,  8.88291359], dtype=float32))
('Action ', array([ 5.41842031,  6.49047375], dtype=float32))
('Action ', array([ 4.73442745,  6.74209404], dtype=float32))
('Action ', array([ 6.68282938,  6.75351524], dtype=float32))
('Action ', array([-2.68728781, -1.40345562], dtype=float32))
Episode: 1852/5000, score: 10
('Action ', array([ 8.27933979,  8.57624054], dtype=float32))
('Action ', array([ 7.26046371,  8.99597549], dtype=float32))
('Action ', array([ 8.86538029,  8.87915897], dtype=float32))
('Action ', array([ 7.3096571 ,  9.06435299], dtype=float32))
('Action ', array([ 8.85538292,  8.79198

('Action ', array([ 8.42442131,  8.86106396], dtype=float32))
('Action ', array([ 7.3925786 ,  8.12632561], dtype=float32))
('Action ', array([ 8.93224239,  8.87213898], dtype=float32))
('Action ', array([ 7.40440416,  8.11267662], dtype=float32))
('Action ', array([ 8.93224239,  8.87213898], dtype=float32))
('Action ', array([ 7.06514597,  6.95195532], dtype=float32))
('Action ', array([ 7.00894642,  6.95100927], dtype=float32))
('Action ', array([ 7.06514597,  6.95195532], dtype=float32))
('Action ', array([ 8.93224239,  8.87213898], dtype=float32))
('Action ', array([ 7.40440416,  8.11267662], dtype=float32))
('Action ', array([ 8.93224239,  8.87213898], dtype=float32))
('Action ', array([ 7.39493704,  8.12794399], dtype=float32))
('Action ', array([ 8.20893669,  9.85252762], dtype=float32))
('Action ', array([ 7.40400648,  8.16394615], dtype=float32))
('Action ', array([ 7.43342257,  8.16781139], dtype=float32))
('Action ', array([ 9.76411915,  9.01767731], dtype=float32))
('Action

('Action ', array([ 8.42706299,  8.93703747], dtype=float32))
('Action ', array([ 7.18409014,  7.9274497 ], dtype=float32))
('Action ', array([ 8.42706299,  8.93703747], dtype=float32))
('Action ', array([ 7.18409014,  7.9274497 ], dtype=float32))
('Action ', array([ 8.22703457,  8.46147823], dtype=float32))
('Action ', array([ 7.05526876,  7.43030882], dtype=float32))
('Action ', array([ 5.83735991,  5.20767355], dtype=float32))
('Action ', array([ 6.81734991,  7.10403967], dtype=float32))
('Action ', array([ 6.23630857,  5.18158865], dtype=float32))
('Action ', array([ 7.20390558,  6.91342688], dtype=float32))
('Action ', array([ 3.00253558, -0.97574097], dtype=float32))
Episode: 1869/5000, score: 10
('Action ', array([ 8.45207977,  8.92753696], dtype=float32))
('Action ', array([ 7.57128859,  8.62867451], dtype=float32))
('Action ', array([ 8.45207977,  8.92753696], dtype=float32))
('Action ', array([ 7.48788881,  8.55431557], dtype=float32))
('Action ', array([ 7.89355183,  8.18471

('Action ', array([ 8.72530365,  8.93639565], dtype=float32))
('Action ', array([ 6.92673254,  7.97659779], dtype=float32))
('Action ', array([ 9.04951668,  9.10094166], dtype=float32))
('Action ', array([ 6.9298501 ,  7.97087669], dtype=float32))
('Action ', array([ 6.49768686,  6.87333107], dtype=float32))
('Action ', array([ 4.00275373,  1.00526524], dtype=float32))
('Action ', array([ 6.44374037,  6.7537365 ], dtype=float32))
('Action ', array([ 6.51073217,  6.73361778], dtype=float32))
Episode: 1881/5000, score: 9
('Action ', array([ 8.70069313,  8.94593716], dtype=float32))
('Action ', array([ 7.12015772,  8.61125374], dtype=float32))
('Action ', array([ 9.20682907,  8.91432476], dtype=float32))
('Action ', array([ 7.12015772,  8.61125374], dtype=float32))
('Action ', array([ 9.20682907,  8.91432476], dtype=float32))
('Action ', array([ 7.04696989,  8.54379749], dtype=float32))
('Action ', array([ 9.20682907,  8.91432476], dtype=float32))
('Action ', array([ 7.68395472,  9.200307

('Action ', array([ 5.86603165,  5.05596399], dtype=float32))
('Action ', array([ 4.64534283,  5.60610151], dtype=float32))
('Action ', array([ 7.37387657,  6.79705191], dtype=float32))
('Action ', array([ 5.24143314,  4.71633482], dtype=float32))
('Action ', array([ 7.46411896,  7.31304216], dtype=float32))
('Action ', array([ 4.44766045, -4.90257692], dtype=float32))
('Action ', array([ 8.03130817,  8.35366058], dtype=float32))
('Action ', array([ 3.3871305 , -2.10185289], dtype=float32))
('Action ', array([ 6.85969543,  7.43801069], dtype=float32))
('Action ', array([ 3.77752852, -2.19102907], dtype=float32))
('Action ', array([ 6.21281719,  6.34979773], dtype=float32))
('Action ', array([ 5.64344692, -2.539536  ], dtype=float32))
('Action ', array([ 8.64462852,  0.47510853], dtype=float32))
('Action ', array([ 5.90355778,  5.9051919 ], dtype=float32))
('Action ', array([-0.8691752 , -2.22335482], dtype=float32))
('Action ', array([ 6.21375847,  6.1266818 ], dtype=float32))
('Action

('Action ', array([ 3.97617626,  6.83287096], dtype=float32))
('Action ', array([ 7.28807354,  6.85511923], dtype=float32))
('Action ', array([ 4.14545727,  6.8201375 ], dtype=float32))
('Action ', array([ 7.58020115,  7.51576376], dtype=float32))
('Action ', array([ 2.13449574,  1.24424398], dtype=float32))
('Action ', array([ 7.83220577,  7.74793196], dtype=float32))
('Action ', array([ 2.22245121,  1.39767873], dtype=float32))
('Action ', array([ 7.85238171,  7.74601603], dtype=float32))
('Action ', array([-0.15550721,  2.72898507], dtype=float32))
('Action ', array([ 7.9338789 ,  7.73352766], dtype=float32))
('Action ', array([ 8.22200871,  8.10089874], dtype=float32))
('Action ', array([ 0.45392311,  3.31408334], dtype=float32))
('Action ', array([ 8.41374111,  8.21756458], dtype=float32))
('Action ', array([-0.56182587,  5.44846392], dtype=float32))
('Action ', array([ 8.34018993,  8.55149651], dtype=float32))
('Action ', array([ 1.96323478,  3.04320931], dtype=float32))
('Action

('Action ', array([ 8.066329  ,  5.64951801], dtype=float32))
('Action ', array([ 6.78269291,  7.50044727], dtype=float32))
('Action ', array([ 8.2457056 ,  5.29887486], dtype=float32))
('Action ', array([ 6.75368118,  7.53813076], dtype=float32))
('Action ', array([ 8.53268433,  4.85447407], dtype=float32))
('Action ', array([ 6.62450504,  7.45327759], dtype=float32))
('Action ', array([ 8.0081625 ,  4.42629337], dtype=float32))
('Action ', array([ 6.28940773,  6.88702774], dtype=float32))
('Action ', array([ 7.11993694,  2.95482755], dtype=float32))
('Action ', array([ 5.93354893,  6.70655441], dtype=float32))
('Action ', array([ 9.26400757,  6.41838169], dtype=float32))
('Action ', array([ 6.21984768,  7.41160393], dtype=float32))
('Action ', array([ 9.27291965,  6.45283222], dtype=float32))
('Action ', array([ 6.09797096,  7.45342159], dtype=float32))
('Action ', array([ 6.2684803 ,  4.96273136], dtype=float32))
('Action ', array([ 5.59974861,  6.92624378], dtype=float32))
('Action

('Action ', array([ 8.60217285,  8.87957859], dtype=float32))
('Action ', array([ 6.07304287,  7.01603794], dtype=float32))
('Action ', array([ 9.19240665,  8.98153496], dtype=float32))
('Action ', array([ 6.07304287,  7.01603794], dtype=float32))
('Action ', array([ 9.19240665,  8.98153496], dtype=float32))
('Action ', array([ 6.02119732,  6.98547077], dtype=float32))
('Action ', array([ 9.19240665,  8.98153496], dtype=float32))
('Action ', array([ 6.08944321,  7.01873302], dtype=float32))
('Action ', array([ 9.09057617,  9.00446796], dtype=float32))
('Action ', array([ 6.08944321,  7.01873302], dtype=float32))
('Action ', array([ 9.09057617,  9.00446796], dtype=float32))
('Action ', array([ 5.68210125,  5.78910828], dtype=float32))
('Action ', array([ 7.27651596,  7.74135399], dtype=float32))
('Action ', array([ 5.25551414,  5.43990612], dtype=float32))
('Action ', array([ 5.20670128,  4.25829506], dtype=float32))
('Action ', array([ 3.89913726,  3.96302223], dtype=float32))
('Action

('Action ', array([ 8.45835972,  8.42238617], dtype=float32))
('Action ', array([ 6.04070187,  7.20995855], dtype=float32))
('Action ', array([ 8.31095219,  7.11545229], dtype=float32))
('Action ', array([ 6.04070187,  7.20995855], dtype=float32))
('Action ', array([ 8.31095219,  7.11545229], dtype=float32))
('Action ', array([ 6.04070187,  7.20995855], dtype=float32))
('Action ', array([ 8.31095219,  7.11545229], dtype=float32))
('Action ', array([ 6.04070187,  7.20995855], dtype=float32))
('Action ', array([ 8.31095219,  7.11545229], dtype=float32))
('Action ', array([ 6.04070187,  7.20995855], dtype=float32))
('Action ', array([ 8.31095219,  7.11545229], dtype=float32))
('Action ', array([ 6.04070187,  7.20995855], dtype=float32))
('Action ', array([ 8.31095219,  7.11545229], dtype=float32))
('Action ', array([ 6.04070187,  7.20995855], dtype=float32))
('Action ', array([ 8.69310379,  8.32459164], dtype=float32))
('Action ', array([ 6.04070187,  7.20995855], dtype=float32))
('Action

('Action ', array([ 8.33807564,  8.31615448], dtype=float32))
('Action ', array([ 6.04342318,  7.31927919], dtype=float32))
('Action ', array([ 8.87538815,  8.49955845], dtype=float32))
('Action ', array([ 6.04342318,  7.31927919], dtype=float32))
('Action ', array([ 8.87538815,  8.49955845], dtype=float32))
('Action ', array([ 6.04342318,  7.31927919], dtype=float32))
('Action ', array([ 8.46486092,  8.68726635], dtype=float32))
('Action ', array([ 6.02695322,  7.31582022], dtype=float32))
('Action ', array([ 8.52121162,  8.64829445], dtype=float32))
('Action ', array([ 6.25639677,  7.63835096], dtype=float32))
('Action ', array([ 8.78441143,  8.78530979], dtype=float32))
('Action ', array([ 5.87815619,  5.82195616], dtype=float32))
('Action ', array([ 5.97951174,  5.64985228], dtype=float32))
('Action ', array([ 4.4006772 ,  4.37764502], dtype=float32))
('Action ', array([ 7.34596157,  7.52382231], dtype=float32))
('Action ', array([ 4.37802839,  4.33544874], dtype=float32))
('Action

('Action ', array([ 6.35583019,  7.92624474], dtype=float32))
('Action ', array([ 5.28218174,  6.58693409], dtype=float32))
('Action ', array([ 7.0836134 ,  8.51675892], dtype=float32))
('Action ', array([ 7.55323124,  1.98419297], dtype=float32))
('Action ', array([ 7.43004799,  8.75055313], dtype=float32))
('Action ', array([ 5.95531559,  2.75981236], dtype=float32))
('Action ', array([ 6.98659897,  7.10618782], dtype=float32))
('Action ', array([ 4.45748997, -0.57514083], dtype=float32))
('Action ', array([ 7.17857933,  7.38147926], dtype=float32))
('Action ', array([ 3.58410382,  2.72648716], dtype=float32))
('Action ', array([ 3.85562634,  5.47029209], dtype=float32))
('Action ', array([ 6.88330841,  7.38258839], dtype=float32))
('Action ', array([ 2.21967244,  8.37687778], dtype=float32))
('Action ', array([ 8.5737524 ,  8.67874146], dtype=float32))
('Action ', array([ 6.80293941,  0.64185441], dtype=float32))
('Action ', array([ 8.53653622,  9.11227894], dtype=float32))
('Action

('Action ', array([ 8.27429771,  8.34711838], dtype=float32))
('Action ', array([ 6.74834442,  8.18765926], dtype=float32))
('Action ', array([ 8.82030487,  8.62293243], dtype=float32))
('Action ', array([ 6.79511452,  8.25352287], dtype=float32))
('Action ', array([ 8.82030487,  8.62293243], dtype=float32))
('Action ', array([ 6.79481792,  8.2554512 ], dtype=float32))
('Action ', array([ 8.55654907,  9.32300186], dtype=float32))
('Action ', array([ 8.59992409,  8.40975761], dtype=float32))
('Action ', array([ 7.22154331,  8.63017178], dtype=float32))
('Action ', array([ 6.96410179,  6.40998459], dtype=float32))
('Action ', array([ 7.07735634,  8.35698891], dtype=float32))
('Action ', array([ 6.39664745,  6.44654465], dtype=float32))
('Action ', array([ 6.89493084,  8.2554903 ], dtype=float32))
('Action ', array([ 3.71677971,  3.7631495 ], dtype=float32))
('Action ', array([ 6.26415443,  7.0024929 ], dtype=float32))
Episode: 1935/5000, score: 15
('Action ', array([ 8.28477859,  8.39914

('Action ', array([ 6.58305311,  8.81014442], dtype=float32))
('Action ', array([ 8.79478264,  7.1946516 ], dtype=float32))
('Action ', array([ 6.58305311,  8.81014442], dtype=float32))
('Action ', array([ 8.77365208,  7.20282745], dtype=float32))
('Action ', array([ 6.65247393,  8.74084663], dtype=float32))
('Action ', array([ 8.66298389,  7.01430798], dtype=float32))
('Action ', array([ 2.58589983,  7.48706627], dtype=float32))
('Action ', array([ 8.63175774,  6.81541538], dtype=float32))
('Action ', array([ 8.20955372,  7.49082756], dtype=float32))
Episode: 1944/5000, score: 37
('Action ', array([ 8.40734482,  8.30287457], dtype=float32))
('Action ', array([ 8.40734482,  8.30287457], dtype=float32))
('Action ', array([ 7.12510824,  8.51646614], dtype=float32))
('Action ', array([ 8.19935799,  7.55157185], dtype=float32))
('Action ', array([ 7.12510824,  8.51646614], dtype=float32))
('Action ', array([ 8.19935799,  7.55157185], dtype=float32))
('Action ', array([ 7.12510824,  8.51646

('Action ', array([ 8.55055904,  8.31760216], dtype=float32))
('Action ', array([ 6.97578621,  8.01520252], dtype=float32))
('Action ', array([ 9.00729561,  7.63179493], dtype=float32))
('Action ', array([ 6.97578621,  8.01520252], dtype=float32))
('Action ', array([ 9.00729561,  7.63179493], dtype=float32))
('Action ', array([ 6.97578621,  8.01520252], dtype=float32))
('Action ', array([ 9.00729561,  7.63179493], dtype=float32))
('Action ', array([ 6.97578621,  8.01520252], dtype=float32))
('Action ', array([ 9.00729561,  7.63179493], dtype=float32))
('Action ', array([ 6.97578621,  8.01520252], dtype=float32))
('Action ', array([ 8.94228935,  7.75942993], dtype=float32))
('Action ', array([ 6.97578621,  8.01520252], dtype=float32))
('Action ', array([ 8.94228935,  7.75942993], dtype=float32))
('Action ', array([ 6.97578621,  8.01520252], dtype=float32))
('Action ', array([ 8.94228935,  7.75942993], dtype=float32))
('Action ', array([ 6.97578621,  8.01520252], dtype=float32))
('Action

('Action ', array([ 5.98718929,  5.2726078 ], dtype=float32))
('Action ', array([ 7.50442505,  7.51337814], dtype=float32))
('Action ', array([ 5.50414562,  1.68064296], dtype=float32))
('Action ', array([ 8.07295799,  7.71003342], dtype=float32))
('Action ', array([ 5.40965557,  3.12169838], dtype=float32))
('Action ', array([ 8.59942532,  7.98608208], dtype=float32))
('Action ', array([ 1.21547818,  1.96152294], dtype=float32))
('Action ', array([ 8.6510725 ,  7.79570007], dtype=float32))
('Action ', array([ 1.40139699,  1.03701198], dtype=float32))
('Action ', array([ 8.64734936,  7.86166191], dtype=float32))
('Action ', array([ 0.7338497 , -1.48246205], dtype=float32))
('Action ', array([ 8.73040104,  7.87672615], dtype=float32))
('Action ', array([ 0.7338497 , -1.48246205], dtype=float32))
('Action ', array([ 8.84842777,  8.16219139], dtype=float32))
('Action ', array([-0.75028688, -3.2318821 ], dtype=float32))
('Action ', array([ 9.29572964,  8.34441662], dtype=float32))
('Action

('Action ', array([ 4.48883581,  5.32647753], dtype=float32))
('Action ', array([ 5.77977705,  6.15249681], dtype=float32))
('Action ', array([ 0.53191531,  2.43595576], dtype=float32))
Episode: 1959/5000, score: 34
('Action ', array([ 8.63661766,  8.4763813 ], dtype=float32))
('Action ', array([ 6.85654783,  8.06453323], dtype=float32))
('Action ', array([ 6.87150621,  8.08257675], dtype=float32))
('Action ', array([ 8.06745243,  8.43545532], dtype=float32))
('Action ', array([ 6.86550283,  8.06598473], dtype=float32))
('Action ', array([ 6.83278608,  9.28989506], dtype=float32))
('Action ', array([ 6.4504714 ,  6.17333078], dtype=float32))
('Action ', array([ 5.99789572,  5.900949  ], dtype=float32))
('Action ', array([ 6.37314081,  6.16794729], dtype=float32))
('Action ', array([ 6.05443811,  5.77906179], dtype=float32))
('Action ', array([ 6.35026693,  6.17524576], dtype=float32))
('Action ', array([ 5.64077139,  6.39898825], dtype=float32))
('Action ', array([ 6.35026693,  6.17524

('Action ', array([ 8.67596245,  8.50196552], dtype=float32))
('Action ', array([ 6.87096786,  8.2369585 ], dtype=float32))
('Action ', array([ 8.67596245,  8.50196552], dtype=float32))
('Action ', array([ 6.87096786,  8.2369585 ], dtype=float32))
('Action ', array([ 9.19609642,  8.58678246], dtype=float32))
('Action ', array([ 6.87096786,  8.2369585 ], dtype=float32))
('Action ', array([ 9.03897572,  8.37963486], dtype=float32))
('Action ', array([ 6.87096786,  8.2369585 ], dtype=float32))
('Action ', array([ 8.83133507,  9.56600952], dtype=float32))
('Action ', array([ 6.87096786,  8.2369585 ], dtype=float32))
('Action ', array([ 9.03897572,  8.37963486], dtype=float32))
('Action ', array([ 6.88613224,  8.25078201], dtype=float32))
('Action ', array([ 9.03897572,  8.37963486], dtype=float32))
('Action ', array([ 6.97630405,  8.1859026 ], dtype=float32))
('Action ', array([ 9.0377636,  8.4651165], dtype=float32))
('Action ', array([ 6.98125839,  8.17560482], dtype=float32))
('Action '

('Action ', array([ 7.53184938,  9.2752037 ], dtype=float32))
('Action ', array([ 9.54135418,  7.64164972], dtype=float32))
('Action ', array([ 7.51124907,  9.36249352], dtype=float32))
('Action ', array([ 9.19748688,  4.94545603], dtype=float32))
('Action ', array([ 7.51124907,  9.36249352], dtype=float32))
('Action ', array([ 2.71580672,  2.69247317], dtype=float32))
('Action ', array([ 7.68513441,  9.54012966], dtype=float32))
('Action ', array([ 3.9711988 ,  2.63279223], dtype=float32))
('Action ', array([ 4.07111311,  4.58167505], dtype=float32))
('Action ', array([ 7.8555789 ,  9.99777412], dtype=float32))
('Action ', array([ 4.78677225,  9.81022167], dtype=float32))
('Action ', array([ 7.60531378,  9.23790073], dtype=float32))
('Action ', array([ 8.68561554,  6.81910944], dtype=float32))
Episode: 1972/5000, score: 44
('Action ', array([ 8.75949574,  8.5106039 ], dtype=float32))
('Action ', array([ 7.00361204,  8.44996262], dtype=float32))
('Action ', array([ 8.75949574,  8.51060

('Action ', array([ 8.85280037,  8.57550526], dtype=float32))
('Action ', array([ 6.98280525,  8.38556767], dtype=float32))
('Action ', array([ 9.53149223,  8.74183464], dtype=float32))
('Action ', array([ 6.98280525,  8.38556767], dtype=float32))
('Action ', array([ 9.41403961,  8.19069958], dtype=float32))
('Action ', array([ 6.98280525,  8.38556767], dtype=float32))
('Action ', array([ 9.41403961,  8.19069958], dtype=float32))
('Action ', array([ 6.9863739 ,  8.38607216], dtype=float32))
('Action ', array([ 9.41403961,  8.19069958], dtype=float32))
('Action ', array([ 6.9863739 ,  8.38607216], dtype=float32))
('Action ', array([ 9.41403961,  8.19069958], dtype=float32))
('Action ', array([ 6.9863739 ,  8.38607216], dtype=float32))
('Action ', array([ 9.74471951,  8.24620342], dtype=float32))
('Action ', array([ 6.9863739 ,  8.38607216], dtype=float32))
('Action ', array([ 9.33452129,  8.35300922], dtype=float32))
('Action ', array([ 7.46585846,  9.27824783], dtype=float32))
('Action

('Action ', array([ 8.73717117,  8.69321728], dtype=float32))
('Action ', array([ 6.91983986,  8.26100254], dtype=float32))
('Action ', array([ 8.57316875,  8.0896492 ], dtype=float32))
('Action ', array([ 6.92741585,  8.26470661], dtype=float32))
('Action ', array([ 8.67245102,  8.14739704], dtype=float32))
('Action ', array([ 6.92741585,  8.26470661], dtype=float32))
('Action ', array([ 6.92741585,  8.26470661], dtype=float32))
('Action ', array([ 8.67245102,  8.14739704], dtype=float32))
('Action ', array([ 6.90120029,  8.26651287], dtype=float32))
('Action ', array([ 8.76420498,  8.17635536], dtype=float32))
('Action ', array([ 6.87899399,  8.26263523], dtype=float32))
('Action ', array([ 8.76420498,  8.17635536], dtype=float32))
('Action ', array([ 6.80614281,  8.22543812], dtype=float32))
('Action ', array([ 8.72999859,  8.91218185], dtype=float32))
('Action ', array([ 7.16840172,  8.32189751], dtype=float32))
('Action ', array([ 7.76286411,  8.55452728], dtype=float32))
('Action

('Action ', array([ 8.8165884 ,  8.62404537], dtype=float32))
('Action ', array([ 7.01164532,  8.36786652], dtype=float32))
('Action ', array([ 8.8165884 ,  8.62404537], dtype=float32))
('Action ', array([ 7.01164532,  8.36786652], dtype=float32))
('Action ', array([ 9.56400585,  8.63510895], dtype=float32))
('Action ', array([ 7.01164532,  8.36786652], dtype=float32))
('Action ', array([ 10.03688145,   9.20389557], dtype=float32))
('Action ', array([ 7.01164532,  8.36786652], dtype=float32))
('Action ', array([ 10.03688145,   9.20389557], dtype=float32))
('Action ', array([ 7.01164532,  8.36786652], dtype=float32))
('Action ', array([ 9.05802441,  8.08405781], dtype=float32))
('Action ', array([ 6.99692249,  8.38477898], dtype=float32))
('Action ', array([ 7.38491392,  7.03825426], dtype=float32))
('Action ', array([ 6.99692249,  8.38477898], dtype=float32))
('Action ', array([ 7.02397537,  6.37032175], dtype=float32))
('Action ', array([ 6.99692249,  8.38477898], dtype=float32))
('Ac

('Action ', array([ 8.73014545,  8.81611729], dtype=float32))
('Action ', array([ 7.14047194,  8.3856411 ], dtype=float32))
('Action ', array([ 8.55912876,  7.41033649], dtype=float32))
('Action ', array([ 7.02572489,  8.32229042], dtype=float32))
('Action ', array([ 7.77774763,  8.22586823], dtype=float32))
('Action ', array([ 6.60701799,  7.94759846], dtype=float32))
('Action ', array([ 7.73420572,  5.9142189 ], dtype=float32))
('Action ', array([ 5.20294714,  6.12348652], dtype=float32))
('Action ', array([ 6.28177595,  4.14600563], dtype=float32))
('Action ', array([ 5.12855577,  6.02213478], dtype=float32))
('Action ', array([ 6.1889205 ,  3.72236466], dtype=float32))
Episode: 1992/5000, score: 10
('Action ', array([ 8.65393257,  8.89985657], dtype=float32))
('Action ', array([ 7.21539211,  8.46111774], dtype=float32))
('Action ', array([ 8.65393257,  8.89985657], dtype=float32))
('Action ', array([ 7.20105076,  8.44080067], dtype=float32))
('Action ', array([ 9.2451067,  9.109154

('Action ', array([ 4.70629501,  4.24853373], dtype=float32))
Episode: 2000/5000, score: 31
('Action ', array([ 8.66981602,  8.78903198], dtype=float32))
('Action ', array([ 6.91214514,  7.61207819], dtype=float32))
('Action ', array([ 9.19526577,  8.91736794], dtype=float32))
('Action ', array([ 6.93821669,  7.63430452], dtype=float32))
('Action ', array([ 9.18660355,  8.42859936], dtype=float32))
('Action ', array([ 6.41784048,  6.21959162], dtype=float32))
('Action ', array([ 7.17804003,  4.88221979], dtype=float32))
('Action ', array([ 6.41784048,  6.21959162], dtype=float32))
('Action ', array([ 7.77025461,  7.94228792], dtype=float32))
('Action ', array([ 6.94936419,  7.62467241], dtype=float32))
('Action ', array([ 7.84490061,  7.91948938], dtype=float32))
('Action ', array([ 6.92673349,  7.63141203], dtype=float32))
('Action ', array([ 8.52933884,  7.98827791], dtype=float32))
('Action ', array([ 6.45525885,  6.208673  ], dtype=float32))
('Action ', array([ 8.1108036 ,  7.48497

('Action ', array([ 10.10647583,  10.51989079], dtype=float32))
('Action ', array([ 7.07833481,  7.97040653], dtype=float32))
('Action ', array([ 8.76115036,  8.35032368], dtype=float32))
('Action ', array([ 8.18264008,  9.1837244 ], dtype=float32))
('Action ', array([ 9.01316547,  9.26783848], dtype=float32))
('Action ', array([ 8.50029564,  9.32208729], dtype=float32))
('Action ', array([ 9.37082767,  9.89883137], dtype=float32))
('Action ', array([ 8.37178612,  8.90938187], dtype=float32))
('Action ', array([ 9.4135046 ,  9.87501621], dtype=float32))
('Action ', array([ 8.00456905,  7.26916599], dtype=float32))
('Action ', array([ 5.38862514,  6.32143116], dtype=float32))
('Action ', array([ 8.00238132,  7.17665291], dtype=float32))
('Action ', array([ 0.41850942,  0.97653294], dtype=float32))
Episode: 2006/5000, score: 40
('Action ', array([ 8.59548092,  8.96381474], dtype=float32))
('Action ', array([ 6.89022923,  7.55138731], dtype=float32))
('Action ', array([ 8.59548092,  8.963

('Action ', array([ 8.54238415,  8.87611961], dtype=float32))
('Action ', array([ 7.03659725,  7.91402006], dtype=float32))
('Action ', array([ 8.54238415,  8.87611961], dtype=float32))
('Action ', array([ 7.06112576,  7.92933321], dtype=float32))
('Action ', array([ 9.29865932,  8.26169205], dtype=float32))
('Action ', array([ 6.7256813 ,  6.10357618], dtype=float32))
('Action ', array([ 5.24211693,  0.9525305 ], dtype=float32))
('Action ', array([ 5.16257954,  4.43864107], dtype=float32))
('Action ', array([ 5.72256804,  2.10721254], dtype=float32))
('Action ', array([ 5.17289734,  4.44866228], dtype=float32))
('Action ', array([ 5.78698635,  2.17639589], dtype=float32))
('Action ', array([ 7.01785469,  6.12801027], dtype=float32))
('Action ', array([ 4.82018757,  2.72793245], dtype=float32))
('Action ', array([ 6.88325119,  6.00698328], dtype=float32))
('Action ', array([ 4.10693073,  1.07116377], dtype=float32))
('Action ', array([ 6.70494175,  5.95825243], dtype=float32))
('Action

('Action ', array([ 8.58801746,  9.02873135], dtype=float32))
('Action ', array([ 7.87410736,  8.99022388], dtype=float32))
('Action ', array([ 9.17831802,  9.67535877], dtype=float32))
('Action ', array([ 7.86266041,  9.06424809], dtype=float32))
('Action ', array([ 8.70419216,  8.8676424 ], dtype=float32))
('Action ', array([ 7.80650711,  8.85044956], dtype=float32))
('Action ', array([ 6.24923897,  7.07035542], dtype=float32))
('Action ', array([ 7.34370327,  7.40581322], dtype=float32))
('Action ', array([ 0.50755763,  2.33578205], dtype=float32))
Episode: 2021/5000, score: 8
('Action ', array([ 8.59010506,  9.05898762], dtype=float32))
('Action ', array([ 7.1703043 ,  8.05355549], dtype=float32))
('Action ', array([ 8.59010506,  9.05898762], dtype=float32))
('Action ', array([ 7.16687679,  8.0456934 ], dtype=float32))
('Action ', array([ 9.05777645,  8.49908066], dtype=float32))
('Action ', array([ 4.30874062,  2.34211969], dtype=float32))
('Action ', array([ 5.04709053,  5.519553

('Action ', array([ 8.67618561,  9.14119244], dtype=float32))
('Action ', array([ 7.53736162,  8.20054722], dtype=float32))
('Action ', array([ 9.10125923,  7.88514423], dtype=float32))
('Action ', array([ 9.10125923,  7.88514423], dtype=float32))
('Action ', array([ 7.60066366,  8.23274136], dtype=float32))
('Action ', array([ 9.1126585 ,  7.94045544], dtype=float32))
('Action ', array([ 7.59609556,  8.17440987], dtype=float32))
('Action ', array([ 9.1126585 ,  7.94045544], dtype=float32))
('Action ', array([ 8.49298286,  5.42689037], dtype=float32))
('Action ', array([ 7.11350298,  6.78479195], dtype=float32))
('Action ', array([ 10.28436661,   7.54035091], dtype=float32))
('Action ', array([ 7.60909319,  8.19942188], dtype=float32))
('Action ', array([ 9.50886917,  7.69948864], dtype=float32))
('Action ', array([ 7.55732584,  8.22222614], dtype=float32))
('Action ', array([ 10.63515663,   7.72468472], dtype=float32))
('Action ', array([ 10.79326439,   8.66092968], dtype=float32))
('

('Action ', array([ 8.66988182,  8.9835577 ], dtype=float32))
('Action ', array([ 7.62094975,  8.3584938 ], dtype=float32))
('Action ', array([ 8.91496658,  9.0341711 ], dtype=float32))
('Action ', array([ 7.5982542 ,  8.34807682], dtype=float32))
('Action ', array([ 9.29069901,  9.21968555], dtype=float32))
('Action ', array([ 7.09931278,  6.95004416], dtype=float32))
('Action ', array([ 7.29530859,  4.83976698], dtype=float32))
('Action ', array([ 6.91129208,  6.81176615], dtype=float32))
('Action ', array([ 6.72443962,  2.7084918 ], dtype=float32))
('Action ', array([ 7.16302872,  6.67117548], dtype=float32))
('Action ', array([ 7.32566643,  4.88242674], dtype=float32))
('Action ', array([ 7.5854187 ,  6.65980196], dtype=float32))
('Action ', array([ 9.20580673,  7.98125792], dtype=float32))
('Action ', array([ 7.99047565,  7.85827589], dtype=float32))
('Action ', array([ 8.94421291,  8.17852783], dtype=float32))
('Action ', array([ 8.26707935,  8.39715862], dtype=float32))
('Action

('Action ', array([ 8.78551388,  9.0308876 ], dtype=float32))
('Action ', array([ 7.60849953,  9.09147453], dtype=float32))
('Action ', array([ 8.78551388,  9.0308876 ], dtype=float32))
('Action ', array([ 7.60727787,  9.08042908], dtype=float32))
('Action ', array([ 9.38097382,  8.89232635], dtype=float32))
('Action ', array([ 7.57135201,  9.0354414 ], dtype=float32))
('Action ', array([ 8.89994717,  9.72029495], dtype=float32))
('Action ', array([ 6.40325928,  7.43092775], dtype=float32))
('Action ', array([ 8.54564953,  8.41976357], dtype=float32))
('Action ', array([ 6.21371651,  7.18944883], dtype=float32))
('Action ', array([ 5.70606709,  4.20890188], dtype=float32))
('Action ', array([ 4.42150116,  5.11622286], dtype=float32))
Episode: 2047/5000, score: 11
('Action ', array([ 8.79665947,  9.04137421], dtype=float32))
('Action ', array([ 7.70403385,  8.68253613], dtype=float32))
('Action ', array([ 8.79665947,  9.04137421], dtype=float32))
('Action ', array([ 7.69679356,  8.67788

('Action ', array([ 8.9908514 ,  8.89133835], dtype=float32))
('Action ', array([ 7.56044245,  9.02395439], dtype=float32))
('Action ', array([ 9.77305794,  8.38148308], dtype=float32))
('Action ', array([ 7.56044245,  9.02395439], dtype=float32))
('Action ', array([ 10.17948818,   8.04991436], dtype=float32))
('Action ', array([ 7.53214407,  9.05599213], dtype=float32))
('Action ', array([ 10.17948818,   8.04991436], dtype=float32))
('Action ', array([ 7.53420115,  9.08763695], dtype=float32))
('Action ', array([ 9.79221725,  7.62393236], dtype=float32))
('Action ', array([ 7.53420115,  9.08763695], dtype=float32))
('Action ', array([ 10.02639961,   6.85713243], dtype=float32))
('Action ', array([ 7.41211796,  5.29508829], dtype=float32))
('Action ', array([ 7.27654314,  8.60525894], dtype=float32))
('Action ', array([ 4.41544008,  1.08936918], dtype=float32))
('Action ', array([ 7.17819452,  8.50402069], dtype=float32))
('Action ', array([ 3.14524603, -0.86352688], dtype=float32))
Ep

('Action ', array([ 9.07345295,  9.04703522], dtype=float32))
('Action ', array([ 7.93917799,  9.52320004], dtype=float32))
('Action ', array([ 9.52779293,  8.62918568], dtype=float32))
('Action ', array([ 7.93917799,  9.52320004], dtype=float32))
('Action ', array([ 7.66375494,  7.73023558], dtype=float32))
('Action ', array([ 7.92732763,  9.53549957], dtype=float32))
('Action ', array([ 6.63454103,  7.08648252], dtype=float32))
('Action ', array([ 7.99640417,  9.43586731], dtype=float32))
('Action ', array([ 7.67527914,  7.58805799], dtype=float32))
('Action ', array([ 7.97390509,  9.33119106], dtype=float32))
('Action ', array([ 7.71306181,  7.57108641], dtype=float32))
('Action ', array([ 7.93017817,  8.16203594], dtype=float32))
('Action ', array([ 7.02069426,  4.54411268], dtype=float32))
('Action ', array([ 6.64181471,  6.73691034], dtype=float32))
('Action ', array([ 4.55991697,  3.21533155], dtype=float32))
('Action ', array([ 6.47591925,  6.56552076], dtype=float32))
Episode:

('Action ', array([ 9.23272133,  9.02196312], dtype=float32))
('Action ', array([ 7.31285524,  8.29811478], dtype=float32))
('Action ', array([ 9.23272133,  9.02196312], dtype=float32))
('Action ', array([ 7.31285524,  8.29811478], dtype=float32))
('Action ', array([ 9.23272133,  9.02196312], dtype=float32))
('Action ', array([ 7.31285524,  8.29811478], dtype=float32))
('Action ', array([ 9.23272133,  9.02196312], dtype=float32))
('Action ', array([ 7.31285524,  8.29811478], dtype=float32))
('Action ', array([ 9.23272133,  9.02196312], dtype=float32))
('Action ', array([ 7.31285524,  8.29811478], dtype=float32))
('Action ', array([ 9.5686512 ,  8.33072662], dtype=float32))
('Action ', array([ 7.31285524,  8.29811478], dtype=float32))
('Action ', array([ 9.5686512 ,  8.33072662], dtype=float32))
('Action ', array([ 7.31285524,  8.29811478], dtype=float32))
('Action ', array([ 9.7129631 ,  8.73695564], dtype=float32))
('Action ', array([ 7.38460875,  8.32830048], dtype=float32))
('Action

('Action ', array([ 9.16449928,  9.10244083], dtype=float32))
('Action ', array([ 7.39422321,  8.52324867], dtype=float32))
('Action ', array([ 9.16449928,  9.10244083], dtype=float32))
('Action ', array([ 7.39422321,  8.52324867], dtype=float32))
('Action ', array([ 9.16449928,  9.10244083], dtype=float32))
('Action ', array([ 7.39422321,  8.52324867], dtype=float32))
('Action ', array([ 9.78992176,  8.8884325 ], dtype=float32))
('Action ', array([ 7.39422321,  8.52324867], dtype=float32))
('Action ', array([ 10.19825268,   8.93887234], dtype=float32))
('Action ', array([ 7.39422321,  8.52324867], dtype=float32))
('Action ', array([ 9.4189949 ,  8.56578922], dtype=float32))
('Action ', array([ 7.16463852,  8.18480873], dtype=float32))
('Action ', array([ 7.16484928,  8.1869278 ], dtype=float32))
('Action ', array([ 7.72825813,  8.33567619], dtype=float32))
('Action ', array([ 9.46152401,  7.76929045], dtype=float32))
('Action ', array([ 7.72825813,  8.33567619], dtype=float32))
('Acti

('Action ', array([ 8.94056606,  9.22901726], dtype=float32))
('Action ', array([ 7.02169657,  7.93480635], dtype=float32))
('Action ', array([ 8.94056606,  9.22901726], dtype=float32))
('Action ', array([ 6.9805131,  7.9129138], dtype=float32))
('Action ', array([ 9.18732643,  9.12850666], dtype=float32))
('Action ', array([ 6.42900038,  6.45245028], dtype=float32))
('Action ', array([ 6.85747623,  6.13566542], dtype=float32))
('Action ', array([ 4.55795431,  4.12160063], dtype=float32))
('Action ', array([ 4.88552284,  5.28872061], dtype=float32))
('Action ', array([ 4.52666235,  4.0922904 ], dtype=float32))
('Action ', array([ 6.07912159,  4.61802435], dtype=float32))
('Action ', array([ 4.44861555,  4.05341291], dtype=float32))
('Action ', array([ 5.40819311,  3.6571629 ], dtype=float32))
('Action ', array([ 4.47446299,  4.11014891], dtype=float32))
('Action ', array([ 6.03806257,  4.08087301], dtype=float32))
('Action ', array([ 4.85961008,  4.35206938], dtype=float32))
('Action '

('Action ', array([ 7.19639301,  8.35404587], dtype=float32))
('Action ', array([ 9.09487915,  9.21954441], dtype=float32))
('Action ', array([ 8.80208969,  9.20078754], dtype=float32))
('Action ', array([ 7.19639301,  8.35404587], dtype=float32))
('Action ', array([ 8.80208969,  9.20078754], dtype=float32))
('Action ', array([ 7.11228561,  8.27108955], dtype=float32))
('Action ', array([  9.9309597 ,  10.07522488], dtype=float32))
('Action ', array([ 6.66470146,  7.85217524], dtype=float32))
('Action ', array([ 9.00697708,  8.10712528], dtype=float32))
('Action ', array([ 6.4753437 ,  7.63665724], dtype=float32))
('Action ', array([ 4.38832474,  1.79080725], dtype=float32))
('Action ', array([ 6.15552616,  6.5704236 ], dtype=float32))
Episode: 2087/5000, score: 13
('Action ', array([ 8.77085209,  9.18663788], dtype=float32))
('Action ', array([ 6.89434147,  7.74128437], dtype=float32))
('Action ', array([ 9.42071247,  9.54482746], dtype=float32))
('Action ', array([ 6.82154751,  7.710

('Action ', array([ 8.62856293,  9.00295734], dtype=float32))
('Action ', array([ 8.65908527,  7.74860239], dtype=float32))
('Action ', array([ 6.83911228,  7.87002707], dtype=float32))
('Action ', array([ 8.65548992,  7.80538607], dtype=float32))
('Action ', array([ 6.83911228,  7.87002707], dtype=float32))
('Action ', array([ 9.18059063,  9.4047699 ], dtype=float32))
('Action ', array([ 6.83911228,  7.87002707], dtype=float32))
('Action ', array([ 8.65548992,  7.80538607], dtype=float32))
('Action ', array([ 6.85289097,  7.89056826], dtype=float32))
('Action ', array([ 8.65548992,  7.80538607], dtype=float32))
('Action ', array([ 6.96313286,  8.03140926], dtype=float32))
('Action ', array([ 8.65548992,  7.80538607], dtype=float32))
('Action ', array([ 6.87884808,  7.95599985], dtype=float32))
('Action ', array([ 8.18893337,  7.19497919], dtype=float32))
('Action ', array([ 8.13409138,  8.71432781], dtype=float32))
('Action ', array([ 8.71247578,  6.66421747], dtype=float32))
('Action

('Action ', array([ 7.27737999,  3.00192571], dtype=float32))
('Action ', array([ 7.56484318,  8.19643402], dtype=float32))
('Action ', array([ 2.34727073,  1.07792211], dtype=float32))
('Action ', array([ 7.29888821,  7.82947159], dtype=float32))
('Action ', array([ 7.50767326,  6.76655102], dtype=float32))
('Action ', array([ 7.16917038,  7.68386459], dtype=float32))
('Action ', array([ 7.49931335,  7.22472668], dtype=float32))
('Action ', array([ 7.12265778,  7.63538933], dtype=float32))
('Action ', array([ 7.12265778,  7.63538933], dtype=float32))
('Action ', array([ 5.48414803,  2.4837296 ], dtype=float32))
('Action ', array([ 5.4157896 ,  5.38146496], dtype=float32))
('Action ', array([ 6.06738091,  2.49545598], dtype=float32))
('Action ', array([ 5.65871239,  5.75282669], dtype=float32))
('Action ', array([ 5.82540035,  2.47907948], dtype=float32))
('Action ', array([ 5.65708447,  5.75341892], dtype=float32))
('Action ', array([ 8.12145996,  8.02826977], dtype=float32))
('Action

('Action ', array([ 8.67502975,  8.56051922], dtype=float32))
('Action ', array([ 6.76749945,  7.89290571], dtype=float32))
('Action ', array([ 8.67502975,  8.56051922], dtype=float32))
('Action ', array([ 6.76749945,  7.89290571], dtype=float32))
('Action ', array([ 8.67502975,  8.56051922], dtype=float32))
('Action ', array([ 6.76749945,  7.89290571], dtype=float32))
('Action ', array([ 8.11341381,  7.63968515], dtype=float32))
('Action ', array([ 6.76749945,  7.89290571], dtype=float32))
('Action ', array([ 8.03249836,  7.25942087], dtype=float32))
('Action ', array([ 7.4248271 ,  8.95233154], dtype=float32))
('Action ', array([ 8.03249836,  7.25942087], dtype=float32))
('Action ', array([ 7.4248271 ,  8.95233154], dtype=float32))
('Action ', array([ 7.48254728,  6.86342859], dtype=float32))
('Action ', array([ 7.48049974,  8.90007305], dtype=float32))
('Action ', array([ 7.48418283,  8.94498825], dtype=float32))
('Action ', array([ 8.57594585,  6.46757555], dtype=float32))
('Action

('Action ', array([ 8.72062302,  8.62975502], dtype=float32))
('Action ', array([ 6.93970585,  8.70167446], dtype=float32))
('Action ', array([ 9.01035976,  9.0612011 ], dtype=float32))
('Action ', array([ 6.93970585,  8.70167446], dtype=float32))
('Action ', array([ 8.72062302,  8.62975502], dtype=float32))
('Action ', array([ 6.93970585,  8.70167446], dtype=float32))
('Action ', array([ 6.85300922,  8.61804485], dtype=float32))
('Action ', array([ 8.86349678,  8.86849117], dtype=float32))
('Action ', array([ 6.1276598 ,  7.89066458], dtype=float32))
('Action ', array([ 5.08745098,  5.63900995], dtype=float32))
('Action ', array([ 5.84393597,  7.57234621], dtype=float32))
('Action ', array([ 5.53645134,  5.67516565], dtype=float32))
('Action ', array([ 5.98571491,  7.01308489], dtype=float32))
('Action ', array([ 3.15684247,  3.85467029], dtype=float32))
('Action ', array([ 6.1622839 ,  6.68933725], dtype=float32))
Episode: 2115/5000, score: 15
('Action ', array([ 8.77034473,  8.64768

('Action ', array([ 8.62087536,  8.71462536], dtype=float32))
('Action ', array([ 6.89698839,  8.43769455], dtype=float32))
('Action ', array([ 9.06508064,  9.22456741], dtype=float32))
('Action ', array([ 6.88719606,  8.40732574], dtype=float32))
('Action ', array([ 8.96459389,  8.76018238], dtype=float32))
('Action ', array([ 6.85658884,  8.36015606], dtype=float32))
('Action ', array([ 7.05113983,  7.19086838], dtype=float32))
('Action ', array([ 6.19101477,  7.02119064], dtype=float32))
('Action ', array([ 2.83357191,  2.20055509], dtype=float32))
Episode: 2122/5000, score: 8
('Action ', array([ 8.65136814,  8.71633244], dtype=float32))
('Action ', array([ 7.29579782,  9.39985275], dtype=float32))
('Action ', array([ 8.65136814,  8.71633244], dtype=float32))
('Action ', array([ 6.80783319,  8.41924191], dtype=float32))
('Action ', array([ 7.59324265,  8.37949467], dtype=float32))
('Action ', array([ 6.98874712,  8.54402065], dtype=float32))
('Action ', array([ 6.4452281 ,  7.697117

('Action ', array([ 8.75208378,  8.90773201], dtype=float32))
('Action ', array([ 7.02353811,  8.38540459], dtype=float32))
('Action ', array([ 8.75208378,  8.90773201], dtype=float32))
('Action ', array([ 8.73604679,  8.07375431], dtype=float32))
('Action ', array([ 6.53230619,  7.7049284 ], dtype=float32))
('Action ', array([ 8.27367306,  8.03695583], dtype=float32))
('Action ', array([ 4.71196795,  5.54328728], dtype=float32))
('Action ', array([ 8.45512676,  8.282691  ], dtype=float32))
('Action ', array([ 4.61018896,  5.300457  ], dtype=float32))
('Action ', array([ 8.17244434,  7.86010838], dtype=float32))
('Action ', array([ 4.61261511,  5.28015423], dtype=float32))
('Action ', array([ 4.59647608,  5.22347641], dtype=float32))
('Action ', array([ 8.10200119,  7.6928339 ], dtype=float32))
('Action ', array([ 4.61685419,  5.176054  ], dtype=float32))
('Action ', array([ 8.9297142 ,  6.59627438], dtype=float32))
('Action ', array([ 4.74768209,  5.13678932], dtype=float32))
('Action

('Action ', array([ 7.51712465,  8.32237816], dtype=float32))
('Action ', array([ 7.50503111,  8.21456814], dtype=float32))
('Action ', array([ 8.0962286 ,  6.57180214], dtype=float32))
('Action ', array([ 7.58821249,  8.28535461], dtype=float32))
('Action ', array([ 10.64159489,   8.40166664], dtype=float32))
('Action ', array([ 7.34685183,  8.15663815], dtype=float32))
('Action ', array([ 7.354424  ,  5.09073448], dtype=float32))
('Action ', array([ 6.51450491,  7.16794014], dtype=float32))
('Action ', array([ 7.02927065,  3.21435738], dtype=float32))
('Action ', array([ 6.5031352 ,  7.17420006], dtype=float32))
('Action ', array([ 6.69731188, -4.48540688], dtype=float32))
('Action ', array([ 6.61570883,  7.1263752 ], dtype=float32))
('Action ', array([ 10.25765896,  -3.85636711], dtype=float32))
('Action ', array([ 7.81360292,  7.59384918], dtype=float32))
('Action ', array([ 10.99640465,  -0.71273232], dtype=float32))
('Action ', array([ 8.10830498,  7.14493752], dtype=float32))
('

('Action ', array([ 7.05047178,  8.95363522], dtype=float32))
('Action ', array([ 8.77403831,  9.17241287], dtype=float32))
('Action ', array([ 7.01529551,  8.90938473], dtype=float32))
('Action ', array([  7.62325954,  10.10827541], dtype=float32))
('Action ', array([ 6.4507947,  8.2710638], dtype=float32))
('Action ', array([ 3.49758196,  6.46928835], dtype=float32))
('Action ', array([ 6.28733301,  8.2191925 ], dtype=float32))
('Action ', array([-0.27308512,  1.01717818], dtype=float32))
Episode: 2145/5000, score: 8
('Action ', array([ 8.81923962,  9.1968832 ], dtype=float32))
('Action ', array([ 6.77512264,  8.38429928], dtype=float32))
('Action ', array([ 9.26074886,  9.46394444], dtype=float32))
('Action ', array([ 6.80013752,  8.35454273], dtype=float32))
('Action ', array([ 8.57397366,  9.25987339], dtype=float32))
('Action ', array([ 5.62678528,  6.7576704 ], dtype=float32))
('Action ', array([ 2.30995846,  3.16732311], dtype=float32))
('Action ', array([ 5.61745071,  6.591611

('Action ', array([ 8.90200424,  9.07943153], dtype=float32))
('Action ', array([ 6.30283689,  9.15875149], dtype=float32))
('Action ', array([ 8.90200424,  9.07943153], dtype=float32))
('Action ', array([ 6.37392664,  9.25133801], dtype=float32))
('Action ', array([  9.9178257 ,  10.03557014], dtype=float32))
('Action ', array([ 5.78591108,  8.66209888], dtype=float32))
('Action ', array([ 9.35958576,  9.1143961 ], dtype=float32))
('Action ', array([ 5.72392607,  8.58667088], dtype=float32))
('Action ', array([ 6.46673918,  7.18838263], dtype=float32))
('Action ', array([ 4.90532923,  6.85071135], dtype=float32))
Episode: 2154/5000, score: 9
('Action ', array([ 8.94248295,  9.07204723], dtype=float32))
('Action ', array([ 11.37227249,  10.48058224], dtype=float32))
('Action ', array([ 6.78752565,  9.62373066], dtype=float32))
('Action ', array([ 10.5049963 ,   9.18570232], dtype=float32))
('Action ', array([ 6.77872324,  9.66243839], dtype=float32))
('Action ', array([ 10.08703613,   

('Action ', array([ 9.12919426,  9.34070396], dtype=float32))
('Action ', array([  6.98099232,  10.30737305], dtype=float32))
('Action ', array([ 10.06308937,  10.56737518], dtype=float32))
('Action ', array([  6.9192028 ,  10.14905167], dtype=float32))
('Action ', array([  9.723773  ,  10.36004257], dtype=float32))
('Action ', array([  6.91982555,  10.14346313], dtype=float32))
('Action ', array([ 10.02750015,  10.31472397], dtype=float32))
('Action ', array([ 5.56454754,  7.4329443 ], dtype=float32))
('Action ', array([ 4.32740974,  3.20352149], dtype=float32))
Episode: 2162/5000, score: 8
('Action ', array([ 9.12548447,  9.34779644], dtype=float32))
('Action ', array([ 6.67601109,  9.73710537], dtype=float32))
('Action ', array([ 9.83242226,  9.57973576], dtype=float32))
('Action ', array([  7.10074615,  10.25155354], dtype=float32))
('Action ', array([ 11.28147984,  10.83450985], dtype=float32))
('Action ', array([  7.29704189,  10.26715946], dtype=float32))
('Action ', array([ 11.

('Action ', array([ 9.14732647,  9.49915218], dtype=float32))
('Action ', array([ 7.09734583,  9.93468952], dtype=float32))
('Action ', array([ 9.14732647,  9.49915218], dtype=float32))
('Action ', array([ 7.07697916,  9.8770752 ], dtype=float32))
('Action ', array([ 8.39423943,  9.92446613], dtype=float32))
('Action ', array([ 5.96634531,  8.2927084 ], dtype=float32))
('Action ', array([ 5.54382753,  6.01816273], dtype=float32))
('Action ', array([ 5.79918051,  8.12216759], dtype=float32))
Episode: 2171/5000, score: 7
('Action ', array([ 9.20596123,  9.52001858], dtype=float32))
('Action ', array([ 10.63579082,   9.43454742], dtype=float32))
('Action ', array([ 7.14154863,  9.4952383 ], dtype=float32))
('Action ', array([ 10.66939926,   9.33086014], dtype=float32))
('Action ', array([ 7.14411497,  9.4957962 ], dtype=float32))
('Action ', array([ 10.86763668,   8.5497427 ], dtype=float32))
('Action ', array([ 7.12386656,  9.57431889], dtype=float32))
('Action ', array([ 7.15531683,  9.

('Action ', array([ 9.33783245,  9.86281013], dtype=float32))
('Action ', array([  8.02788925,  10.18117332], dtype=float32))
('Action ', array([ 11.85611057,  12.4688282 ], dtype=float32))
('Action ', array([ 7.73972607,  9.81229019], dtype=float32))
('Action ', array([ 8.09951878,  8.6423378 ], dtype=float32))
('Action ', array([ 7.6573391 ,  9.56195164], dtype=float32))
('Action ', array([ 6.81504631,  7.27628374], dtype=float32))
('Action ', array([ 2.79036522,  4.26325655], dtype=float32))
('Action ', array([ 6.04213047,  5.94651556], dtype=float32))
Episode: 2180/5000, score: 9
('Action ', array([ 9.36641121,  9.86064053], dtype=float32))
('Action ', array([ 7.55962944,  9.60911369], dtype=float32))
('Action ', array([ 10.81957626,  11.25166988], dtype=float32))
('Action ', array([ 7.95405674,  9.92163944], dtype=float32))
('Action ', array([ 10.0616436 ,  10.19921398], dtype=float32))
('Action ', array([ 6.9003973 ,  8.20011234], dtype=float32))
('Action ', array([ 6.17831898,  

('Action ', array([ 9.5060873 ,  9.80644608], dtype=float32))
('Action ', array([ 10.35496044,   9.40811539], dtype=float32))
('Action ', array([ 8.05156803,  9.35061932], dtype=float32))
('Action ', array([ 10.87391186,   8.95371628], dtype=float32))
('Action ', array([ 8.03280258,  9.32785988], dtype=float32))
('Action ', array([ 11.34939861,   7.20084572], dtype=float32))
('Action ', array([ 10.66027546,   5.72462654], dtype=float32))
('Action ', array([ 8.03280258,  9.32785988], dtype=float32))
('Action ', array([ 10.66027546,   5.72462654], dtype=float32))
('Action ', array([ 6.7207737 ,  8.22927284], dtype=float32))
('Action ', array([ 10.65940094,   5.70542717], dtype=float32))
('Action ', array([ 10.62664509,   5.82893753], dtype=float32))
('Action ', array([ 6.7207737 ,  8.22927284], dtype=float32))
('Action ', array([ 10.62664509,   5.82893753], dtype=float32))
('Action ', array([ 6.7207737 ,  8.22927284], dtype=float32))
('Action ', array([ 6.7207737 ,  8.22927284], dtype=fl

('Action ', array([ 9.46346474,  9.66093636], dtype=float32))
('Action ', array([ 7.60060883,  9.1374197 ], dtype=float32))
('Action ', array([ 9.96530914,  9.51795387], dtype=float32))
('Action ', array([ 10.04529095,   9.50478077], dtype=float32))
('Action ', array([ 7.63319111,  9.14012241], dtype=float32))
('Action ', array([ 10.04529095,   9.50478077], dtype=float32))
('Action ', array([ 7.63319111,  9.14012241], dtype=float32))
('Action ', array([ 10.14959908,   9.59152412], dtype=float32))
('Action ', array([ 7.63319111,  9.14012241], dtype=float32))
('Action ', array([ 10.15211582,   9.66797733], dtype=float32))
('Action ', array([ 7.63319111,  9.14012241], dtype=float32))
('Action ', array([ 10.21178532,   9.6920414 ], dtype=float32))
('Action ', array([ 7.6419487 ,  9.14117622], dtype=float32))
('Action ', array([ 10.05175972,   9.65406609], dtype=float32))
('Action ', array([ 7.6419487 ,  9.14117622], dtype=float32))
('Action ', array([ 10.06357574,   9.64191437], dtype=floa

('Action ', array([ 6.40911579,  5.72041512], dtype=float32))
('Action ', array([ 4.97501373, -0.75833535], dtype=float32))
('Action ', array([ 7.0966959 ,  6.54008484], dtype=float32))
('Action ', array([-4.03532887, -0.78476739], dtype=float32))
Episode: 2201/5000, score: 32
('Action ', array([ 9.54328346,  9.62016296], dtype=float32))
('Action ', array([ 8.22452641,  9.57107162], dtype=float32))
('Action ', array([ 9.81768322,  7.63600302], dtype=float32))
('Action ', array([ 8.35333824,  9.97034645], dtype=float32))
('Action ', array([ 9.54102039,  5.55831671], dtype=float32))
('Action ', array([ 8.22469711,  9.77692223], dtype=float32))
('Action ', array([ 7.98826838,  4.5515151 ], dtype=float32))
('Action ', array([ 8.22873211,  9.78846359], dtype=float32))
('Action ', array([ 8.77886009,  4.68523169], dtype=float32))
('Action ', array([ 8.22197247,  9.77802944], dtype=float32))
('Action ', array([ 8.77886009,  4.68523169], dtype=float32))
('Action ', array([ 8.22197247,  9.77802

KeyboardInterrupt: 