In [1]:
import numpy as np
from PIL import Image

In [2]:

import torch
import torch.nn as nn
import torch.optim as optim
import torch.nn.functional as F
import torchvision.transforms as T

import argparse
import time
import numpy as np
import collections

from tensorboardX import SummaryWriter

In [3]:
import gym

env = gym.make("FetchReach-v1")
DEFAULT_ENV_NAME="FetchReach-v1"

  result = entry_point.load(False)


In [4]:
print(env.action_space)
print(env.action_space.sample())

Box(4,)
[0.09762701 0.43037874 0.20552675 0.08976637]


In [5]:
print(env.observation_space)

Dict(achieved_goal:Box(3,), desired_goal:Box(3,), observation:Box(10,))


In [6]:
class DQN(nn.Module):

    def __init__(self):
        super(DQN, self).__init__()
        # 4 input image channel, 32 output channels, 3x3 square convolution
        # kernel
        self.pipe = nn.Sequential(
            nn.Linear(16,128),
            nn.ReLU(),
            nn.Linear(128,256),
            nn.ReLU(),
            nn.Linear(256,4)
        )

    def forward(self, x):  
        x= x.float()
        return self.pipe(x)


In [7]:
GAMMA = 0.99
BATCH_SIZE = 32
REPLAY_SIZE = 10000
REPLAY_START_SIZE = 10000
LEARNING_RATE = 1e-4
SYNC_TARGET_FRAMES = 1000

In [8]:
#epsilon decay, for choosing random actions to explore space
EPSILON_DECAY_LAST_FRAME = 10**5
EPSILON_START = 1.0
EPSILON_FINAL = 0.02
#Going from 1 to .02 in 100000 frames
MEAN_REWARD_BOUND=50

In [9]:
#define what experience is
Experience = collections.namedtuple("Experience", 
                        field_names = ['state','action','reward', 'done','new_state'])

class ExperienceBuffer:
     #This acts as our replay buffer
    def __init__(self,capacity):
        self.buffer = collections.deque(maxlen=capacity) #rotating buffer
    
    def __len__(self):
        return len(self.buffer)
    
    def append(self, experience):
        self.buffer.append(experience)
        
    def sample(self,batch_size):
        indices = np.random.choice(
            len(self.buffer), batch_size, replace =False)
        
        states,actions,rewards,dones, next_states = \
            zip(*[self.buffer[idx] for idx in indices])
        
        states,actions = np.array(states),np.array(actions)
        rewards = np.array(rewards,dtype=np.float32)
        dones =np.array(dones, dtype=np.float32)
        return states,actions,rewards,dones,next_states

In [10]:
#make our agent that acts and learns in the environment
class Agent:
    def __init__(self, env, exp_buffer):
        self.env = env
        self.exp_buffer = exp_buffer
        self._reset()
        
    def _reset(self):
        state = env.reset()
        
        
        self.state = np.concatenate(list(state.values()))
        self.total_reward = 0.0
    
    def play_step(self, net, epsilong=0.0, device ='cpu'):
        done_reward = None
        
        if np.random.random() < epsilon:
            action = env.action_space.sample()
        else:
            state_a = np.array([self.state], copy=False)
            state_v = torch.tensor(state_a).to(device)
            q_vals_v =  net(state_v)
            _, act_v = torch.max(q_vals_v,dim=1)
            
            #print("whats going on here?")
            action = int(act_v.item())
            
            #take the action and update
            #env.show()
            new_state, reward, is_done, _ = self.env.step(action)  
            new_state = np.concatenate(list(new_state.values()))
            reward +=1.0
            self.total_reward += reward
            #do we need this? is it doing a copy?
            new_state = new_state
            
            exp = Experience(self.state,action,reward,is_done,new_state)
            
            self.exp_buffer.append(exp)
            self.state = new_state
            
            if(is_done):
                done_reward = self.total_reward
                self._reset()
            return done_reward
        
def calc_loss(batch, net, target_net, device='cpu'):
    states,actions,rewards,dones,next_states = batch
    
    
    states_v = torch.tensor(states).to(device)
    next_states_v = torch.tensor(next_states).to(device)
    actions_v = torch.tensor(actions).to(device)
    rewards_v = torch.tensor(rewards).to(device)
    done_mask = torch.ByteTensor(dones).to(device)

    #predictions
    #look into gather further
    state_action_values = net(states_v).gather(1,actions_v.unsqueeze(-1)).squeeze(-1)

    #what is the value of being in the state that our action took us to?
    next_state_values = target_net(next_states_v).max(1)[0] #take the max along the first axis


    # saying the reward of the step after finishing is zero
    # required to converege
    next_state_values[done_mask] = 0.0

    #we do not want to perform backprop on this 
    next_state_values = next_state_values.detach() 

    #-------------Bellman equation------------------
    expected_state_action_values = next_state_values * GAMMA + rewards_v

    return nn.MSELoss()(state_action_values, expected_state_action_values)

In [11]:
if __name__ == "__main__":
    #parser = argparse.ArgumentParser()
    #parser.add_argument("--cude", default=False, action='store_true', help="Enable cuda")
    
    #parser.add_argument("--env", default= DEFAULT_ENV_NAME, 
    #                    help="name of the environment, default="+DEFAULT_ENV_NAME)
    
    #parser.add_argument("--reward", type=float, default=MEAN_REWARD_BOUND, 
    #                    help="Mean reward boundary for stop of training, default= %.2f"% MEAN_REWARD_BOUND)
    
    #args = parser.parse_args()
    args= [False,DEFAULT_ENV_NAME,MEAN_REWARD_BOUND]
    #device= torch.device("cuda" if args.cuda else "cpu")
    device = 'cpu'
    
    env = gym.make(DEFAULT_ENV_NAME)#args.env)
    net = DQN().to(device)
    
    target_net = DQN().to(device)
    
    writer = SummaryWriter(comment='-'+DEFAULT_ENV_NAME)#args.env)
    print(net)
    
    buffer = ExperienceBuffer(REPLAY_SIZE)
    agent = Agent(env, buffer)
    
    epsilon = EPSILON_START
    
    optimizer = optim.Adam(net.parameters(), lr=LEARNING_RATE)
    total_rewards = []
    frame_idx = 0
    ts_frame = 0
    ts = time.time()
    
    best_mean_reward = None
    
    while True:
        frame_idx += 1
        epsilon = max(EPSILON_FINAL, EPSILON_START - (frame_idx / EPSILON_DECAY_LAST_FRAME))
        
        reward = agent.play_step(net, epsilon, device=device)
        if reward is not None:
            total_rewards.append(reward)
            speed = (frame_idx - ts_frame) / (time.time() - ts)
            ts_frame = frame_idx
            ts = time.time()
            
            mean_reward = np.mean(total_rewards[-100:])
            print("%d: done %d games, mean reward %.3f, eps %.2f, speed %.2f f/s" %(
                frame_idx, len(total_rewards), mean_reward, epsilon, speed
            ))
            
            writer.add_scalar("epsilon", epsilon, frame_idx)
            writer.add_scalar("speed", speed, frame_idx)
            writer.add_scalar("reward_100", mean_reward, frame_idx)
            writer.add_scalar("reward", reward, frame_idx)
            
            if best_mean_reward  is None or best_mean_reward < mean_reward:
                torch.save(net.state_dict(), DEFAULT_ENV_NAME+"-best.dat")
                if(best_mean_reward is not None):
                    print('best mean reward updated %.3f -> %.3f, model saved'%
                             (best_mean_reward, mean_reward))
                    best_mean_reward = mean_reward
                if(mean_reward > MEAN_REWARD_BOUND):
                    print("solved in %d frames!" % frame_idx)
                    break
                
            if(len(buffer) < REPLAY_START_SIZE):
                continue
            
            if(frame_idx % SYNC_TARGET_FRAMES == 0):
                target_net.load_state_dict(net.state_dict())
            
            optimizer.zero_grad()
            batch = buffer.sample(BATCH_SIZE)
            loss_t = calc_loss(batch, net, target_net, device=device)
            
            loss_t.backward()
            optimizer.step()

DQN(
  (pipe): Sequential(
    (0): Linear(in_features=16, out_features=128, bias=True)
    (1): ReLU()
    (2): Linear(in_features=128, out_features=256, bias=True)
    (3): ReLU()
    (4): Linear(in_features=256, out_features=4, bias=True)
  )
)
2942: done 1 games, mean reward -50.000, eps 0.97, speed 17051.92 f/s
4081: done 2 games, mean reward -50.000, eps 0.96, speed 10313.58 f/s
5063: done 3 games, mean reward -50.000, eps 0.95, speed 7457.76 f/s
6109: done 4 games, mean reward -50.000, eps 0.94, speed 5868.76 f/s
6985: done 5 games, mean reward -50.000, eps 0.93, speed 7718.93 f/s
7709: done 6 games, mean reward -50.000, eps 0.92, speed 6862.23 f/s
8307: done 7 games, mean reward -50.000, eps 0.92, speed 4877.94 f/s
8861: done 8 games, mean reward -50.000, eps 0.91, speed 3270.33 f/s
9495: done 9 games, mean reward -50.000, eps 0.91, speed 3538.45 f/s
9847: done 10 games, mean reward -50.000, eps 0.90, speed 1948.03 f/s
10357: done 11 games, mean reward -50.000, eps 0.90, speed 

33635: done 113 games, mean reward -48.750, eps 0.66, speed 1495.54 f/s
33804: done 114 games, mean reward -48.750, eps 0.66, speed 1321.76 f/s
33970: done 115 games, mean reward -48.750, eps 0.66, speed 1621.84 f/s
34085: done 116 games, mean reward -48.750, eps 0.66, speed 1157.72 f/s
34241: done 117 games, mean reward -48.750, eps 0.66, speed 1596.72 f/s
34374: done 118 games, mean reward -48.750, eps 0.66, speed 1275.99 f/s
34533: done 119 games, mean reward -48.750, eps 0.65, speed 1343.19 f/s
34673: done 120 games, mean reward -48.750, eps 0.65, speed 1349.52 f/s
34822: done 121 games, mean reward -48.750, eps 0.65, speed 1533.99 f/s
34957: done 122 games, mean reward -48.750, eps 0.65, speed 1342.29 f/s
35113: done 123 games, mean reward -48.750, eps 0.65, speed 1585.66 f/s
35260: done 124 games, mean reward -48.750, eps 0.65, speed 1444.72 f/s
35389: done 125 games, mean reward -48.750, eps 0.65, speed 1135.00 f/s
35517: done 126 games, mean reward -48.750, eps 0.64, speed 1175

47791: done 229 games, mean reward -48.880, eps 0.52, speed 1145.26 f/s
47893: done 230 games, mean reward -48.880, eps 0.52, speed 1070.13 f/s
47985: done 231 games, mean reward -48.870, eps 0.52, speed 972.32 f/s
48084: done 232 games, mean reward -48.870, eps 0.52, speed 1022.74 f/s
48175: done 233 games, mean reward -48.870, eps 0.52, speed 966.61 f/s
48280: done 234 games, mean reward -48.870, eps 0.52, speed 1027.31 f/s
48388: done 235 games, mean reward -48.870, eps 0.52, speed 1093.50 f/s
48503: done 236 games, mean reward -48.870, eps 0.51, speed 1214.28 f/s
48598: done 237 games, mean reward -48.870, eps 0.51, speed 1008.23 f/s
48694: done 238 games, mean reward -48.870, eps 0.51, speed 994.61 f/s
48795: done 239 games, mean reward -48.870, eps 0.51, speed 1067.06 f/s
48893: done 240 games, mean reward -49.370, eps 0.51, speed 1032.58 f/s
48998: done 241 games, mean reward -49.360, eps 0.51, speed 1080.41 f/s
49087: done 242 games, mean reward -49.360, eps 0.51, speed 939.01 

58600: done 345 games, mean reward -49.880, eps 0.41, speed 868.14 f/s
58691: done 346 games, mean reward -49.880, eps 0.41, speed 953.72 f/s
58784: done 347 games, mean reward -49.880, eps 0.41, speed 942.75 f/s
58893: done 348 games, mean reward -49.880, eps 0.41, speed 1077.18 f/s
58987: done 349 games, mean reward -49.880, eps 0.41, speed 934.30 f/s
59068: done 350 games, mean reward -49.890, eps 0.41, speed 852.02 f/s
59156: done 351 games, mean reward -49.890, eps 0.41, speed 911.70 f/s
59251: done 352 games, mean reward -49.890, eps 0.41, speed 998.65 f/s
59346: done 353 games, mean reward -49.890, eps 0.41, speed 1001.51 f/s
59423: done 354 games, mean reward -49.890, eps 0.41, speed 785.47 f/s
59496: done 355 games, mean reward -49.890, eps 0.41, speed 751.73 f/s
59582: done 356 games, mean reward -49.890, eps 0.40, speed 884.31 f/s
59663: done 357 games, mean reward -49.890, eps 0.40, speed 827.43 f/s
59742: done 358 games, mean reward -49.890, eps 0.40, speed 806.23 f/s
5982

67744: done 461 games, mean reward -49.900, eps 0.32, speed 742.48 f/s
67824: done 462 games, mean reward -49.900, eps 0.32, speed 817.69 f/s
67895: done 463 games, mean reward -49.900, eps 0.32, speed 729.35 f/s
67961: done 464 games, mean reward -49.900, eps 0.32, speed 677.26 f/s
68042: done 465 games, mean reward -49.900, eps 0.32, speed 826.63 f/s
68117: done 466 games, mean reward -49.900, eps 0.32, speed 773.56 f/s
68191: done 467 games, mean reward -49.900, eps 0.32, speed 756.75 f/s
68269: done 468 games, mean reward -49.900, eps 0.32, speed 799.89 f/s
68346: done 469 games, mean reward -49.900, eps 0.32, speed 792.18 f/s
68416: done 470 games, mean reward -49.900, eps 0.32, speed 714.99 f/s
68483: done 471 games, mean reward -49.900, eps 0.32, speed 691.87 f/s
68558: done 472 games, mean reward -49.890, eps 0.31, speed 772.16 f/s
68628: done 473 games, mean reward -49.910, eps 0.31, speed 718.78 f/s
68694: done 474 games, mean reward -49.910, eps 0.31, speed 681.41 f/s
68769:

75923: done 578 games, mean reward -49.960, eps 0.24, speed 734.28 f/s
75996: done 579 games, mean reward -49.960, eps 0.24, speed 770.33 f/s
76063: done 580 games, mean reward -49.950, eps 0.24, speed 710.65 f/s
76121: done 581 games, mean reward -49.950, eps 0.24, speed 602.48 f/s
76198: done 582 games, mean reward -49.960, eps 0.24, speed 810.63 f/s
76265: done 583 games, mean reward -49.960, eps 0.24, speed 710.97 f/s
76345: done 584 games, mean reward -49.960, eps 0.24, speed 822.92 f/s
76408: done 585 games, mean reward -49.960, eps 0.24, speed 663.54 f/s
76469: done 586 games, mean reward -49.950, eps 0.24, speed 647.51 f/s
76532: done 587 games, mean reward -49.950, eps 0.23, speed 655.76 f/s
76596: done 588 games, mean reward -49.950, eps 0.23, speed 675.46 f/s
76661: done 589 games, mean reward -49.950, eps 0.23, speed 690.61 f/s
76730: done 590 games, mean reward -49.950, eps 0.23, speed 577.28 f/s
76802: done 591 games, mean reward -49.950, eps 0.23, speed 762.02 f/s
76876:

83272: done 694 games, mean reward -49.930, eps 0.17, speed 313.50 f/s
83329: done 695 games, mean reward -49.930, eps 0.17, speed 397.39 f/s
83386: done 696 games, mean reward -49.930, eps 0.17, speed 389.01 f/s
83443: done 697 games, mean reward -49.930, eps 0.17, speed 330.20 f/s
83507: done 698 games, mean reward -49.930, eps 0.16, speed 470.95 f/s
83564: done 699 games, mean reward -49.930, eps 0.16, speed 560.59 f/s
83623: done 700 games, mean reward -49.940, eps 0.16, speed 545.82 f/s
83687: done 701 games, mean reward -49.940, eps 0.16, speed 639.55 f/s
83747: done 702 games, mean reward -49.940, eps 0.16, speed 538.67 f/s
83802: done 703 games, mean reward -49.940, eps 0.16, speed 450.81 f/s
83861: done 704 games, mean reward -49.940, eps 0.16, speed 569.52 f/s
83922: done 705 games, mean reward -49.940, eps 0.16, speed 532.06 f/s
83986: done 706 games, mean reward -49.940, eps 0.16, speed 632.13 f/s
84045: done 707 games, mean reward -49.940, eps 0.16, speed 605.32 f/s
84102:

89961: done 810 games, mean reward -49.920, eps 0.10, speed 482.25 f/s
90024: done 811 games, mean reward -49.920, eps 0.10, speed 584.67 f/s
90080: done 812 games, mean reward -49.920, eps 0.10, speed 524.09 f/s
90137: done 813 games, mean reward -49.920, eps 0.10, speed 534.01 f/s
90194: done 814 games, mean reward -49.920, eps 0.10, speed 526.06 f/s
90248: done 815 games, mean reward -49.920, eps 0.10, speed 547.87 f/s
90303: done 816 games, mean reward -49.920, eps 0.10, speed 596.17 f/s
90360: done 817 games, mean reward -49.920, eps 0.10, speed 576.47 f/s
90416: done 818 games, mean reward -49.910, eps 0.10, speed 573.19 f/s
90470: done 819 games, mean reward -49.910, eps 0.10, speed 586.34 f/s
90523: done 820 games, mean reward -49.910, eps 0.09, speed 563.34 f/s
90581: done 821 games, mean reward -49.910, eps 0.09, speed 581.93 f/s
90631: done 822 games, mean reward -49.910, eps 0.09, speed 295.70 f/s
90685: done 823 games, mean reward -49.910, eps 0.09, speed 247.33 f/s
90738:

96315: done 928 games, mean reward -49.910, eps 0.04, speed 544.03 f/s
96365: done 929 games, mean reward -49.910, eps 0.04, speed 528.05 f/s
96418: done 930 games, mean reward -49.910, eps 0.04, speed 559.79 f/s
96469: done 931 games, mean reward -49.910, eps 0.04, speed 535.72 f/s
96520: done 932 games, mean reward -49.910, eps 0.03, speed 537.71 f/s
96571: done 933 games, mean reward -49.930, eps 0.03, speed 538.80 f/s
96621: done 934 games, mean reward -49.930, eps 0.03, speed 521.69 f/s
96672: done 935 games, mean reward -49.930, eps 0.03, speed 537.60 f/s
96722: done 936 games, mean reward -49.950, eps 0.03, speed 528.19 f/s
96774: done 937 games, mean reward -49.950, eps 0.03, speed 546.08 f/s
96826: done 938 games, mean reward -49.950, eps 0.03, speed 551.65 f/s
96877: done 939 games, mean reward -49.950, eps 0.03, speed 540.20 f/s
96929: done 940 games, mean reward -49.950, eps 0.03, speed 546.54 f/s
96979: done 941 games, mean reward -49.950, eps 0.03, speed 529.53 f/s
97029:

102197: done 1043 games, mean reward -49.970, eps 0.02, speed 540.16 f/s
102248: done 1044 games, mean reward -49.970, eps 0.02, speed 513.50 f/s
102300: done 1045 games, mean reward -49.970, eps 0.02, speed 579.33 f/s
102351: done 1046 games, mean reward -49.970, eps 0.02, speed 534.43 f/s
102401: done 1047 games, mean reward -49.970, eps 0.02, speed 529.10 f/s
102451: done 1048 games, mean reward -49.970, eps 0.02, speed 527.58 f/s
102501: done 1049 games, mean reward -49.970, eps 0.02, speed 498.95 f/s
102552: done 1050 games, mean reward -49.970, eps 0.02, speed 537.14 f/s
102603: done 1051 games, mean reward -49.970, eps 0.02, speed 537.93 f/s
102654: done 1052 games, mean reward -49.970, eps 0.02, speed 465.97 f/s
102707: done 1053 games, mean reward -49.970, eps 0.02, speed 500.55 f/s
102757: done 1054 games, mean reward -49.970, eps 0.02, speed 492.11 f/s
102807: done 1055 games, mean reward -49.970, eps 0.02, speed 526.59 f/s
102861: done 1056 games, mean reward -49.970, eps 0

108032: done 1157 games, mean reward -49.930, eps 0.02, speed 568.83 f/s
108082: done 1158 games, mean reward -49.940, eps 0.02, speed 527.58 f/s
108132: done 1159 games, mean reward -49.920, eps 0.02, speed 538.27 f/s
108183: done 1160 games, mean reward -49.920, eps 0.02, speed 541.28 f/s
108233: done 1161 games, mean reward -49.920, eps 0.02, speed 545.49 f/s
108283: done 1162 games, mean reward -49.920, eps 0.02, speed 541.71 f/s
108333: done 1163 games, mean reward -49.920, eps 0.02, speed 535.70 f/s
108384: done 1164 games, mean reward -49.920, eps 0.02, speed 554.21 f/s
108435: done 1165 games, mean reward -49.920, eps 0.02, speed 555.33 f/s
108485: done 1166 games, mean reward -49.920, eps 0.02, speed 538.35 f/s
108537: done 1167 games, mean reward -49.920, eps 0.02, speed 565.43 f/s
108588: done 1168 games, mean reward -49.920, eps 0.02, speed 554.61 f/s
108639: done 1169 games, mean reward -49.920, eps 0.02, speed 434.03 f/s
108690: done 1170 games, mean reward -49.920, eps 0

113870: done 1271 games, mean reward -49.920, eps 0.02, speed 316.52 f/s
113920: done 1272 games, mean reward -49.920, eps 0.02, speed 356.67 f/s
113971: done 1273 games, mean reward -49.920, eps 0.02, speed 378.43 f/s
114021: done 1274 games, mean reward -49.920, eps 0.02, speed 405.46 f/s
114071: done 1275 games, mean reward -49.910, eps 0.02, speed 369.81 f/s
114121: done 1276 games, mean reward -49.910, eps 0.02, speed 380.32 f/s
114172: done 1277 games, mean reward -49.930, eps 0.02, speed 382.23 f/s
114222: done 1278 games, mean reward -49.930, eps 0.02, speed 265.02 f/s
114272: done 1279 games, mean reward -49.930, eps 0.02, speed 288.66 f/s
114325: done 1280 games, mean reward -49.930, eps 0.02, speed 272.28 f/s
114375: done 1281 games, mean reward -49.940, eps 0.02, speed 246.98 f/s
114425: done 1282 games, mean reward -49.940, eps 0.02, speed 274.30 f/s
114476: done 1283 games, mean reward -49.940, eps 0.02, speed 353.12 f/s
114526: done 1284 games, mean reward -49.940, eps 0

119617: done 1384 games, mean reward -49.910, eps 0.02, speed 534.40 f/s
119667: done 1385 games, mean reward -49.910, eps 0.02, speed 529.04 f/s
119717: done 1386 games, mean reward -49.910, eps 0.02, speed 529.04 f/s
119769: done 1387 games, mean reward -49.910, eps 0.02, speed 546.08 f/s
119822: done 1388 games, mean reward -49.910, eps 0.02, speed 563.46 f/s
119872: done 1389 games, mean reward -49.910, eps 0.02, speed 503.44 f/s
119923: done 1390 games, mean reward -49.910, eps 0.02, speed 535.25 f/s
119974: done 1391 games, mean reward -49.910, eps 0.02, speed 538.51 f/s
120026: done 1392 games, mean reward -49.910, eps 0.02, speed 550.53 f/s
120077: done 1393 games, mean reward -49.910, eps 0.02, speed 491.77 f/s
120129: done 1394 games, mean reward -49.910, eps 0.02, speed 482.95 f/s
120182: done 1395 games, mean reward -49.910, eps 0.02, speed 557.90 f/s
120232: done 1396 games, mean reward -49.910, eps 0.02, speed 489.58 f/s
120282: done 1397 games, mean reward -49.910, eps 0

125492: done 1499 games, mean reward -49.920, eps 0.02, speed 531.43 f/s
125543: done 1500 games, mean reward -49.920, eps 0.02, speed 533.79 f/s
125593: done 1501 games, mean reward -49.920, eps 0.02, speed 529.14 f/s
125645: done 1502 games, mean reward -49.920, eps 0.02, speed 486.60 f/s
125696: done 1503 games, mean reward -49.920, eps 0.02, speed 538.22 f/s
125747: done 1504 games, mean reward -49.920, eps 0.02, speed 535.92 f/s
125797: done 1505 games, mean reward -49.920, eps 0.02, speed 522.29 f/s
125849: done 1506 games, mean reward -49.920, eps 0.02, speed 549.29 f/s
125901: done 1507 games, mean reward -49.920, eps 0.02, speed 550.41 f/s
125951: done 1508 games, mean reward -49.920, eps 0.02, speed 523.92 f/s
126001: done 1509 games, mean reward -49.920, eps 0.02, speed 528.55 f/s
126051: done 1510 games, mean reward -49.920, eps 0.02, speed 508.86 f/s
126102: done 1511 games, mean reward -49.930, eps 0.02, speed 531.43 f/s
126154: done 1512 games, mean reward -49.930, eps 0

131305: done 1613 games, mean reward -49.900, eps 0.02, speed 443.38 f/s
131357: done 1614 games, mean reward -49.900, eps 0.02, speed 533.98 f/s
131407: done 1615 games, mean reward -49.900, eps 0.02, speed 516.46 f/s
131460: done 1616 games, mean reward -49.900, eps 0.02, speed 542.69 f/s
131511: done 1617 games, mean reward -49.900, eps 0.02, speed 536.62 f/s
131562: done 1618 games, mean reward -49.900, eps 0.02, speed 540.12 f/s
131614: done 1619 games, mean reward -49.900, eps 0.02, speed 545.49 f/s
131667: done 1620 games, mean reward -49.900, eps 0.02, speed 556.51 f/s
131717: done 1621 games, mean reward -49.900, eps 0.02, speed 475.18 f/s
131767: done 1622 games, mean reward -49.900, eps 0.02, speed 505.83 f/s
131817: done 1623 games, mean reward -49.900, eps 0.02, speed 517.54 f/s
131867: done 1624 games, mean reward -49.900, eps 0.02, speed 511.32 f/s
131917: done 1625 games, mean reward -49.900, eps 0.02, speed 407.62 f/s
131969: done 1626 games, mean reward -49.900, eps 0

137094: done 1726 games, mean reward -49.920, eps 0.02, speed 431.98 f/s
137145: done 1727 games, mean reward -49.900, eps 0.02, speed 354.28 f/s
137196: done 1728 games, mean reward -49.900, eps 0.02, speed 415.33 f/s
137248: done 1729 games, mean reward -49.900, eps 0.02, speed 370.83 f/s
137300: done 1730 games, mean reward -49.890, eps 0.02, speed 426.56 f/s
137350: done 1731 games, mean reward -49.890, eps 0.02, speed 464.68 f/s
137402: done 1732 games, mean reward -49.890, eps 0.02, speed 474.26 f/s
137453: done 1733 games, mean reward -49.890, eps 0.02, speed 519.92 f/s
137505: done 1734 games, mean reward -49.890, eps 0.02, speed 368.53 f/s
137556: done 1735 games, mean reward -49.890, eps 0.02, speed 380.09 f/s
137607: done 1736 games, mean reward -49.890, eps 0.02, speed 410.56 f/s
137657: done 1737 games, mean reward -49.890, eps 0.02, speed 366.95 f/s
137708: done 1738 games, mean reward -49.890, eps 0.02, speed 453.86 f/s
137759: done 1739 games, mean reward -49.890, eps 0

142966: done 1841 games, mean reward -49.900, eps 0.02, speed 534.82 f/s
143018: done 1842 games, mean reward -49.900, eps 0.02, speed 561.34 f/s
143069: done 1843 games, mean reward -49.900, eps 0.02, speed 550.79 f/s
143120: done 1844 games, mean reward -49.900, eps 0.02, speed 540.33 f/s
143171: done 1845 games, mean reward -49.900, eps 0.02, speed 549.42 f/s
143222: done 1846 games, mean reward -49.900, eps 0.02, speed 530.75 f/s
143272: done 1847 games, mean reward -49.900, eps 0.02, speed 523.06 f/s
143322: done 1848 games, mean reward -49.910, eps 0.02, speed 528.33 f/s
143372: done 1849 games, mean reward -49.910, eps 0.02, speed 367.88 f/s
143424: done 1850 games, mean reward -49.910, eps 0.02, speed 397.82 f/s
143474: done 1851 games, mean reward -49.910, eps 0.02, speed 521.74 f/s
143525: done 1852 games, mean reward -49.910, eps 0.02, speed 548.09 f/s
143576: done 1853 games, mean reward -49.890, eps 0.02, speed 509.15 f/s
143628: done 1854 games, mean reward -49.890, eps 0

148830: done 1956 games, mean reward -49.890, eps 0.02, speed 490.75 f/s
148881: done 1957 games, mean reward -49.890, eps 0.02, speed 537.88 f/s
148932: done 1958 games, mean reward -49.890, eps 0.02, speed 538.45 f/s
148982: done 1959 games, mean reward -49.890, eps 0.02, speed 490.29 f/s
149034: done 1960 games, mean reward -49.890, eps 0.02, speed 541.67 f/s
149085: done 1961 games, mean reward -49.890, eps 0.02, speed 353.26 f/s
149135: done 1962 games, mean reward -49.890, eps 0.02, speed 372.99 f/s
149186: done 1963 games, mean reward -49.910, eps 0.02, speed 508.28 f/s
149236: done 1964 games, mean reward -49.910, eps 0.02, speed 540.10 f/s
149286: done 1965 games, mean reward -49.910, eps 0.02, speed 423.22 f/s
149339: done 1966 games, mean reward -49.910, eps 0.02, speed 399.87 f/s
149391: done 1967 games, mean reward -49.910, eps 0.02, speed 485.35 f/s
149444: done 1968 games, mean reward -49.910, eps 0.02, speed 551.92 f/s
149495: done 1969 games, mean reward -49.910, eps 0

154718: done 2071 games, mean reward -49.920, eps 0.02, speed 489.94 f/s
154772: done 2072 games, mean reward -49.920, eps 0.02, speed 566.21 f/s
154823: done 2073 games, mean reward -49.920, eps 0.02, speed 537.39 f/s
154873: done 2074 games, mean reward -49.920, eps 0.02, speed 495.25 f/s
154924: done 2075 games, mean reward -49.900, eps 0.02, speed 538.45 f/s
154977: done 2076 games, mean reward -49.900, eps 0.02, speed 559.45 f/s
155029: done 2077 games, mean reward -49.900, eps 0.02, speed 516.45 f/s
155080: done 2078 games, mean reward -49.900, eps 0.02, speed 539.13 f/s
155131: done 2079 games, mean reward -49.900, eps 0.02, speed 541.30 f/s
155181: done 2080 games, mean reward -49.900, eps 0.02, speed 496.99 f/s
155232: done 2081 games, mean reward -49.900, eps 0.02, speed 503.56 f/s
155284: done 2082 games, mean reward -49.900, eps 0.02, speed 546.47 f/s
155334: done 2083 games, mean reward -49.900, eps 0.02, speed 489.51 f/s
155384: done 2084 games, mean reward -49.900, eps 0

160544: done 2185 games, mean reward -49.960, eps 0.02, speed 460.17 f/s
160596: done 2186 games, mean reward -49.960, eps 0.02, speed 543.44 f/s
160646: done 2187 games, mean reward -49.960, eps 0.02, speed 529.48 f/s
160698: done 2188 games, mean reward -49.950, eps 0.02, speed 511.56 f/s
160750: done 2189 games, mean reward -49.950, eps 0.02, speed 546.90 f/s
160801: done 2190 games, mean reward -49.960, eps 0.02, speed 538.82 f/s
160853: done 2191 games, mean reward -49.960, eps 0.02, speed 512.10 f/s
160903: done 2192 games, mean reward -49.960, eps 0.02, speed 527.35 f/s
160956: done 2193 games, mean reward -49.960, eps 0.02, speed 558.53 f/s
161009: done 2194 games, mean reward -49.960, eps 0.02, speed 522.86 f/s
161060: done 2195 games, mean reward -49.960, eps 0.02, speed 536.61 f/s
161112: done 2196 games, mean reward -49.960, eps 0.02, speed 546.92 f/s
161162: done 2197 games, mean reward -49.960, eps 0.02, speed 491.63 f/s
161213: done 2198 games, mean reward -49.960, eps 0

166358: done 2299 games, mean reward -49.920, eps 0.02, speed 502.47 f/s
166408: done 2300 games, mean reward -49.920, eps 0.02, speed 527.43 f/s
166460: done 2301 games, mean reward -49.920, eps 0.02, speed 549.01 f/s
166512: done 2302 games, mean reward -49.920, eps 0.02, speed 512.18 f/s
166563: done 2303 games, mean reward -49.920, eps 0.02, speed 536.18 f/s
166614: done 2304 games, mean reward -49.920, eps 0.02, speed 536.84 f/s
166664: done 2305 games, mean reward -49.920, eps 0.02, speed 491.60 f/s
166714: done 2306 games, mean reward -49.920, eps 0.02, speed 525.45 f/s
166765: done 2307 games, mean reward -49.920, eps 0.02, speed 535.66 f/s
166816: done 2308 games, mean reward -49.920, eps 0.02, speed 503.29 f/s
166867: done 2309 games, mean reward -49.910, eps 0.02, speed 533.12 f/s
166918: done 2310 games, mean reward -49.910, eps 0.02, speed 479.99 f/s
166968: done 2311 games, mean reward -49.910, eps 0.02, speed 494.92 f/s
167019: done 2312 games, mean reward -49.910, eps 0

172190: done 2413 games, mean reward -49.910, eps 0.02, speed 498.77 f/s
172240: done 2414 games, mean reward -49.910, eps 0.02, speed 541.32 f/s
172292: done 2415 games, mean reward -49.910, eps 0.02, speed 566.65 f/s
172342: done 2416 games, mean reward -49.910, eps 0.02, speed 502.81 f/s
172395: done 2417 games, mean reward -49.920, eps 0.02, speed 572.98 f/s
172446: done 2418 games, mean reward -49.920, eps 0.02, speed 553.90 f/s
172497: done 2419 games, mean reward -49.930, eps 0.02, speed 513.49 f/s
172547: done 2420 games, mean reward -49.930, eps 0.02, speed 540.96 f/s
172597: done 2421 games, mean reward -49.930, eps 0.02, speed 543.85 f/s
172649: done 2422 games, mean reward -49.930, eps 0.02, speed 523.01 f/s
172699: done 2423 games, mean reward -49.930, eps 0.02, speed 543.37 f/s
172749: done 2424 games, mean reward -49.930, eps 0.02, speed 543.90 f/s
172799: done 2425 games, mean reward -49.930, eps 0.02, speed 501.54 f/s
172850: done 2426 games, mean reward -49.930, eps 0

177997: done 2527 games, mean reward -49.940, eps 0.02, speed 504.57 f/s
178048: done 2528 games, mean reward -49.940, eps 0.02, speed 538.56 f/s
178100: done 2529 games, mean reward -49.940, eps 0.02, speed 548.05 f/s
178153: done 2530 games, mean reward -49.940, eps 0.02, speed 474.85 f/s
178206: done 2531 games, mean reward -49.940, eps 0.02, speed 528.49 f/s
178259: done 2532 games, mean reward -49.940, eps 0.02, speed 538.79 f/s
178309: done 2533 games, mean reward -49.940, eps 0.02, speed 501.93 f/s
178359: done 2534 games, mean reward -49.940, eps 0.02, speed 543.72 f/s
178410: done 2535 games, mean reward -49.940, eps 0.02, speed 555.05 f/s
178460: done 2536 games, mean reward -49.940, eps 0.02, speed 504.68 f/s
178510: done 2537 games, mean reward -49.940, eps 0.02, speed 541.78 f/s
178561: done 2538 games, mean reward -49.940, eps 0.02, speed 545.64 f/s
178611: done 2539 games, mean reward -49.950, eps 0.02, speed 497.65 f/s
178661: done 2540 games, mean reward -49.950, eps 0

183811: done 2641 games, mean reward -49.930, eps 0.02, speed 493.83 f/s
183864: done 2642 games, mean reward -49.930, eps 0.02, speed 581.49 f/s
183915: done 2643 games, mean reward -49.930, eps 0.02, speed 552.26 f/s
183967: done 2644 games, mean reward -49.930, eps 0.02, speed 526.18 f/s
184018: done 2645 games, mean reward -49.930, eps 0.02, speed 548.42 f/s
184069: done 2646 games, mean reward -49.930, eps 0.02, speed 554.88 f/s
184121: done 2647 games, mean reward -49.930, eps 0.02, speed 523.30 f/s
184171: done 2648 games, mean reward -49.930, eps 0.02, speed 542.54 f/s
184222: done 2649 games, mean reward -49.930, eps 0.02, speed 557.00 f/s
184274: done 2650 games, mean reward -49.930, eps 0.02, speed 525.52 f/s
184325: done 2651 games, mean reward -49.930, eps 0.02, speed 553.76 f/s
184377: done 2652 games, mean reward -49.930, eps 0.02, speed 565.96 f/s
184429: done 2653 games, mean reward -49.930, eps 0.02, speed 520.22 f/s
184480: done 2654 games, mean reward -49.930, eps 0

189637: done 2755 games, mean reward -49.920, eps 0.02, speed 494.64 f/s
189689: done 2756 games, mean reward -49.920, eps 0.02, speed 563.54 f/s
189739: done 2757 games, mean reward -49.920, eps 0.02, speed 535.25 f/s
189789: done 2758 games, mean reward -49.920, eps 0.02, speed 498.63 f/s
189840: done 2759 games, mean reward -49.920, eps 0.02, speed 548.13 f/s
189891: done 2760 games, mean reward -49.920, eps 0.02, speed 555.92 f/s
189943: done 2761 games, mean reward -49.920, eps 0.02, speed 516.75 f/s
189993: done 2762 games, mean reward -49.920, eps 0.02, speed 541.78 f/s
190046: done 2763 games, mean reward -49.920, eps 0.02, speed 574.77 f/s
190097: done 2764 games, mean reward -49.920, eps 0.02, speed 515.69 f/s
190148: done 2765 games, mean reward -49.920, eps 0.02, speed 553.92 f/s
190198: done 2766 games, mean reward -49.920, eps 0.02, speed 543.64 f/s
190250: done 2767 games, mean reward -49.940, eps 0.02, speed 483.56 f/s
190300: done 2768 games, mean reward -49.940, eps 0

195463: done 2869 games, mean reward -49.930, eps 0.02, speed 502.14 f/s
195514: done 2870 games, mean reward -49.930, eps 0.02, speed 551.92 f/s
195564: done 2871 games, mean reward -49.930, eps 0.02, speed 544.66 f/s
195615: done 2872 games, mean reward -49.930, eps 0.02, speed 510.53 f/s
195665: done 2873 games, mean reward -49.930, eps 0.02, speed 542.17 f/s
195716: done 2874 games, mean reward -49.930, eps 0.02, speed 555.77 f/s
195768: done 2875 games, mean reward -49.920, eps 0.02, speed 522.83 f/s
195820: done 2876 games, mean reward -49.920, eps 0.02, speed 564.45 f/s
195870: done 2877 games, mean reward -49.920, eps 0.02, speed 545.47 f/s
195920: done 2878 games, mean reward -49.920, eps 0.02, speed 502.12 f/s
195971: done 2879 games, mean reward -49.920, eps 0.02, speed 552.72 f/s
196022: done 2880 games, mean reward -49.920, eps 0.02, speed 553.83 f/s
196072: done 2881 games, mean reward -49.920, eps 0.02, speed 498.40 f/s
196124: done 2882 games, mean reward -49.920, eps 0

201278: done 2983 games, mean reward -49.930, eps 0.02, speed 519.06 f/s
201329: done 2984 games, mean reward -49.930, eps 0.02, speed 537.57 f/s
201379: done 2985 games, mean reward -49.930, eps 0.02, speed 530.17 f/s
201429: done 2986 games, mean reward -49.930, eps 0.02, speed 495.91 f/s
201479: done 2987 games, mean reward -49.930, eps 0.02, speed 527.53 f/s
201530: done 2988 games, mean reward -49.930, eps 0.02, speed 540.59 f/s
201580: done 2989 games, mean reward -49.930, eps 0.02, speed 494.41 f/s
201632: done 2990 games, mean reward -49.930, eps 0.02, speed 550.10 f/s
201683: done 2991 games, mean reward -49.930, eps 0.02, speed 539.86 f/s
201738: done 2992 games, mean reward -49.930, eps 0.02, speed 531.89 f/s
201788: done 2993 games, mean reward -49.930, eps 0.02, speed 524.31 f/s
201838: done 2994 games, mean reward -49.930, eps 0.02, speed 525.94 f/s
201893: done 2995 games, mean reward -49.930, eps 0.02, speed 543.82 f/s
201944: done 2996 games, mean reward -49.930, eps 0

207081: done 3097 games, mean reward -49.960, eps 0.02, speed 504.32 f/s
207131: done 3098 games, mean reward -49.960, eps 0.02, speed 541.17 f/s
207183: done 3099 games, mean reward -49.950, eps 0.02, speed 565.20 f/s
207234: done 3100 games, mean reward -49.960, eps 0.02, speed 513.03 f/s
207287: done 3101 games, mean reward -49.960, eps 0.02, speed 572.20 f/s
207339: done 3102 games, mean reward -49.950, eps 0.02, speed 565.01 f/s
207389: done 3103 games, mean reward -49.950, eps 0.02, speed 503.86 f/s
207440: done 3104 games, mean reward -49.940, eps 0.02, speed 554.54 f/s
207490: done 3105 games, mean reward -49.940, eps 0.02, speed 545.67 f/s
207541: done 3106 games, mean reward -49.940, eps 0.02, speed 514.03 f/s
207592: done 3107 games, mean reward -49.940, eps 0.02, speed 551.89 f/s
207642: done 3108 games, mean reward -49.940, eps 0.02, speed 544.38 f/s
207692: done 3109 games, mean reward -49.940, eps 0.02, speed 504.30 f/s
207744: done 3110 games, mean reward -49.940, eps 0

212892: done 3211 games, mean reward -49.940, eps 0.02, speed 503.88 f/s
212943: done 3212 games, mean reward -49.940, eps 0.02, speed 533.98 f/s
212993: done 3213 games, mean reward -49.940, eps 0.02, speed 529.06 f/s
213045: done 3214 games, mean reward -49.940, eps 0.02, speed 513.72 f/s
213096: done 3215 games, mean reward -49.940, eps 0.02, speed 537.28 f/s
213146: done 3216 games, mean reward -49.940, eps 0.02, speed 526.67 f/s
213197: done 3217 games, mean reward -49.940, eps 0.02, speed 504.30 f/s
213247: done 3218 games, mean reward -49.940, eps 0.02, speed 527.43 f/s
213297: done 3219 games, mean reward -49.940, eps 0.02, speed 529.85 f/s
213349: done 3220 games, mean reward -49.940, eps 0.02, speed 511.11 f/s
213401: done 3221 games, mean reward -49.940, eps 0.02, speed 539.37 f/s
213451: done 3222 games, mean reward -49.940, eps 0.02, speed 526.50 f/s
213502: done 3223 games, mean reward -49.950, eps 0.02, speed 503.27 f/s
213552: done 3224 games, mean reward -49.950, eps 0

218709: done 3325 games, mean reward -49.920, eps 0.02, speed 498.88 f/s
218759: done 3326 games, mean reward -49.920, eps 0.02, speed 541.91 f/s
218809: done 3327 games, mean reward -49.920, eps 0.02, speed 542.16 f/s
218859: done 3328 games, mean reward -49.920, eps 0.02, speed 498.84 f/s
218910: done 3329 games, mean reward -49.920, eps 0.02, speed 552.31 f/s
218962: done 3330 games, mean reward -49.920, eps 0.02, speed 559.67 f/s
219014: done 3331 games, mean reward -49.920, eps 0.02, speed 519.19 f/s
219066: done 3332 games, mean reward -49.920, eps 0.02, speed 564.47 f/s
219117: done 3333 games, mean reward -49.920, eps 0.02, speed 553.62 f/s
219170: done 3334 games, mean reward -49.920, eps 0.02, speed 527.81 f/s
219220: done 3335 games, mean reward -49.920, eps 0.02, speed 538.33 f/s
219271: done 3336 games, mean reward -49.910, eps 0.02, speed 553.69 f/s
219324: done 3337 games, mean reward -49.910, eps 0.02, speed 525.95 f/s
219375: done 3338 games, mean reward -49.910, eps 0

224560: done 3440 games, mean reward -49.920, eps 0.02, speed 503.88 f/s
224610: done 3441 games, mean reward -49.920, eps 0.02, speed 527.70 f/s
224661: done 3442 games, mean reward -49.920, eps 0.02, speed 537.08 f/s
224711: done 3443 games, mean reward -49.920, eps 0.02, speed 496.11 f/s
224763: done 3444 games, mean reward -49.920, eps 0.02, speed 547.73 f/s
224815: done 3445 games, mean reward -49.920, eps 0.02, speed 550.18 f/s
224866: done 3446 games, mean reward -49.920, eps 0.02, speed 498.47 f/s
224916: done 3447 games, mean reward -49.920, eps 0.02, speed 527.53 f/s
224967: done 3448 games, mean reward -49.900, eps 0.02, speed 537.69 f/s
225019: done 3449 games, mean reward -49.900, eps 0.02, speed 513.97 f/s
225072: done 3450 games, mean reward -49.900, eps 0.02, speed 558.76 f/s
225122: done 3451 games, mean reward -49.900, eps 0.02, speed 527.51 f/s
225173: done 3452 games, mean reward -49.900, eps 0.02, speed 500.57 f/s
225225: done 3453 games, mean reward -49.900, eps 0

230370: done 3554 games, mean reward -49.940, eps 0.02, speed 492.21 f/s
230422: done 3555 games, mean reward -49.940, eps 0.02, speed 547.24 f/s
230475: done 3556 games, mean reward -49.940, eps 0.02, speed 559.32 f/s
230526: done 3557 games, mean reward -49.940, eps 0.02, speed 505.64 f/s
230578: done 3558 games, mean reward -49.940, eps 0.02, speed 549.84 f/s
230629: done 3559 games, mean reward -49.940, eps 0.02, speed 541.06 f/s
230680: done 3560 games, mean reward -49.940, eps 0.02, speed 502.88 f/s
230730: done 3561 games, mean reward -49.940, eps 0.02, speed 529.58 f/s
230780: done 3562 games, mean reward -49.940, eps 0.02, speed 540.17 f/s
230832: done 3563 games, mean reward -49.940, eps 0.02, speed 522.37 f/s
230883: done 3564 games, mean reward -49.940, eps 0.02, speed 539.18 f/s
230933: done 3565 games, mean reward -49.940, eps 0.02, speed 537.24 f/s
230985: done 3566 games, mean reward -49.940, eps 0.02, speed 513.77 f/s
231035: done 3567 games, mean reward -49.930, eps 0

236198: done 3668 games, mean reward -49.410, eps 0.02, speed 490.45 f/s
236250: done 3669 games, mean reward -49.410, eps 0.02, speed 546.53 f/s
236304: done 3670 games, mean reward -49.410, eps 0.02, speed 564.26 f/s
236354: done 3671 games, mean reward -49.410, eps 0.02, speed 493.64 f/s
236404: done 3672 games, mean reward -49.410, eps 0.02, speed 526.17 f/s
236454: done 3673 games, mean reward -49.410, eps 0.02, speed 527.57 f/s
236505: done 3674 games, mean reward -49.410, eps 0.02, speed 499.89 f/s
236557: done 3675 games, mean reward -49.410, eps 0.02, speed 549.81 f/s
236607: done 3676 games, mean reward -49.410, eps 0.02, speed 528.76 f/s
236658: done 3677 games, mean reward -49.410, eps 0.02, speed 504.20 f/s
236708: done 3678 games, mean reward -49.410, eps 0.02, speed 527.26 f/s
236759: done 3679 games, mean reward -49.410, eps 0.02, speed 536.76 f/s
236809: done 3680 games, mean reward -49.410, eps 0.02, speed 495.85 f/s
236861: done 3681 games, mean reward -49.410, eps 0

242023: done 3782 games, mean reward -49.390, eps 0.02, speed 501.86 f/s
242073: done 3783 games, mean reward -49.390, eps 0.02, speed 536.66 f/s
242124: done 3784 games, mean reward -49.390, eps 0.02, speed 544.57 f/s
242176: done 3785 games, mean reward -49.390, eps 0.02, speed 509.29 f/s
242227: done 3786 games, mean reward -49.390, eps 0.02, speed 545.47 f/s
242277: done 3787 games, mean reward -49.390, eps 0.02, speed 528.66 f/s
242330: done 3788 games, mean reward -49.390, eps 0.02, speed 512.49 f/s
242381: done 3789 games, mean reward -49.390, eps 0.02, speed 536.32 f/s
242432: done 3790 games, mean reward -49.400, eps 0.02, speed 540.37 f/s
242483: done 3791 games, mean reward -49.400, eps 0.02, speed 504.45 f/s
242534: done 3792 games, mean reward -49.400, eps 0.02, speed 536.95 f/s
242584: done 3793 games, mean reward -49.400, eps 0.02, speed 525.73 f/s
242634: done 3794 games, mean reward -49.400, eps 0.02, speed 489.36 f/s
242685: done 3795 games, mean reward -49.400, eps 0

247837: done 3896 games, mean reward -49.460, eps 0.02, speed 495.24 f/s
247888: done 3897 games, mean reward -49.460, eps 0.02, speed 524.76 f/s
247939: done 3898 games, mean reward -49.460, eps 0.02, speed 538.65 f/s
247989: done 3899 games, mean reward -49.460, eps 0.02, speed 495.99 f/s
248039: done 3900 games, mean reward -49.460, eps 0.02, speed 528.22 f/s
248091: done 3901 games, mean reward -49.460, eps 0.02, speed 548.80 f/s
248142: done 3902 games, mean reward -49.440, eps 0.02, speed 503.70 f/s
248193: done 3903 games, mean reward -49.440, eps 0.02, speed 537.45 f/s
248243: done 3904 games, mean reward -49.940, eps 0.02, speed 528.83 f/s
248297: done 3905 games, mean reward -49.940, eps 0.02, speed 530.14 f/s
248348: done 3906 games, mean reward -49.940, eps 0.02, speed 535.79 f/s
248400: done 3907 games, mean reward -49.940, eps 0.02, speed 547.33 f/s
248453: done 3908 games, mean reward -49.940, eps 0.02, speed 524.65 f/s
248504: done 3909 games, mean reward -49.940, eps 0

253649: done 4010 games, mean reward -48.800, eps 0.02, speed 515.64 f/s
253700: done 4011 games, mean reward -48.800, eps 0.02, speed 550.52 f/s
253750: done 4012 games, mean reward -48.800, eps 0.02, speed 538.46 f/s
253801: done 4013 games, mean reward -48.800, eps 0.02, speed 509.54 f/s
253851: done 4014 games, mean reward -48.800, eps 0.02, speed 542.40 f/s
253902: done 4015 games, mean reward -48.780, eps 0.02, speed 556.35 f/s
253953: done 4016 games, mean reward -48.780, eps 0.02, speed 517.47 f/s
254004: done 4017 games, mean reward -48.780, eps 0.02, speed 554.41 f/s
254055: done 4018 games, mean reward -48.780, eps 0.02, speed 552.27 f/s
254106: done 4019 games, mean reward -48.780, eps 0.02, speed 510.63 f/s
254156: done 4020 games, mean reward -48.780, eps 0.02, speed 544.12 f/s
254206: done 4021 games, mean reward -48.790, eps 0.02, speed 542.41 f/s
254261: done 4022 games, mean reward -48.790, eps 0.02, speed 548.45 f/s
254311: done 4023 games, mean reward -48.790, eps 0

259454: done 4124 games, mean reward -49.440, eps 0.02, speed 487.51 f/s
259505: done 4125 games, mean reward -49.440, eps 0.02, speed 535.30 f/s
259555: done 4126 games, mean reward -49.440, eps 0.02, speed 498.27 f/s
259607: done 4127 games, mean reward -49.440, eps 0.02, speed 504.05 f/s
259658: done 4128 games, mean reward -49.440, eps 0.02, speed 534.94 f/s
259709: done 4129 games, mean reward -49.440, eps 0.02, speed 536.44 f/s
259759: done 4130 games, mean reward -49.440, eps 0.02, speed 487.65 f/s
259811: done 4131 games, mean reward -49.440, eps 0.02, speed 546.55 f/s
259862: done 4132 games, mean reward -49.440, eps 0.02, speed 539.28 f/s
259913: done 4133 games, mean reward -49.440, eps 0.02, speed 500.91 f/s
259964: done 4134 games, mean reward -49.440, eps 0.02, speed 535.90 f/s
260014: done 4135 games, mean reward -49.440, eps 0.02, speed 528.18 f/s
260064: done 4136 games, mean reward -49.940, eps 0.02, speed 462.44 f/s
260116: done 4137 games, mean reward -49.940, eps 0

265210: done 4237 games, mean reward -49.470, eps 0.02, speed 494.27 f/s
265261: done 4238 games, mean reward -49.470, eps 0.02, speed 536.99 f/s
265312: done 4239 games, mean reward -49.470, eps 0.02, speed 538.05 f/s
265362: done 4240 games, mean reward -49.470, eps 0.02, speed 490.20 f/s
265413: done 4241 games, mean reward -49.470, eps 0.02, speed 536.64 f/s
265463: done 4242 games, mean reward -49.470, eps 0.02, speed 525.87 f/s
265513: done 4243 games, mean reward -49.470, eps 0.02, speed 491.96 f/s
265565: done 4244 games, mean reward -49.470, eps 0.02, speed 547.84 f/s
265615: done 4245 games, mean reward -49.470, eps 0.02, speed 527.35 f/s
265665: done 4246 games, mean reward -49.470, eps 0.02, speed 494.86 f/s
265717: done 4247 games, mean reward -49.470, eps 0.02, speed 546.79 f/s
265768: done 4248 games, mean reward -49.470, eps 0.02, speed 536.81 f/s
265819: done 4249 games, mean reward -49.470, eps 0.02, speed 498.68 f/s
265871: done 4250 games, mean reward -49.970, eps 0

271033: done 4351 games, mean reward -49.920, eps 0.02, speed 518.08 f/s
271084: done 4352 games, mean reward -49.920, eps 0.02, speed 553.39 f/s
271134: done 4353 games, mean reward -49.920, eps 0.02, speed 543.67 f/s
271185: done 4354 games, mean reward -49.930, eps 0.02, speed 518.97 f/s
271238: done 4355 games, mean reward -49.930, eps 0.02, speed 573.97 f/s
271290: done 4356 games, mean reward -49.930, eps 0.02, speed 563.46 f/s
271340: done 4357 games, mean reward -49.930, eps 0.02, speed 502.37 f/s
271390: done 4358 games, mean reward -49.930, eps 0.02, speed 541.29 f/s
271441: done 4359 games, mean reward -49.930, eps 0.02, speed 553.78 f/s
271492: done 4360 games, mean reward -49.930, eps 0.02, speed 510.51 f/s
271543: done 4361 games, mean reward -49.930, eps 0.02, speed 551.85 f/s
271593: done 4362 games, mean reward -49.930, eps 0.02, speed 527.23 f/s
271644: done 4363 games, mean reward -49.930, eps 0.02, speed 494.40 f/s
271694: done 4364 games, mean reward -49.930, eps 0

276853: done 4465 games, mean reward -49.900, eps 0.02, speed 491.63 f/s
276907: done 4466 games, mean reward -49.900, eps 0.02, speed 569.43 f/s
276959: done 4467 games, mean reward -49.900, eps 0.02, speed 550.53 f/s
277009: done 4468 games, mean reward -49.910, eps 0.02, speed 493.63 f/s
277060: done 4469 games, mean reward -49.910, eps 0.02, speed 536.33 f/s
277111: done 4470 games, mean reward -49.910, eps 0.02, speed 540.45 f/s
277162: done 4471 games, mean reward -49.910, eps 0.02, speed 502.82 f/s
277215: done 4472 games, mean reward -49.910, eps 0.02, speed 558.49 f/s
277267: done 4473 games, mean reward -49.920, eps 0.02, speed 549.52 f/s
277319: done 4474 games, mean reward -49.920, eps 0.02, speed 495.46 f/s
277370: done 4475 games, mean reward -49.920, eps 0.02, speed 539.02 f/s
277421: done 4476 games, mean reward -49.920, eps 0.02, speed 539.45 f/s
277472: done 4477 games, mean reward -49.920, eps 0.02, speed 500.74 f/s
277522: done 4478 games, mean reward -49.920, eps 0

282714: done 4580 games, mean reward -49.890, eps 0.02, speed 493.08 f/s
282765: done 4581 games, mean reward -49.890, eps 0.02, speed 531.38 f/s
282816: done 4582 games, mean reward -49.890, eps 0.02, speed 537.78 f/s
282866: done 4583 games, mean reward -49.900, eps 0.02, speed 485.62 f/s
282917: done 4584 games, mean reward -49.900, eps 0.02, speed 535.94 f/s
282969: done 4585 games, mean reward -49.900, eps 0.02, speed 547.03 f/s
283020: done 4586 games, mean reward -49.900, eps 0.02, speed 504.67 f/s
283070: done 4587 games, mean reward -49.900, eps 0.02, speed 525.19 f/s
283121: done 4588 games, mean reward -49.900, eps 0.02, speed 538.37 f/s
283173: done 4589 games, mean reward -49.900, eps 0.02, speed 506.25 f/s
283224: done 4590 games, mean reward -49.900, eps 0.02, speed 538.09 f/s
283275: done 4591 games, mean reward -49.900, eps 0.02, speed 536.49 f/s
283325: done 4592 games, mean reward -49.900, eps 0.02, speed 495.44 f/s
283376: done 4593 games, mean reward -49.900, eps 0

288520: done 4694 games, mean reward -49.880, eps 0.02, speed 489.92 f/s
288571: done 4695 games, mean reward -49.880, eps 0.02, speed 550.19 f/s
288623: done 4696 games, mean reward -49.880, eps 0.02, speed 563.55 f/s
288674: done 4697 games, mean reward -49.880, eps 0.02, speed 510.60 f/s
288725: done 4698 games, mean reward -49.880, eps 0.02, speed 551.35 f/s
288776: done 4699 games, mean reward -49.880, eps 0.02, speed 552.42 f/s
288827: done 4700 games, mean reward -49.880, eps 0.02, speed 510.96 f/s
288877: done 4701 games, mean reward -49.880, eps 0.02, speed 539.89 f/s
288928: done 4702 games, mean reward -49.880, eps 0.02, speed 552.60 f/s
288980: done 4703 games, mean reward -49.910, eps 0.02, speed 519.77 f/s
289030: done 4704 games, mean reward -49.910, eps 0.02, speed 542.36 f/s
289080: done 4705 games, mean reward -49.910, eps 0.02, speed 535.36 f/s
289134: done 4706 games, mean reward -49.900, eps 0.02, speed 535.12 f/s
289185: done 4707 games, mean reward -49.900, eps 0

294327: done 4808 games, mean reward -49.980, eps 0.02, speed 494.13 f/s
294377: done 4809 games, mean reward -49.980, eps 0.02, speed 526.95 f/s
294428: done 4810 games, mean reward -49.980, eps 0.02, speed 538.71 f/s
294479: done 4811 games, mean reward -49.980, eps 0.02, speed 504.09 f/s
294530: done 4812 games, mean reward -49.970, eps 0.02, speed 537.75 f/s
294580: done 4813 games, mean reward -49.970, eps 0.02, speed 529.32 f/s
294631: done 4814 games, mean reward -49.950, eps 0.02, speed 500.18 f/s
294683: done 4815 games, mean reward -49.950, eps 0.02, speed 548.59 f/s
294736: done 4816 games, mean reward -49.950, eps 0.02, speed 559.11 f/s
294786: done 4817 games, mean reward -49.950, eps 0.02, speed 493.68 f/s
294836: done 4818 games, mean reward -49.950, eps 0.02, speed 527.13 f/s
294888: done 4819 games, mean reward -49.960, eps 0.02, speed 558.31 f/s
294938: done 4820 games, mean reward -49.960, eps 0.02, speed 494.20 f/s
294990: done 4821 games, mean reward -49.960, eps 0

300147: done 4922 games, mean reward -49.390, eps 0.02, speed 515.72 f/s
300197: done 4923 games, mean reward -49.410, eps 0.02, speed 552.09 f/s
300249: done 4924 games, mean reward -49.410, eps 0.02, speed 574.21 f/s
300299: done 4925 games, mean reward -49.410, eps 0.02, speed 504.34 f/s
300349: done 4926 games, mean reward -49.410, eps 0.02, speed 552.17 f/s
300403: done 4927 games, mean reward -49.410, eps 0.02, speed 595.31 f/s
300455: done 4928 games, mean reward -48.980, eps 0.02, speed 528.50 f/s
300506: done 4929 games, mean reward -48.980, eps 0.02, speed 562.31 f/s
300557: done 4930 games, mean reward -48.980, eps 0.02, speed 562.58 f/s
300607: done 4931 games, mean reward -48.980, eps 0.02, speed 514.90 f/s
300661: done 4932 games, mean reward -49.000, eps 0.02, speed 592.32 f/s
300714: done 4933 games, mean reward -49.000, eps 0.02, speed 577.06 f/s
300765: done 4934 games, mean reward -49.000, eps 0.02, speed 515.61 f/s
300816: done 4935 games, mean reward -49.000, eps 0

305950: done 5036 games, mean reward -49.610, eps 0.02, speed 515.52 f/s
306001: done 5037 games, mean reward -49.610, eps 0.02, speed 561.74 f/s
306052: done 5038 games, mean reward -49.990, eps 0.02, speed 562.63 f/s
306104: done 5039 games, mean reward -49.990, eps 0.02, speed 530.40 f/s
306156: done 5040 games, mean reward -49.990, eps 0.02, speed 572.28 f/s
306206: done 5041 games, mean reward -49.990, eps 0.02, speed 554.26 f/s
306258: done 5042 games, mean reward -49.990, eps 0.02, speed 533.03 f/s
306309: done 5043 games, mean reward -49.990, eps 0.02, speed 564.94 f/s
306359: done 5044 games, mean reward -49.990, eps 0.02, speed 555.30 f/s
306411: done 5045 games, mean reward -49.990, eps 0.02, speed 522.87 f/s
306462: done 5046 games, mean reward -49.990, eps 0.02, speed 563.74 f/s
306512: done 5047 games, mean reward -49.990, eps 0.02, speed 553.68 f/s
306562: done 5048 games, mean reward -49.990, eps 0.02, speed 508.09 f/s
306612: done 5049 games, mean reward -49.990, eps 0

311793: done 5151 games, mean reward -49.000, eps 0.02, speed 442.56 f/s
311844: done 5152 games, mean reward -49.000, eps 0.02, speed 540.35 f/s
311896: done 5153 games, mean reward -49.000, eps 0.02, speed 553.08 f/s
311946: done 5154 games, mean reward -49.000, eps 0.02, speed 473.82 f/s
311997: done 5155 games, mean reward -49.000, eps 0.02, speed 535.69 f/s
312047: done 5156 games, mean reward -49.000, eps 0.02, speed 518.72 f/s
312098: done 5157 games, mean reward -49.000, eps 0.02, speed 449.73 f/s
312148: done 5158 games, mean reward -48.500, eps 0.02, speed 521.84 f/s
312199: done 5159 games, mean reward -48.500, eps 0.02, speed 531.35 f/s
312249: done 5160 games, mean reward -48.500, eps 0.02, speed 488.22 f/s
312302: done 5161 games, mean reward -48.500, eps 0.02, speed 555.25 f/s
312352: done 5162 games, mean reward -48.500, eps 0.02, speed 520.86 f/s
312403: done 5163 games, mean reward -48.500, eps 0.02, speed 489.45 f/s
312454: done 5164 games, mean reward -48.500, eps 0

317637: done 5266 games, mean reward -49.400, eps 0.02, speed 548.77 f/s
317688: done 5267 games, mean reward -49.400, eps 0.02, speed 548.03 f/s
317739: done 5268 games, mean reward -49.400, eps 0.02, speed 550.44 f/s
317789: done 5269 games, mean reward -49.400, eps 0.02, speed 517.93 f/s
317842: done 5270 games, mean reward -49.400, eps 0.02, speed 555.54 f/s
317893: done 5271 games, mean reward -49.400, eps 0.02, speed 504.60 f/s
317945: done 5272 games, mean reward -49.400, eps 0.02, speed 531.06 f/s
317996: done 5273 games, mean reward -49.400, eps 0.02, speed 533.55 f/s
318050: done 5274 games, mean reward -49.400, eps 0.02, speed 566.82 f/s
318101: done 5275 games, mean reward -49.400, eps 0.02, speed 531.72 f/s
318152: done 5276 games, mean reward -49.400, eps 0.02, speed 544.76 f/s
318203: done 5277 games, mean reward -49.400, eps 0.02, speed 543.97 f/s
318255: done 5278 games, mean reward -49.400, eps 0.02, speed 540.48 f/s
318305: done 5279 games, mean reward -49.400, eps 0

323458: done 5380 games, mean reward -49.450, eps 0.02, speed 529.49 f/s
323508: done 5381 games, mean reward -49.450, eps 0.02, speed 525.38 f/s
323560: done 5382 games, mean reward -49.450, eps 0.02, speed 547.61 f/s
323611: done 5383 games, mean reward -49.450, eps 0.02, speed 532.02 f/s
323662: done 5384 games, mean reward -49.450, eps 0.02, speed 523.98 f/s
323716: done 5385 games, mean reward -49.450, eps 0.02, speed 566.00 f/s
323767: done 5386 games, mean reward -49.450, eps 0.02, speed 531.84 f/s
323817: done 5387 games, mean reward -49.450, eps 0.02, speed 474.84 f/s
323868: done 5388 games, mean reward -49.450, eps 0.02, speed 533.00 f/s
323918: done 5389 games, mean reward -49.450, eps 0.02, speed 515.08 f/s
323968: done 5390 games, mean reward -49.450, eps 0.02, speed 525.22 f/s
324018: done 5391 games, mean reward -49.450, eps 0.02, speed 521.47 f/s
324069: done 5392 games, mean reward -49.450, eps 0.02, speed 534.95 f/s
324119: done 5393 games, mean reward -49.450, eps 0

329211: done 5493 games, mean reward -49.990, eps 0.02, speed 487.20 f/s
329261: done 5494 games, mean reward -49.990, eps 0.02, speed 535.72 f/s
329313: done 5495 games, mean reward -49.990, eps 0.02, speed 529.90 f/s
329364: done 5496 games, mean reward -49.990, eps 0.02, speed 549.61 f/s
329414: done 5497 games, mean reward -49.990, eps 0.02, speed 549.20 f/s
329465: done 5498 games, mean reward -49.990, eps 0.02, speed 561.94 f/s
329515: done 5499 games, mean reward -49.990, eps 0.02, speed 539.96 f/s
329565: done 5500 games, mean reward -49.990, eps 0.02, speed 550.41 f/s
329617: done 5501 games, mean reward -49.990, eps 0.02, speed 572.65 f/s
329667: done 5502 games, mean reward -49.990, eps 0.02, speed 542.53 f/s
329717: done 5503 games, mean reward -49.990, eps 0.02, speed 519.65 f/s
329767: done 5504 games, mean reward -49.990, eps 0.02, speed 550.85 f/s
329817: done 5505 games, mean reward -49.990, eps 0.02, speed 538.80 f/s
329869: done 5506 games, mean reward -49.990, eps 0

334968: done 5606 games, mean reward -49.980, eps 0.02, speed 540.23 f/s
335019: done 5607 games, mean reward -49.980, eps 0.02, speed 549.73 f/s
335069: done 5608 games, mean reward -49.980, eps 0.02, speed 496.58 f/s
335119: done 5609 games, mean reward -49.980, eps 0.02, speed 528.57 f/s
335170: done 5610 games, mean reward -49.980, eps 0.02, speed 548.76 f/s
335220: done 5611 games, mean reward -49.980, eps 0.02, speed 539.49 f/s
335271: done 5612 games, mean reward -49.980, eps 0.02, speed 538.70 f/s
335322: done 5613 games, mean reward -49.980, eps 0.02, speed 551.74 f/s
335372: done 5614 games, mean reward -49.980, eps 0.02, speed 540.28 f/s
335423: done 5615 games, mean reward -49.980, eps 0.02, speed 542.67 f/s
335474: done 5616 games, mean reward -49.960, eps 0.02, speed 554.23 f/s
335525: done 5617 games, mean reward -49.960, eps 0.02, speed 464.74 f/s
335575: done 5618 games, mean reward -49.960, eps 0.02, speed 494.72 f/s
335625: done 5619 games, mean reward -49.960, eps 0

340811: done 5721 games, mean reward -49.900, eps 0.02, speed 530.90 f/s
340862: done 5722 games, mean reward -49.900, eps 0.02, speed 534.27 f/s
340913: done 5723 games, mean reward -49.880, eps 0.02, speed 457.30 f/s
340963: done 5724 games, mean reward -49.880, eps 0.02, speed 524.61 f/s
341015: done 5725 games, mean reward -49.880, eps 0.02, speed 546.36 f/s
341069: done 5726 games, mean reward -49.880, eps 0.02, speed 558.87 f/s
341120: done 5727 games, mean reward -49.880, eps 0.02, speed 534.76 f/s
341170: done 5728 games, mean reward -49.880, eps 0.02, speed 524.58 f/s
341222: done 5729 games, mean reward -49.880, eps 0.02, speed 538.61 f/s
341273: done 5730 games, mean reward -49.880, eps 0.02, speed 537.15 f/s
341323: done 5731 games, mean reward -49.880, eps 0.02, speed 526.20 f/s
341374: done 5732 games, mean reward -49.880, eps 0.02, speed 531.01 f/s
341425: done 5733 games, mean reward -49.880, eps 0.02, speed 498.84 f/s
341476: done 5734 games, mean reward -49.880, eps 0

346668: done 5836 games, mean reward -49.460, eps 0.02, speed 543.66 f/s
346718: done 5837 games, mean reward -49.460, eps 0.02, speed 541.44 f/s
346770: done 5838 games, mean reward -49.460, eps 0.02, speed 495.19 f/s
346820: done 5839 games, mean reward -49.460, eps 0.02, speed 530.12 f/s
346871: done 5840 games, mean reward -49.460, eps 0.02, speed 548.88 f/s
346921: done 5841 games, mean reward -49.460, eps 0.02, speed 540.40 f/s
346972: done 5842 games, mean reward -49.460, eps 0.02, speed 538.69 f/s
347024: done 5843 games, mean reward -49.460, eps 0.02, speed 559.98 f/s
347075: done 5844 games, mean reward -49.470, eps 0.02, speed 550.40 f/s
347129: done 5845 games, mean reward -49.470, eps 0.02, speed 566.99 f/s
347182: done 5846 games, mean reward -49.470, eps 0.02, speed 569.45 f/s
347232: done 5847 games, mean reward -49.470, eps 0.02, speed 547.63 f/s
347283: done 5848 games, mean reward -49.470, eps 0.02, speed 519.75 f/s
347334: done 5849 games, mean reward -49.470, eps 0

352522: done 5951 games, mean reward -49.960, eps 0.02, speed 540.03 f/s
352575: done 5952 games, mean reward -49.960, eps 0.02, speed 578.66 f/s
352627: done 5953 games, mean reward -49.960, eps 0.02, speed 489.48 f/s
352679: done 5954 games, mean reward -49.960, eps 0.02, speed 560.27 f/s
352730: done 5955 games, mean reward -49.960, eps 0.02, speed 558.54 f/s
352781: done 5956 games, mean reward -49.960, eps 0.02, speed 559.92 f/s
352834: done 5957 games, mean reward -49.960, eps 0.02, speed 569.62 f/s
352886: done 5958 games, mean reward -49.960, eps 0.02, speed 570.54 f/s
352936: done 5959 games, mean reward -49.460, eps 0.02, speed 550.28 f/s
352987: done 5960 games, mean reward -49.460, eps 0.02, speed 553.99 f/s
353037: done 5961 games, mean reward -49.460, eps 0.02, speed 546.79 f/s
353087: done 5962 games, mean reward -49.460, eps 0.02, speed 550.48 f/s
353138: done 5963 games, mean reward -49.460, eps 0.02, speed 548.62 f/s
353189: done 5964 games, mean reward -49.460, eps 0

358287: done 6064 games, mean reward -49.980, eps 0.02, speed 542.01 f/s
358339: done 6065 games, mean reward -49.980, eps 0.02, speed 546.71 f/s
358391: done 6066 games, mean reward -49.980, eps 0.02, speed 546.68 f/s
358441: done 6067 games, mean reward -49.980, eps 0.02, speed 521.71 f/s
358492: done 6068 games, mean reward -49.980, eps 0.02, speed 535.85 f/s
358543: done 6069 games, mean reward -49.980, eps 0.02, speed 510.64 f/s
358595: done 6070 games, mean reward -49.980, eps 0.02, speed 541.75 f/s
358646: done 6071 games, mean reward -49.980, eps 0.02, speed 535.68 f/s
358697: done 6072 games, mean reward -49.980, eps 0.02, speed 537.19 f/s
358747: done 6073 games, mean reward -49.980, eps 0.02, speed 521.60 f/s
358797: done 6074 games, mean reward -49.980, eps 0.02, speed 525.06 f/s
358848: done 6075 games, mean reward -49.980, eps 0.02, speed 535.41 f/s
358901: done 6076 games, mean reward -49.980, eps 0.02, speed 551.54 f/s
358953: done 6077 games, mean reward -49.980, eps 0

364112: done 6178 games, mean reward -49.620, eps 0.02, speed 547.66 f/s
364162: done 6179 games, mean reward -49.620, eps 0.02, speed 549.55 f/s
364214: done 6180 games, mean reward -49.620, eps 0.02, speed 569.65 f/s
364264: done 6181 games, mean reward -49.620, eps 0.02, speed 538.84 f/s
364314: done 6182 games, mean reward -49.620, eps 0.02, speed 549.82 f/s
364365: done 6183 games, mean reward -49.620, eps 0.02, speed 551.66 f/s
364416: done 6184 games, mean reward -49.620, eps 0.02, speed 548.08 f/s
364466: done 6185 games, mean reward -49.620, eps 0.02, speed 526.17 f/s
364519: done 6186 games, mean reward -49.620, eps 0.02, speed 511.10 f/s
364569: done 6187 games, mean reward -49.620, eps 0.02, speed 507.39 f/s
364620: done 6188 games, mean reward -49.620, eps 0.02, speed 532.62 f/s
364670: done 6189 games, mean reward -49.620, eps 0.02, speed 528.24 f/s
364721: done 6190 games, mean reward -49.620, eps 0.02, speed 533.68 f/s
364771: done 6191 games, mean reward -49.620, eps 0

369933: done 6292 games, mean reward -49.490, eps 0.02, speed 538.95 f/s
369984: done 6293 games, mean reward -49.490, eps 0.02, speed 541.74 f/s
370040: done 6294 games, mean reward -49.490, eps 0.02, speed 575.15 f/s
370091: done 6295 games, mean reward -49.490, eps 0.02, speed 538.18 f/s
370142: done 6296 games, mean reward -49.490, eps 0.02, speed 542.93 f/s
370192: done 6297 games, mean reward -49.490, eps 0.02, speed 534.60 f/s
370243: done 6298 games, mean reward -49.490, eps 0.02, speed 538.32 f/s
370293: done 6299 games, mean reward -49.490, eps 0.02, speed 534.73 f/s
370344: done 6300 games, mean reward -49.490, eps 0.02, speed 543.67 f/s
370395: done 6301 games, mean reward -48.990, eps 0.02, speed 507.86 f/s
370450: done 6302 games, mean reward -48.990, eps 0.02, speed 586.33 f/s
370500: done 6303 games, mean reward -48.990, eps 0.02, speed 535.47 f/s
370552: done 6304 games, mean reward -48.990, eps 0.02, speed 550.53 f/s
370603: done 6305 games, mean reward -48.990, eps 0

375752: done 6406 games, mean reward -48.040, eps 0.02, speed 538.82 f/s
375802: done 6407 games, mean reward -48.040, eps 0.02, speed 520.58 f/s
375853: done 6408 games, mean reward -48.040, eps 0.02, speed 493.10 f/s
375903: done 6409 games, mean reward -48.490, eps 0.02, speed 523.23 f/s
375954: done 6410 games, mean reward -48.490, eps 0.02, speed 544.12 f/s
376007: done 6411 games, mean reward -48.490, eps 0.02, speed 565.45 f/s
376058: done 6412 games, mean reward -48.990, eps 0.02, speed 540.39 f/s
376108: done 6413 games, mean reward -48.490, eps 0.02, speed 534.63 f/s
376158: done 6414 games, mean reward -48.490, eps 0.02, speed 535.33 f/s
376208: done 6415 games, mean reward -48.490, eps 0.02, speed 527.43 f/s
376260: done 6416 games, mean reward -48.490, eps 0.02, speed 556.10 f/s
376310: done 6417 games, mean reward -48.490, eps 0.02, speed 536.85 f/s
376360: done 6418 games, mean reward -48.490, eps 0.02, speed 506.62 f/s
376412: done 6419 games, mean reward -48.490, eps 0

381563: done 6520 games, mean reward -49.070, eps 0.02, speed 551.84 f/s
381613: done 6521 games, mean reward -49.070, eps 0.02, speed 535.14 f/s
381666: done 6522 games, mean reward -49.070, eps 0.02, speed 574.04 f/s
381718: done 6523 games, mean reward -49.070, eps 0.02, speed 562.07 f/s
381768: done 6524 games, mean reward -49.070, eps 0.02, speed 551.99 f/s
381820: done 6525 games, mean reward -49.070, eps 0.02, speed 570.60 f/s
381870: done 6526 games, mean reward -49.070, eps 0.02, speed 536.08 f/s
381920: done 6527 games, mean reward -49.070, eps 0.02, speed 489.62 f/s
381970: done 6528 games, mean reward -49.070, eps 0.02, speed 550.00 f/s
382022: done 6529 games, mean reward -49.070, eps 0.02, speed 557.38 f/s
382074: done 6530 games, mean reward -49.070, eps 0.02, speed 569.55 f/s
382126: done 6531 games, mean reward -49.070, eps 0.02, speed 571.32 f/s
382178: done 6532 games, mean reward -49.070, eps 0.02, speed 562.88 f/s
382229: done 6533 games, mean reward -49.070, eps 0

387379: done 6634 games, mean reward -48.960, eps 0.02, speed 537.42 f/s
387432: done 6635 games, mean reward -48.960, eps 0.02, speed 564.24 f/s
387483: done 6636 games, mean reward -48.960, eps 0.02, speed 544.98 f/s
387535: done 6637 games, mean reward -48.960, eps 0.02, speed 547.71 f/s
387585: done 6638 games, mean reward -48.960, eps 0.02, speed 533.38 f/s
387635: done 6639 games, mean reward -48.960, eps 0.02, speed 534.49 f/s
387686: done 6640 games, mean reward -48.960, eps 0.02, speed 537.22 f/s
387736: done 6641 games, mean reward -48.960, eps 0.02, speed 534.73 f/s
387787: done 6642 games, mean reward -48.960, eps 0.02, speed 488.26 f/s
387837: done 6643 games, mean reward -48.960, eps 0.02, speed 527.79 f/s
387888: done 6644 games, mean reward -48.960, eps 0.02, speed 533.09 f/s
387939: done 6645 games, mean reward -48.960, eps 0.02, speed 547.44 f/s
387991: done 6646 games, mean reward -48.960, eps 0.02, speed 552.76 f/s
388041: done 6647 games, mean reward -48.960, eps 0

393144: done 6747 games, mean reward -49.040, eps 0.02, speed 479.90 f/s
393194: done 6748 games, mean reward -49.040, eps 0.02, speed 533.93 f/s
393245: done 6749 games, mean reward -49.040, eps 0.02, speed 542.81 f/s
393296: done 6750 games, mean reward -49.540, eps 0.02, speed 538.80 f/s
393347: done 6751 games, mean reward -49.540, eps 0.02, speed 544.54 f/s
393399: done 6752 games, mean reward -49.540, eps 0.02, speed 552.01 f/s
393452: done 6753 games, mean reward -49.540, eps 0.02, speed 560.99 f/s
393503: done 6754 games, mean reward -49.540, eps 0.02, speed 518.58 f/s
393553: done 6755 games, mean reward -49.540, eps 0.02, speed 539.89 f/s
393604: done 6756 games, mean reward -49.540, eps 0.02, speed 547.22 f/s
393656: done 6757 games, mean reward -49.540, eps 0.02, speed 568.02 f/s
393706: done 6758 games, mean reward -49.540, eps 0.02, speed 508.37 f/s
393757: done 6759 games, mean reward -49.540, eps 0.02, speed 540.62 f/s
393807: done 6760 games, mean reward -49.540, eps 0

398964: done 6861 games, mean reward -48.960, eps 0.02, speed 540.45 f/s
399015: done 6862 games, mean reward -48.960, eps 0.02, speed 543.63 f/s
399065: done 6863 games, mean reward -48.960, eps 0.02, speed 534.05 f/s
399115: done 6864 games, mean reward -48.960, eps 0.02, speed 528.87 f/s
399166: done 6865 games, mean reward -48.960, eps 0.02, speed 510.68 f/s
399216: done 6866 games, mean reward -48.960, eps 0.02, speed 535.05 f/s
399267: done 6867 games, mean reward -48.960, eps 0.02, speed 539.74 f/s
399319: done 6868 games, mean reward -48.960, eps 0.02, speed 554.02 f/s
399370: done 6869 games, mean reward -48.960, eps 0.02, speed 544.84 f/s
399422: done 6870 games, mean reward -48.730, eps 0.02, speed 549.40 f/s
399474: done 6871 games, mean reward -48.730, eps 0.02, speed 554.96 f/s
399526: done 6872 games, mean reward -48.730, eps 0.02, speed 555.64 f/s
399579: done 6873 games, mean reward -48.730, eps 0.02, speed 557.92 f/s
399631: done 6874 games, mean reward -48.730, eps 0

404787: done 6975 games, mean reward -48.500, eps 0.02, speed 520.29 f/s
404837: done 6976 games, mean reward -48.500, eps 0.02, speed 525.95 f/s
404889: done 6977 games, mean reward -48.500, eps 0.02, speed 548.06 f/s
404942: done 6978 games, mean reward -48.500, eps 0.02, speed 552.86 f/s
404993: done 6979 games, mean reward -48.500, eps 0.02, speed 536.95 f/s
405043: done 6980 games, mean reward -48.500, eps 0.02, speed 535.68 f/s
405095: done 6981 games, mean reward -48.500, eps 0.02, speed 550.53 f/s
405145: done 6982 games, mean reward -48.500, eps 0.02, speed 489.84 f/s
405196: done 6983 games, mean reward -48.500, eps 0.02, speed 546.88 f/s
405250: done 6984 games, mean reward -48.500, eps 0.02, speed 569.96 f/s
405302: done 6985 games, mean reward -48.500, eps 0.02, speed 527.10 f/s
405353: done 6986 games, mean reward -48.500, eps 0.02, speed 558.89 f/s
405404: done 6987 games, mean reward -48.500, eps 0.02, speed 546.72 f/s
405454: done 6988 games, mean reward -48.500, eps 0

410551: done 7088 games, mean reward -49.430, eps 0.02, speed 529.09 f/s
410602: done 7089 games, mean reward -49.430, eps 0.02, speed 546.69 f/s
410655: done 7090 games, mean reward -49.430, eps 0.02, speed 567.60 f/s
410706: done 7091 games, mean reward -49.430, eps 0.02, speed 535.87 f/s
410756: done 7092 games, mean reward -49.430, eps 0.02, speed 535.74 f/s
410807: done 7093 games, mean reward -49.430, eps 0.02, speed 545.69 f/s
410858: done 7094 games, mean reward -49.430, eps 0.02, speed 538.92 f/s
410909: done 7095 games, mean reward -49.430, eps 0.02, speed 545.52 f/s
410961: done 7096 games, mean reward -49.430, eps 0.02, speed 556.39 f/s
411013: done 7097 games, mean reward -49.430, eps 0.02, speed 545.96 f/s
411063: done 7098 games, mean reward -49.430, eps 0.02, speed 502.30 f/s
411116: done 7099 games, mean reward -49.430, eps 0.02, speed 566.53 f/s
411167: done 7100 games, mean reward -49.430, eps 0.02, speed 540.71 f/s
411218: done 7101 games, mean reward -49.430, eps 0

416358: done 7202 games, mean reward -49.000, eps 0.02, speed 529.54 f/s
416412: done 7203 games, mean reward -49.310, eps 0.02, speed 575.60 f/s
416464: done 7204 games, mean reward -49.310, eps 0.02, speed 506.22 f/s
416514: done 7205 games, mean reward -49.310, eps 0.02, speed 525.33 f/s
416564: done 7206 games, mean reward -49.310, eps 0.02, speed 532.28 f/s
416615: done 7207 games, mean reward -49.310, eps 0.02, speed 544.30 f/s
416665: done 7208 games, mean reward -49.310, eps 0.02, speed 528.25 f/s
416717: done 7209 games, mean reward -49.310, eps 0.02, speed 553.02 f/s
416768: done 7210 games, mean reward -49.310, eps 0.02, speed 544.69 f/s
416818: done 7211 games, mean reward -49.310, eps 0.02, speed 528.63 f/s
416870: done 7212 games, mean reward -49.310, eps 0.02, speed 554.70 f/s
416920: done 7213 games, mean reward -49.310, eps 0.02, speed 536.97 f/s
416970: done 7214 games, mean reward -49.310, eps 0.02, speed 510.41 f/s
417020: done 7215 games, mean reward -49.310, eps 0

422116: done 7315 games, mean reward -48.410, eps 0.02, speed 561.38 f/s
422168: done 7316 games, mean reward -48.410, eps 0.02, speed 571.78 f/s
422222: done 7317 games, mean reward -48.410, eps 0.02, speed 592.34 f/s
422273: done 7318 games, mean reward -48.410, eps 0.02, speed 487.87 f/s
422323: done 7319 games, mean reward -48.410, eps 0.02, speed 508.84 f/s
422373: done 7320 games, mean reward -48.410, eps 0.02, speed 513.43 f/s
422426: done 7321 games, mean reward -48.410, eps 0.02, speed 535.30 f/s
422477: done 7322 games, mean reward -48.410, eps 0.02, speed 558.28 f/s
422527: done 7323 games, mean reward -48.410, eps 0.02, speed 547.43 f/s
422577: done 7324 games, mean reward -48.410, eps 0.02, speed 539.12 f/s
422627: done 7325 games, mean reward -48.910, eps 0.02, speed 548.50 f/s
422677: done 7326 games, mean reward -48.910, eps 0.02, speed 533.83 f/s
422727: done 7327 games, mean reward -48.910, eps 0.02, speed 510.28 f/s
422777: done 7328 games, mean reward -48.910, eps 0

427932: done 7429 games, mean reward -50.000, eps 0.02, speed 549.53 f/s
427982: done 7430 games, mean reward -50.000, eps 0.02, speed 532.78 f/s
428032: done 7431 games, mean reward -50.000, eps 0.02, speed 533.85 f/s
428084: done 7432 games, mean reward -50.000, eps 0.02, speed 547.46 f/s
428134: done 7433 games, mean reward -50.000, eps 0.02, speed 523.59 f/s
428184: done 7434 games, mean reward -50.000, eps 0.02, speed 525.31 f/s
428236: done 7435 games, mean reward -50.000, eps 0.02, speed 551.21 f/s
428286: done 7436 games, mean reward -49.500, eps 0.02, speed 533.07 f/s
428337: done 7437 games, mean reward -49.500, eps 0.02, speed 496.81 f/s
428387: done 7438 games, mean reward -49.500, eps 0.02, speed 501.40 f/s
428438: done 7439 games, mean reward -49.500, eps 0.02, speed 558.50 f/s
428489: done 7440 games, mean reward -49.500, eps 0.02, speed 561.51 f/s
428540: done 7441 games, mean reward -49.500, eps 0.02, speed 521.25 f/s
428593: done 7442 games, mean reward -49.500, eps 0

433762: done 7543 games, mean reward -49.100, eps 0.02, speed 506.59 f/s
433812: done 7544 games, mean reward -49.100, eps 0.02, speed 536.16 f/s
433863: done 7545 games, mean reward -49.100, eps 0.02, speed 546.33 f/s
433914: done 7546 games, mean reward -49.100, eps 0.02, speed 539.73 f/s
433965: done 7547 games, mean reward -49.100, eps 0.02, speed 543.08 f/s
434017: done 7548 games, mean reward -49.100, eps 0.02, speed 556.56 f/s
434069: done 7549 games, mean reward -49.100, eps 0.02, speed 549.60 f/s
434123: done 7550 games, mean reward -49.100, eps 0.02, speed 576.25 f/s
434174: done 7551 games, mean reward -49.100, eps 0.02, speed 546.65 f/s
434225: done 7552 games, mean reward -49.100, eps 0.02, speed 538.91 f/s
434275: done 7553 games, mean reward -49.100, eps 0.02, speed 519.23 f/s
434327: done 7554 games, mean reward -49.100, eps 0.02, speed 534.83 f/s
434378: done 7555 games, mean reward -49.100, eps 0.02, speed 532.10 f/s
434431: done 7556 games, mean reward -49.100, eps 0

439585: done 7657 games, mean reward -49.000, eps 0.02, speed 529.67 f/s
439635: done 7658 games, mean reward -49.000, eps 0.02, speed 534.57 f/s
439685: done 7659 games, mean reward -49.000, eps 0.02, speed 483.96 f/s
439736: done 7660 games, mean reward -49.000, eps 0.02, speed 541.37 f/s
439786: done 7661 games, mean reward -49.000, eps 0.02, speed 532.72 f/s
439836: done 7662 games, mean reward -49.000, eps 0.02, speed 535.61 f/s
439887: done 7663 games, mean reward -49.000, eps 0.02, speed 536.16 f/s
439938: done 7664 games, mean reward -49.000, eps 0.02, speed 544.68 f/s
439991: done 7665 games, mean reward -49.000, eps 0.02, speed 567.00 f/s
440041: done 7666 games, mean reward -49.000, eps 0.02, speed 529.00 f/s
440093: done 7667 games, mean reward -49.000, eps 0.02, speed 554.92 f/s
440143: done 7668 games, mean reward -49.000, eps 0.02, speed 535.13 f/s
440193: done 7669 games, mean reward -48.500, eps 0.02, speed 497.95 f/s
440245: done 7670 games, mean reward -48.500, eps 0

445406: done 7771 games, mean reward -48.990, eps 0.02, speed 542.16 f/s
445457: done 7772 games, mean reward -48.990, eps 0.02, speed 545.29 f/s
445507: done 7773 games, mean reward -48.990, eps 0.02, speed 533.32 f/s
445558: done 7774 games, mean reward -48.990, eps 0.02, speed 537.86 f/s
445609: done 7775 games, mean reward -48.990, eps 0.02, speed 543.19 f/s
445661: done 7776 games, mean reward -48.990, eps 0.02, speed 497.42 f/s
445711: done 7777 games, mean reward -48.990, eps 0.02, speed 532.05 f/s
445761: done 7778 games, mean reward -48.990, eps 0.02, speed 533.06 f/s
445811: done 7779 games, mean reward -48.490, eps 0.02, speed 533.58 f/s
445863: done 7780 games, mean reward -48.490, eps 0.02, speed 549.17 f/s
445913: done 7781 games, mean reward -48.490, eps 0.02, speed 532.86 f/s
445966: done 7782 games, mean reward -48.490, eps 0.02, speed 564.89 f/s
446017: done 7783 games, mean reward -48.490, eps 0.02, speed 539.50 f/s
446067: done 7784 games, mean reward -48.490, eps 0

451214: done 7885 games, mean reward -48.660, eps 0.02, speed 549.65 f/s
451265: done 7886 games, mean reward -48.660, eps 0.02, speed 561.76 f/s
451315: done 7887 games, mean reward -48.660, eps 0.02, speed 549.14 f/s
451365: done 7888 games, mean reward -48.660, eps 0.02, speed 539.04 f/s
451417: done 7889 games, mean reward -48.660, eps 0.02, speed 570.17 f/s
451467: done 7890 games, mean reward -48.660, eps 0.02, speed 550.32 f/s
451519: done 7891 games, mean reward -48.660, eps 0.02, speed 563.66 f/s
451570: done 7892 games, mean reward -49.030, eps 0.02, speed 559.48 f/s
451620: done 7893 games, mean reward -49.030, eps 0.02, speed 549.56 f/s
451671: done 7894 games, mean reward -49.030, eps 0.02, speed 507.82 f/s
451721: done 7895 games, mean reward -49.030, eps 0.02, speed 552.75 f/s
451774: done 7896 games, mean reward -49.030, eps 0.02, speed 582.46 f/s
451824: done 7897 games, mean reward -48.530, eps 0.02, speed 541.96 f/s
451874: done 7898 games, mean reward -48.530, eps 0

457019: done 7999 games, mean reward -49.000, eps 0.02, speed 544.49 f/s
457071: done 8000 games, mean reward -49.000, eps 0.02, speed 573.83 f/s
457122: done 8001 games, mean reward -49.000, eps 0.02, speed 530.11 f/s
457174: done 8002 games, mean reward -49.000, eps 0.02, speed 546.20 f/s
457224: done 8003 games, mean reward -49.000, eps 0.02, speed 535.32 f/s
457276: done 8004 games, mean reward -49.000, eps 0.02, speed 555.52 f/s
457327: done 8005 games, mean reward -49.000, eps 0.02, speed 540.19 f/s
457377: done 8006 games, mean reward -49.000, eps 0.02, speed 534.00 f/s
457427: done 8007 games, mean reward -49.000, eps 0.02, speed 535.43 f/s
457478: done 8008 games, mean reward -49.000, eps 0.02, speed 537.95 f/s
457530: done 8009 games, mean reward -49.000, eps 0.02, speed 555.11 f/s
457582: done 8010 games, mean reward -48.500, eps 0.02, speed 555.05 f/s
457632: done 8011 games, mean reward -48.500, eps 0.02, speed 529.42 f/s
457683: done 8012 games, mean reward -49.000, eps 0

462829: done 8113 games, mean reward -49.180, eps 0.02, speed 526.86 f/s
462879: done 8114 games, mean reward -49.180, eps 0.02, speed 533.43 f/s
462930: done 8115 games, mean reward -49.180, eps 0.02, speed 543.84 f/s
462980: done 8116 games, mean reward -48.680, eps 0.02, speed 526.36 f/s
463031: done 8117 games, mean reward -48.680, eps 0.02, speed 511.41 f/s
463083: done 8118 games, mean reward -48.680, eps 0.02, speed 553.94 f/s
463134: done 8119 games, mean reward -48.680, eps 0.02, speed 539.16 f/s
463184: done 8120 games, mean reward -48.680, eps 0.02, speed 532.50 f/s
463234: done 8121 games, mean reward -48.680, eps 0.02, speed 534.65 f/s
463285: done 8122 games, mean reward -48.680, eps 0.02, speed 539.40 f/s
463336: done 8123 games, mean reward -48.680, eps 0.02, speed 544.91 f/s
463387: done 8124 games, mean reward -48.680, eps 0.02, speed 546.86 f/s
463440: done 8125 games, mean reward -48.680, eps 0.02, speed 559.15 f/s
463490: done 8126 games, mean reward -48.680, eps 0

468642: done 8227 games, mean reward -47.500, eps 0.02, speed 545.47 f/s
468695: done 8228 games, mean reward -47.500, eps 0.02, speed 579.38 f/s
468745: done 8229 games, mean reward -47.500, eps 0.02, speed 549.45 f/s
468796: done 8230 games, mean reward -47.500, eps 0.02, speed 550.47 f/s
468846: done 8231 games, mean reward -47.500, eps 0.02, speed 549.20 f/s
468896: done 8232 games, mean reward -47.500, eps 0.02, speed 547.28 f/s
468947: done 8233 games, mean reward -47.500, eps 0.02, speed 550.01 f/s
468998: done 8234 games, mean reward -47.500, eps 0.02, speed 558.46 f/s
469051: done 8235 games, mean reward -47.500, eps 0.02, speed 522.97 f/s
469102: done 8236 games, mean reward -47.500, eps 0.02, speed 537.55 f/s
469152: done 8237 games, mean reward -47.500, eps 0.02, speed 533.91 f/s
469203: done 8238 games, mean reward -47.500, eps 0.02, speed 544.67 f/s
469255: done 8239 games, mean reward -47.500, eps 0.02, speed 549.74 f/s
469306: done 8240 games, mean reward -47.500, eps 0

474396: done 8340 games, mean reward -48.500, eps 0.02, speed 539.58 f/s
474447: done 8341 games, mean reward -48.500, eps 0.02, speed 563.00 f/s
474498: done 8342 games, mean reward -48.500, eps 0.02, speed 560.75 f/s
474548: done 8343 games, mean reward -48.500, eps 0.02, speed 542.87 f/s
474598: done 8344 games, mean reward -48.500, eps 0.02, speed 549.56 f/s
474649: done 8345 games, mean reward -48.500, eps 0.02, speed 558.23 f/s
474700: done 8346 games, mean reward -48.500, eps 0.02, speed 550.13 f/s
474751: done 8347 games, mean reward -48.500, eps 0.02, speed 551.37 f/s
474802: done 8348 games, mean reward -48.500, eps 0.02, speed 561.48 f/s
474852: done 8349 games, mean reward -48.490, eps 0.02, speed 530.40 f/s
474902: done 8350 games, mean reward -48.490, eps 0.02, speed 514.23 f/s
474953: done 8351 games, mean reward -48.490, eps 0.02, speed 442.10 f/s
475003: done 8352 games, mean reward -48.490, eps 0.02, speed 512.54 f/s
475053: done 8353 games, mean reward -48.490, eps 0

480148: done 8453 games, mean reward -49.330, eps 0.02, speed 536.07 f/s
480199: done 8454 games, mean reward -49.330, eps 0.02, speed 558.36 f/s
480250: done 8455 games, mean reward -49.330, eps 0.02, speed 559.33 f/s
480300: done 8456 games, mean reward -49.330, eps 0.02, speed 505.40 f/s
480350: done 8457 games, mean reward -49.330, eps 0.02, speed 547.08 f/s
480400: done 8458 games, mean reward -49.330, eps 0.02, speed 542.39 f/s
480451: done 8459 games, mean reward -49.330, eps 0.02, speed 540.43 f/s
480501: done 8460 games, mean reward -49.330, eps 0.02, speed 538.26 f/s
480551: done 8461 games, mean reward -49.330, eps 0.02, speed 549.19 f/s
480601: done 8462 games, mean reward -49.330, eps 0.02, speed 531.10 f/s
480652: done 8463 games, mean reward -49.330, eps 0.02, speed 551.73 f/s
480704: done 8464 games, mean reward -49.320, eps 0.02, speed 560.23 f/s
480757: done 8465 games, mean reward -49.330, eps 0.02, speed 561.28 f/s
480807: done 8466 games, mean reward -49.330, eps 0

485966: done 8567 games, mean reward -47.520, eps 0.02, speed 549.49 f/s
486016: done 8568 games, mean reward -47.520, eps 0.02, speed 545.37 f/s
486067: done 8569 games, mean reward -47.530, eps 0.02, speed 560.04 f/s
486120: done 8570 games, mean reward -47.550, eps 0.02, speed 569.71 f/s
486172: done 8571 games, mean reward -47.550, eps 0.02, speed 569.40 f/s
486224: done 8572 games, mean reward -47.350, eps 0.02, speed 525.30 f/s
486275: done 8573 games, mean reward -47.850, eps 0.02, speed 546.83 f/s
486326: done 8574 games, mean reward -47.850, eps 0.02, speed 556.45 f/s
486376: done 8575 games, mean reward -47.850, eps 0.02, speed 548.88 f/s
486427: done 8576 games, mean reward -47.850, eps 0.02, speed 548.08 f/s
486477: done 8577 games, mean reward -47.350, eps 0.02, speed 548.35 f/s
486530: done 8578 games, mean reward -47.350, eps 0.02, speed 581.43 f/s
486582: done 8579 games, mean reward -47.350, eps 0.02, speed 564.57 f/s
486633: done 8580 games, mean reward -47.350, eps 0

491765: done 8680 games, mean reward -49.720, eps 0.02, speed 548.52 f/s
491816: done 8681 games, mean reward -49.720, eps 0.02, speed 544.08 f/s
491868: done 8682 games, mean reward -49.720, eps 0.02, speed 554.98 f/s
491918: done 8683 games, mean reward -49.720, eps 0.02, speed 526.55 f/s
491968: done 8684 games, mean reward -49.720, eps 0.02, speed 533.22 f/s
492018: done 8685 games, mean reward -49.720, eps 0.02, speed 533.16 f/s
492069: done 8686 games, mean reward -49.720, eps 0.02, speed 540.36 f/s
492119: done 8687 games, mean reward -49.720, eps 0.02, speed 533.19 f/s
492170: done 8688 games, mean reward -49.720, eps 0.02, speed 543.46 f/s
492221: done 8689 games, mean reward -49.720, eps 0.02, speed 508.27 f/s
492272: done 8690 games, mean reward -49.720, eps 0.02, speed 543.51 f/s
492323: done 8691 games, mean reward -49.720, eps 0.02, speed 542.71 f/s
492374: done 8692 games, mean reward -49.720, eps 0.02, speed 539.17 f/s
492425: done 8693 games, mean reward -49.720, eps 0

497584: done 8794 games, mean reward -49.500, eps 0.02, speed 559.09 f/s
497638: done 8795 games, mean reward -49.500, eps 0.02, speed 530.35 f/s
497688: done 8796 games, mean reward -49.500, eps 0.02, speed 534.99 f/s
497738: done 8797 games, mean reward -49.500, eps 0.02, speed 510.53 f/s
497789: done 8798 games, mean reward -49.500, eps 0.02, speed 545.14 f/s
497839: done 8799 games, mean reward -49.500, eps 0.02, speed 535.47 f/s
497890: done 8800 games, mean reward -49.500, eps 0.02, speed 537.62 f/s
497942: done 8801 games, mean reward -49.500, eps 0.02, speed 555.00 f/s
497992: done 8802 games, mean reward -49.500, eps 0.02, speed 535.32 f/s
498043: done 8803 games, mean reward -49.500, eps 0.02, speed 539.11 f/s
498097: done 8804 games, mean reward -49.500, eps 0.02, speed 575.22 f/s
498148: done 8805 games, mean reward -49.500, eps 0.02, speed 545.22 f/s
498199: done 8806 games, mean reward -49.500, eps 0.02, speed 493.31 f/s
498249: done 8807 games, mean reward -49.500, eps 0

503365: done 8907 games, mean reward -48.730, eps 0.02, speed 541.42 f/s
503416: done 8908 games, mean reward -48.730, eps 0.02, speed 547.61 f/s
503466: done 8909 games, mean reward -48.730, eps 0.02, speed 536.34 f/s
503517: done 8910 games, mean reward -48.730, eps 0.02, speed 538.55 f/s
503568: done 8911 games, mean reward -48.230, eps 0.02, speed 545.16 f/s
503619: done 8912 games, mean reward -48.230, eps 0.02, speed 502.44 f/s
503669: done 8913 games, mean reward -48.230, eps 0.02, speed 530.52 f/s
503720: done 8914 games, mean reward -48.230, eps 0.02, speed 544.17 f/s
503771: done 8915 games, mean reward -48.230, eps 0.02, speed 544.90 f/s
503823: done 8916 games, mean reward -48.230, eps 0.02, speed 550.60 f/s
503874: done 8917 games, mean reward -48.230, eps 0.02, speed 543.45 f/s
503925: done 8918 games, mean reward -48.230, eps 0.02, speed 545.32 f/s
503975: done 8919 games, mean reward -48.730, eps 0.02, speed 527.88 f/s
504025: done 8920 games, mean reward -48.730, eps 0

509191: done 9021 games, mean reward -50.000, eps 0.02, speed 540.94 f/s
509242: done 9022 games, mean reward -50.000, eps 0.02, speed 544.48 f/s
509293: done 9023 games, mean reward -50.000, eps 0.02, speed 544.16 f/s
509346: done 9024 games, mean reward -50.000, eps 0.02, speed 560.32 f/s
509397: done 9025 games, mean reward -50.000, eps 0.02, speed 543.90 f/s
509449: done 9026 games, mean reward -50.000, eps 0.02, speed 555.38 f/s
509499: done 9027 games, mean reward -50.000, eps 0.02, speed 528.56 f/s
509552: done 9028 games, mean reward -50.000, eps 0.02, speed 534.97 f/s
509603: done 9029 games, mean reward -50.000, eps 0.02, speed 544.19 f/s
509655: done 9030 games, mean reward -50.000, eps 0.02, speed 550.06 f/s
509705: done 9031 games, mean reward -50.000, eps 0.02, speed 489.29 f/s
509755: done 9032 games, mean reward -50.000, eps 0.02, speed 536.32 f/s
509807: done 9033 games, mean reward -50.000, eps 0.02, speed 551.65 f/s
509858: done 9034 games, mean reward -50.000, eps 0

515024: done 9135 games, mean reward -48.170, eps 0.02, speed 482.38 f/s
515075: done 9136 games, mean reward -48.170, eps 0.02, speed 543.82 f/s
515125: done 9137 games, mean reward -48.170, eps 0.02, speed 534.50 f/s
515175: done 9138 games, mean reward -47.940, eps 0.02, speed 526.29 f/s
515229: done 9139 games, mean reward -47.940, eps 0.02, speed 574.50 f/s
515281: done 9140 games, mean reward -47.940, eps 0.02, speed 554.85 f/s
515332: done 9141 games, mean reward -47.940, eps 0.02, speed 536.06 f/s
515383: done 9142 games, mean reward -47.940, eps 0.02, speed 544.58 f/s
515435: done 9143 games, mean reward -47.940, eps 0.02, speed 552.93 f/s
515485: done 9144 games, mean reward -47.940, eps 0.02, speed 529.01 f/s
515535: done 9145 games, mean reward -47.940, eps 0.02, speed 492.00 f/s
515586: done 9146 games, mean reward -47.940, eps 0.02, speed 545.52 f/s
515637: done 9147 games, mean reward -47.940, eps 0.02, speed 537.57 f/s
515688: done 9148 games, mean reward -47.940, eps 0

520846: done 9249 games, mean reward -49.000, eps 0.02, speed 547.34 f/s
520896: done 9250 games, mean reward -49.000, eps 0.02, speed 532.44 f/s
520947: done 9251 games, mean reward -49.000, eps 0.02, speed 513.83 f/s
520998: done 9252 games, mean reward -49.000, eps 0.02, speed 538.93 f/s
521049: done 9253 games, mean reward -49.000, eps 0.02, speed 543.53 f/s
521099: done 9254 games, mean reward -49.000, eps 0.02, speed 534.46 f/s
521152: done 9255 games, mean reward -49.000, eps 0.02, speed 562.00 f/s
521202: done 9256 games, mean reward -49.000, eps 0.02, speed 512.87 f/s
521253: done 9257 games, mean reward -48.500, eps 0.02, speed 543.93 f/s
521304: done 9258 games, mean reward -48.500, eps 0.02, speed 537.98 f/s
521354: done 9259 games, mean reward -48.500, eps 0.02, speed 527.58 f/s
521404: done 9260 games, mean reward -48.500, eps 0.02, speed 535.04 f/s
521456: done 9261 games, mean reward -48.500, eps 0.02, speed 551.75 f/s
521507: done 9262 games, mean reward -48.500, eps 0

526676: done 9363 games, mean reward -48.410, eps 0.02, speed 540.38 f/s
526726: done 9364 games, mean reward -48.410, eps 0.02, speed 536.95 f/s
526779: done 9365 games, mean reward -48.410, eps 0.02, speed 566.71 f/s
526830: done 9366 games, mean reward -48.410, eps 0.02, speed 539.55 f/s
526882: done 9367 games, mean reward -48.410, eps 0.02, speed 558.07 f/s
526936: done 9368 games, mean reward -48.410, eps 0.02, speed 543.00 f/s
526987: done 9369 games, mean reward -48.410, eps 0.02, speed 540.62 f/s
527037: done 9370 games, mean reward -48.410, eps 0.02, speed 536.95 f/s
527088: done 9371 games, mean reward -48.410, eps 0.02, speed 548.47 f/s
527139: done 9372 games, mean reward -48.410, eps 0.02, speed 542.85 f/s
527191: done 9373 games, mean reward -48.410, eps 0.02, speed 556.48 f/s
527242: done 9374 games, mean reward -48.410, eps 0.02, speed 547.80 f/s
527294: done 9375 games, mean reward -48.410, eps 0.02, speed 548.76 f/s
527344: done 9376 games, mean reward -48.410, eps 0

532500: done 9477 games, mean reward -48.990, eps 0.02, speed 526.54 f/s
532551: done 9478 games, mean reward -48.990, eps 0.02, speed 542.38 f/s
532602: done 9479 games, mean reward -48.990, eps 0.02, speed 544.73 f/s
532654: done 9480 games, mean reward -48.990, eps 0.02, speed 547.77 f/s
532705: done 9481 games, mean reward -48.990, eps 0.02, speed 542.39 f/s
532755: done 9482 games, mean reward -48.990, eps 0.02, speed 534.03 f/s
532805: done 9483 games, mean reward -48.700, eps 0.02, speed 526.70 f/s
532856: done 9484 games, mean reward -48.700, eps 0.02, speed 544.51 f/s
532907: done 9485 games, mean reward -48.700, eps 0.02, speed 500.09 f/s
532957: done 9486 games, mean reward -48.200, eps 0.02, speed 528.43 f/s
533007: done 9487 games, mean reward -48.200, eps 0.02, speed 528.41 f/s
533059: done 9488 games, mean reward -48.200, eps 0.02, speed 557.45 f/s
533110: done 9489 games, mean reward -48.700, eps 0.02, speed 538.46 f/s
533161: done 9490 games, mean reward -49.200, eps 0

538258: done 9590 games, mean reward -48.960, eps 0.02, speed 539.77 f/s
538308: done 9591 games, mean reward -48.960, eps 0.02, speed 531.61 f/s
538359: done 9592 games, mean reward -48.960, eps 0.02, speed 525.83 f/s
538410: done 9593 games, mean reward -48.960, eps 0.02, speed 543.48 f/s
538460: done 9594 games, mean reward -48.960, eps 0.02, speed 549.94 f/s
538512: done 9595 games, mean reward -48.960, eps 0.02, speed 570.80 f/s
538563: done 9596 games, mean reward -48.960, eps 0.02, speed 549.99 f/s
538614: done 9597 games, mean reward -49.460, eps 0.02, speed 559.73 f/s
538664: done 9598 games, mean reward -49.460, eps 0.02, speed 548.38 f/s
538714: done 9599 games, mean reward -49.460, eps 0.02, speed 524.47 f/s
538765: done 9600 games, mean reward -49.460, eps 0.02, speed 543.78 f/s
538817: done 9601 games, mean reward -49.460, eps 0.02, speed 554.16 f/s
538869: done 9602 games, mean reward -49.460, eps 0.02, speed 517.45 f/s
538920: done 9603 games, mean reward -49.460, eps 0

544080: done 9704 games, mean reward -49.290, eps 0.02, speed 528.55 f/s
544132: done 9705 games, mean reward -49.290, eps 0.02, speed 556.21 f/s
544182: done 9706 games, mean reward -49.290, eps 0.02, speed 534.71 f/s
544233: done 9707 games, mean reward -49.290, eps 0.02, speed 537.69 f/s
544284: done 9708 games, mean reward -49.290, eps 0.02, speed 541.13 f/s
544335: done 9709 games, mean reward -49.290, eps 0.02, speed 503.09 f/s
544387: done 9710 games, mean reward -49.290, eps 0.02, speed 549.45 f/s
544437: done 9711 games, mean reward -49.290, eps 0.02, speed 533.80 f/s
544487: done 9712 games, mean reward -49.290, eps 0.02, speed 535.28 f/s
544538: done 9713 games, mean reward -49.290, eps 0.02, speed 538.09 f/s
544589: done 9714 games, mean reward -49.290, eps 0.02, speed 543.66 f/s
544639: done 9715 games, mean reward -49.290, eps 0.02, speed 534.65 f/s
544691: done 9716 games, mean reward -49.290, eps 0.02, speed 547.89 f/s
544743: done 9717 games, mean reward -49.290, eps 0

549915: done 9818 games, mean reward -48.620, eps 0.02, speed 584.82 f/s
549965: done 9819 games, mean reward -48.620, eps 0.02, speed 549.58 f/s
550015: done 9820 games, mean reward -49.000, eps 0.02, speed 552.63 f/s
550066: done 9821 games, mean reward -49.000, eps 0.02, speed 552.33 f/s
550116: done 9822 games, mean reward -49.500, eps 0.02, speed 550.27 f/s
550167: done 9823 games, mean reward -49.500, eps 0.02, speed 558.22 f/s
550219: done 9824 games, mean reward -49.500, eps 0.02, speed 564.09 f/s
550269: done 9825 games, mean reward -49.500, eps 0.02, speed 442.52 f/s
550321: done 9826 games, mean reward -49.500, eps 0.02, speed 547.84 f/s
550371: done 9827 games, mean reward -49.500, eps 0.02, speed 536.08 f/s
550425: done 9828 games, mean reward -49.500, eps 0.02, speed 576.90 f/s
550475: done 9829 games, mean reward -49.500, eps 0.02, speed 525.33 f/s
550526: done 9830 games, mean reward -49.500, eps 0.02, speed 545.40 f/s
550576: done 9831 games, mean reward -49.500, eps 0

555671: done 9931 games, mean reward -48.000, eps 0.02, speed 503.53 f/s
555722: done 9932 games, mean reward -48.000, eps 0.02, speed 537.80 f/s
555774: done 9933 games, mean reward -48.000, eps 0.02, speed 553.41 f/s
555826: done 9934 games, mean reward -48.000, eps 0.02, speed 551.37 f/s
555877: done 9935 games, mean reward -48.000, eps 0.02, speed 542.04 f/s
555927: done 9936 games, mean reward -48.000, eps 0.02, speed 532.98 f/s
555978: done 9937 games, mean reward -48.000, eps 0.02, speed 539.19 f/s
556029: done 9938 games, mean reward -48.000, eps 0.02, speed 544.96 f/s
556080: done 9939 games, mean reward -48.000, eps 0.02, speed 544.44 f/s
556132: done 9940 games, mean reward -48.000, eps 0.02, speed 547.63 f/s
556182: done 9941 games, mean reward -48.000, eps 0.02, speed 475.21 f/s
556234: done 9942 games, mean reward -48.000, eps 0.02, speed 555.06 f/s
556284: done 9943 games, mean reward -48.000, eps 0.02, speed 520.38 f/s
556334: done 9944 games, mean reward -48.000, eps 0

561503: done 10045 games, mean reward -49.000, eps 0.02, speed 563.75 f/s
561554: done 10046 games, mean reward -49.000, eps 0.02, speed 560.20 f/s
561604: done 10047 games, mean reward -49.000, eps 0.02, speed 546.16 f/s
561654: done 10048 games, mean reward -49.000, eps 0.02, speed 517.11 f/s
561705: done 10049 games, mean reward -49.000, eps 0.02, speed 494.79 f/s
561759: done 10050 games, mean reward -49.000, eps 0.02, speed 531.73 f/s
561810: done 10051 games, mean reward -49.000, eps 0.02, speed 519.26 f/s
561862: done 10052 games, mean reward -49.000, eps 0.02, speed 532.47 f/s
561913: done 10053 games, mean reward -49.000, eps 0.02, speed 510.29 f/s
561963: done 10054 games, mean reward -49.000, eps 0.02, speed 499.38 f/s
562015: done 10055 games, mean reward -49.000, eps 0.02, speed 554.04 f/s
562065: done 10056 games, mean reward -49.500, eps 0.02, speed 528.24 f/s
562116: done 10057 games, mean reward -49.500, eps 0.02, speed 544.13 f/s
562166: done 10058 games, mean reward 

567254: done 10158 games, mean reward -49.000, eps 0.02, speed 513.34 f/s
567306: done 10159 games, mean reward -49.000, eps 0.02, speed 572.40 f/s
567358: done 10160 games, mean reward -49.000, eps 0.02, speed 559.26 f/s
567410: done 10161 games, mean reward -49.000, eps 0.02, speed 515.16 f/s
567460: done 10162 games, mean reward -49.000, eps 0.02, speed 507.85 f/s
567510: done 10163 games, mean reward -49.000, eps 0.02, speed 522.49 f/s
567561: done 10164 games, mean reward -49.000, eps 0.02, speed 516.93 f/s
567611: done 10165 games, mean reward -49.000, eps 0.02, speed 503.79 f/s
567662: done 10166 games, mean reward -49.000, eps 0.02, speed 374.62 f/s
567713: done 10167 games, mean reward -49.000, eps 0.02, speed 322.85 f/s
567763: done 10168 games, mean reward -49.000, eps 0.02, speed 275.46 f/s
567814: done 10169 games, mean reward -49.000, eps 0.02, speed 324.26 f/s
567864: done 10170 games, mean reward -49.000, eps 0.02, speed 458.16 f/s
567915: done 10171 games, mean reward 

572945: done 10269 games, mean reward -47.590, eps 0.02, speed 410.18 f/s
572995: done 10270 games, mean reward -47.480, eps 0.02, speed 397.38 f/s
573046: done 10271 games, mean reward -47.550, eps 0.02, speed 478.28 f/s
573096: done 10272 games, mean reward -47.550, eps 0.02, speed 419.89 f/s
573147: done 10273 games, mean reward -47.550, eps 0.02, speed 386.73 f/s
573197: done 10274 games, mean reward -47.550, eps 0.02, speed 492.22 f/s
573249: done 10275 games, mean reward -47.550, eps 0.02, speed 434.37 f/s
573301: done 10276 games, mean reward -47.550, eps 0.02, speed 382.66 f/s
573351: done 10277 games, mean reward -47.550, eps 0.02, speed 400.92 f/s
573403: done 10278 games, mean reward -47.550, eps 0.02, speed 513.84 f/s
573453: done 10279 games, mean reward -47.550, eps 0.02, speed 416.46 f/s
573504: done 10280 games, mean reward -47.550, eps 0.02, speed 478.49 f/s
573555: done 10281 games, mean reward -47.550, eps 0.02, speed 469.29 f/s
573605: done 10282 games, mean reward 

578713: done 10382 games, mean reward -49.000, eps 0.02, speed 380.65 f/s
578763: done 10383 games, mean reward -49.000, eps 0.02, speed 507.14 f/s
578814: done 10384 games, mean reward -49.000, eps 0.02, speed 372.61 f/s
578864: done 10385 games, mean reward -48.500, eps 0.02, speed 351.31 f/s
578916: done 10386 games, mean reward -48.500, eps 0.02, speed 410.89 f/s
578967: done 10387 games, mean reward -48.500, eps 0.02, speed 449.10 f/s
579020: done 10388 games, mean reward -48.500, eps 0.02, speed 546.84 f/s
579070: done 10389 games, mean reward -48.500, eps 0.02, speed 493.08 f/s
579120: done 10390 games, mean reward -48.500, eps 0.02, speed 525.70 f/s
579172: done 10391 games, mean reward -48.500, eps 0.02, speed 488.85 f/s
579223: done 10392 games, mean reward -48.500, eps 0.02, speed 533.43 f/s
579276: done 10393 games, mean reward -48.500, eps 0.02, speed 488.63 f/s
579328: done 10394 games, mean reward -48.500, eps 0.02, speed 500.03 f/s
579378: done 10395 games, mean reward 

584475: done 10495 games, mean reward -48.500, eps 0.02, speed 508.19 f/s
584525: done 10496 games, mean reward -48.500, eps 0.02, speed 516.51 f/s
584576: done 10497 games, mean reward -48.500, eps 0.02, speed 494.75 f/s
584626: done 10498 games, mean reward -48.500, eps 0.02, speed 470.61 f/s
584676: done 10499 games, mean reward -48.500, eps 0.02, speed 534.89 f/s
584727: done 10500 games, mean reward -48.500, eps 0.02, speed 560.34 f/s
584778: done 10501 games, mean reward -48.500, eps 0.02, speed 344.27 f/s
584829: done 10502 games, mean reward -48.500, eps 0.02, speed 544.42 f/s
584880: done 10503 games, mean reward -48.500, eps 0.02, speed 548.72 f/s
584932: done 10504 games, mean reward -48.500, eps 0.02, speed 517.52 f/s
584982: done 10505 games, mean reward -48.500, eps 0.02, speed 535.44 f/s
585033: done 10506 games, mean reward -48.500, eps 0.02, speed 546.91 f/s
585085: done 10507 games, mean reward -48.500, eps 0.02, speed 402.57 f/s
585137: done 10508 games, mean reward 

590219: done 10608 games, mean reward -48.520, eps 0.02, speed 505.51 f/s
590272: done 10609 games, mean reward -48.520, eps 0.02, speed 583.34 f/s
590323: done 10610 games, mean reward -48.520, eps 0.02, speed 545.90 f/s
590373: done 10611 games, mean reward -48.520, eps 0.02, speed 464.23 f/s
590423: done 10612 games, mean reward -48.520, eps 0.02, speed 549.96 f/s
590473: done 10613 games, mean reward -48.520, eps 0.02, speed 541.10 f/s
590524: done 10614 games, mean reward -49.020, eps 0.02, speed 482.11 f/s
590576: done 10615 games, mean reward -49.020, eps 0.02, speed 571.30 f/s
590626: done 10616 games, mean reward -49.020, eps 0.02, speed 552.78 f/s
590680: done 10617 games, mean reward -49.020, eps 0.02, speed 524.62 f/s
590732: done 10618 games, mean reward -49.020, eps 0.02, speed 573.17 f/s
590782: done 10619 games, mean reward -49.020, eps 0.02, speed 551.73 f/s
590833: done 10620 games, mean reward -49.020, eps 0.02, speed 466.35 f/s
590885: done 10621 games, mean reward 

595998: done 10721 games, mean reward -48.170, eps 0.02, speed 479.70 f/s
596049: done 10722 games, mean reward -48.170, eps 0.02, speed 555.71 f/s
596100: done 10723 games, mean reward -48.170, eps 0.02, speed 561.87 f/s
596150: done 10724 games, mean reward -48.170, eps 0.02, speed 475.40 f/s
596201: done 10725 games, mean reward -48.170, eps 0.02, speed 562.58 f/s
596253: done 10726 games, mean reward -48.170, eps 0.02, speed 518.85 f/s
596303: done 10727 games, mean reward -48.170, eps 0.02, speed 440.81 f/s
596356: done 10728 games, mean reward -48.170, eps 0.02, speed 565.78 f/s
596406: done 10729 games, mean reward -48.170, eps 0.02, speed 537.50 f/s
596457: done 10730 games, mean reward -48.170, eps 0.02, speed 482.30 f/s
596507: done 10731 games, mean reward -48.170, eps 0.02, speed 535.04 f/s
596558: done 10732 games, mean reward -48.170, eps 0.02, speed 546.48 f/s
596609: done 10733 games, mean reward -48.170, eps 0.02, speed 479.70 f/s
596661: done 10734 games, mean reward 

601712: done 10833 games, mean reward -49.170, eps 0.02, speed 485.43 f/s
601763: done 10834 games, mean reward -49.170, eps 0.02, speed 560.20 f/s
601813: done 10835 games, mean reward -49.170, eps 0.02, speed 552.24 f/s
601863: done 10836 games, mean reward -49.170, eps 0.02, speed 456.48 f/s
601914: done 10837 games, mean reward -49.170, eps 0.02, speed 558.48 f/s
601964: done 10838 games, mean reward -49.170, eps 0.02, speed 552.46 f/s
602015: done 10839 games, mean reward -49.170, eps 0.02, speed 492.71 f/s
602066: done 10840 games, mean reward -49.170, eps 0.02, speed 528.84 f/s
602117: done 10841 games, mean reward -49.170, eps 0.02, speed 562.47 f/s
602168: done 10842 games, mean reward -48.670, eps 0.02, speed 490.66 f/s
602218: done 10843 games, mean reward -48.670, eps 0.02, speed 547.84 f/s
602268: done 10844 games, mean reward -48.670, eps 0.02, speed 536.28 f/s
602319: done 10845 games, mean reward -48.670, eps 0.02, speed 480.12 f/s
602369: done 10846 games, mean reward 

607363: done 10944 games, mean reward -49.090, eps 0.02, speed 471.15 f/s
607414: done 10945 games, mean reward -49.090, eps 0.02, speed 523.61 f/s
607467: done 10946 games, mean reward -49.090, eps 0.02, speed 555.18 f/s
607518: done 10947 games, mean reward -49.090, eps 0.02, speed 455.66 f/s
607569: done 10948 games, mean reward -49.090, eps 0.02, speed 562.97 f/s
607621: done 10949 games, mean reward -49.090, eps 0.02, speed 574.44 f/s
607671: done 10950 games, mean reward -49.090, eps 0.02, speed 482.33 f/s
607724: done 10951 games, mean reward -49.090, eps 0.02, speed 581.91 f/s
607774: done 10952 games, mean reward -49.090, eps 0.02, speed 551.24 f/s
607824: done 10953 games, mean reward -49.090, eps 0.02, speed 477.89 f/s
607875: done 10954 games, mean reward -49.090, eps 0.02, speed 559.94 f/s
607925: done 10955 games, mean reward -49.090, eps 0.02, speed 517.05 f/s
607975: done 10956 games, mean reward -49.090, eps 0.02, speed 473.72 f/s
608025: done 10957 games, mean reward 

613132: done 11057 games, mean reward -50.000, eps 0.02, speed 436.49 f/s
613182: done 11058 games, mean reward -50.000, eps 0.02, speed 531.78 f/s
613233: done 11059 games, mean reward -50.000, eps 0.02, speed 518.63 f/s
613283: done 11060 games, mean reward -50.000, eps 0.02, speed 481.56 f/s
613335: done 11061 games, mean reward -50.000, eps 0.02, speed 555.01 f/s
613386: done 11062 games, mean reward -50.000, eps 0.02, speed 545.65 f/s
613436: done 11063 games, mean reward -50.000, eps 0.02, speed 483.85 f/s
613486: done 11064 games, mean reward -50.000, eps 0.02, speed 533.54 f/s
613537: done 11065 games, mean reward -50.000, eps 0.02, speed 545.55 f/s
613588: done 11066 games, mean reward -50.000, eps 0.02, speed 482.85 f/s
613640: done 11067 games, mean reward -50.000, eps 0.02, speed 530.46 f/s
613690: done 11068 games, mean reward -50.000, eps 0.02, speed 521.77 f/s
613740: done 11069 games, mean reward -50.000, eps 0.02, speed 445.82 f/s
613792: done 11070 games, mean reward 

618847: done 11169 games, mean reward -49.000, eps 0.02, speed 477.75 f/s
618897: done 11170 games, mean reward -49.000, eps 0.02, speed 523.51 f/s
618947: done 11171 games, mean reward -49.000, eps 0.02, speed 534.71 f/s
618997: done 11172 games, mean reward -49.000, eps 0.02, speed 422.75 f/s
619047: done 11173 games, mean reward -49.000, eps 0.02, speed 495.57 f/s
619099: done 11174 games, mean reward -49.000, eps 0.02, speed 535.01 f/s
619149: done 11175 games, mean reward -49.000, eps 0.02, speed 451.38 f/s
619201: done 11176 games, mean reward -49.000, eps 0.02, speed 477.92 f/s
619251: done 11177 games, mean reward -49.000, eps 0.02, speed 383.89 f/s
619302: done 11178 games, mean reward -49.000, eps 0.02, speed 422.39 f/s
619352: done 11179 games, mean reward -49.000, eps 0.02, speed 504.76 f/s
619402: done 11180 games, mean reward -49.000, eps 0.02, speed 478.55 f/s
619455: done 11181 games, mean reward -49.000, eps 0.02, speed 585.58 f/s
619505: done 11182 games, mean reward 

KeyboardInterrupt: 