In [1]:
%matplotlib notebook
import gym
from baselines import deepq
import matplotlib.pyplot as plt
from matplotlib.ticker import MaxNLocator
from xvfbwrapper import Xvfb

In [2]:
# Live training plot. `fig` and `ax` are module-level on purpose: callback()
# (defined below in this cell) clears and redraws `ax` while training runs.
fig, ax = plt.subplots(figsize=(8, 6))
# Switch pyplot to interactive mode so later draw calls update the figure.
plt.ion()

# Show the (still empty) figure once and render it; callback() re-renders it
# afterwards through fig.canvas.draw().
fig.show()
fig.canvas.draw()

def callback(lcl, glb):
    """Per-step training hook: refresh the live reward plot and decide on early stop.

    Passed as ``callback=`` to ``deepq.learn`` in ``main``.

    Args:
        lcl: Mapping of the training loop's local variables. Only ``lcl['t']``
            (the step counter) and ``lcl['episode_rewards']`` (a sequence of
            per-episode rewards) are read.
        glb: Unused; accepted to match the callback signature.

    Returns:
        bool: True once more than 100 steps have run and the windowed average
        reward (see below) is at least 160, False otherwise.
    """
    warmup_steps = 100      # never report "solved" before this many steps
    window = 100            # number of episodes averaged for the stop check
    solved_threshold = 160  # windowed average reward that stops training
    plot_every = 100        # redraw the plot every this many steps

    step = lcl['t']
    episode_rewards = lcl['episode_rewards']

    # The slice drops the last entry and keeps up to `window` entries before it.
    # NOTE(review): presumably the last entry is the episode still in progress --
    # confirm against deepq.learn.
    # The divisor is deliberately the fixed `window`, not the slice length: with
    # fewer than `window` entries the average is underestimated, so a handful of
    # lucky early episodes cannot end training.
    recent = episode_rewards[-(window + 1):-1]
    is_solved = step > warmup_steps and sum(recent) / window >= solved_threshold

    if step % plot_every == 0:
        ax.clear()
        # The curve is the raw per-episode reward (not a running mean), and the
        # labels below say so.
        ax.plot(episode_rewards)
        ax.xaxis.set_major_locator(MaxNLocator(integer=True))
        ax.set_xlabel('Number of Episodes')
        ax.set_ylabel('Episode reward')
        ax.set_title('Episode Reward vs Episodes')
        fig.canvas.draw()
    return is_solved


def main():
    """Train a DQN agent on CartPole-v0 while recording the run to ./cartpole.

    The environment is wrapped in a gym Monitor that writes into ``./cartpole``.
    ``force=True`` clears monitor files left there by a previous run, and the
    ``video_callable`` always returns True, so a video is recorded for every
    episode.

    Returns:
        The value returned by ``deepq.learn`` (the trained policy), so the
        caller can keep or save it instead of losing it when this function exits.
    """
    env = gym.make("CartPole-v0")
    env = gym.wrappers.Monitor(
        env,
        directory='./cartpole',
        video_callable=lambda episode_id: True,
        uid='bonsai',
        force=True,
    )
    try:
        model = deepq.models.mlp([32])
        act = deepq.learn(
            env,
            q_func=model,
            lr=1e-3,
            max_timesteps=100000,
            buffer_size=50000,
            exploration_fraction=0.1,
            exploration_final_eps=0.02,
            print_freq=10,
            # callback() returns True once its reward criterion is met, which
            # ends training before max_timesteps.
            callback=callback
        )
    finally:
        # Close the monitored env even if training fails or is interrupted, so
        # the recorder's files are finalised and its resources released.
        env.close()
    return act

<IPython.core.display.Javascript object>

In [3]:
# Run training inside a virtual X display.
# NOTE(review): presumably needed so the Monitor can render video frames on a
# headless machine -- confirm.
# NOTE(review): the name `display` shadows IPython's built-in display() helper
# for the rest of the session; kept as-is in case other cells refer to it.
display = Xvfb()
display.start()
try:
    main()
finally:
    # Always shut the virtual display down, even when training raises or the
    # cell is interrupted, so no Xvfb process is left running.
    display.stop()

[2017-11-22 15:46:58,073] Making new env: CartPole-v0
[2017-11-22 15:46:58,129] Clearing 402 monitor files from previous run (because force=True was provided)


Instructions for updating:
Use `argmax` instead


[2017-11-22 15:46:59,155] From /bonsai/baselines/baselines/deepq/build_graph.py:366: arg_max (from tensorflow.python.ops.gen_math_ops) is deprecated and will be removed in a future version.
Instructions for updating:
Use `argmax` instead
[2017-11-22 15:47:00,662] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000000.mp4
  out=out, **kwargs)
  ret = ret.dtype.type(ret / rcount)
[2017-11-22 15:47:03,747] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000001.mp4
[2017-11-22 15:47:04,512] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000002.mp4
[2017-11-22 15:47:06,078] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000003.mp4
[2017-11-22 15:47:06,683] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video

--------------------------------------
| % time spent exploring  | 98       |
| episodes                | 10       |
| mean 100 episode reward | 21.8     |
| steps                   | 195      |
--------------------------------------


[2017-11-22 15:47:12,448] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000010.mp4
[2017-11-22 15:47:13,012] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000011.mp4
[2017-11-22 15:47:14,883] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000012.mp4
[2017-11-22 15:47:16,731] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000013.mp4
[2017-11-22 15:47:17,648] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000014.mp4
[2017-11-22 15:47:18,420] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000015.mp4
[2017-11-22 15:47:19,103] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000016.mp4

--------------------------------------
| % time spent exploring  | 95       |
| episodes                | 20       |
| mean 100 episode reward | 22.5     |
| steps                   | 427      |
--------------------------------------


[2017-11-22 15:47:26,203] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000020.mp4
[2017-11-22 15:47:26,917] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000021.mp4
[2017-11-22 15:47:27,913] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000022.mp4
[2017-11-22 15:47:28,944] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000023.mp4
[2017-11-22 15:47:29,813] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000024.mp4
[2017-11-22 15:47:31,037] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000025.mp4
[2017-11-22 15:47:32,432] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000026.mp4

--------------------------------------
| % time spent exploring  | 93       |
| episodes                | 30       |
| mean 100 episode reward | 23.9     |
| steps                   | 692      |
--------------------------------------


[2017-11-22 15:47:36,283] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000030.mp4
[2017-11-22 15:47:37,917] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000031.mp4
[2017-11-22 15:47:38,397] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000032.mp4
[2017-11-22 15:47:39,280] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000033.mp4
[2017-11-22 15:47:40,476] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000034.mp4
[2017-11-22 15:47:41,356] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000035.mp4
[2017-11-22 15:47:42,880] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000036.mp4

--------------------------------------
| % time spent exploring  | 91       |
| episodes                | 40       |
| mean 100 episode reward | 23.3     |
| steps                   | 908      |
--------------------------------------


[2017-11-22 15:47:46,545] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000040.mp4
[2017-11-22 15:47:47,241] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000041.mp4
[2017-11-22 15:47:47,990] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000042.mp4
[2017-11-22 15:47:48,992] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000043.mp4
[2017-11-22 15:47:49,798] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000044.mp4
[2017-11-22 15:47:50,971] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000045.mp4
[2017-11-22 15:47:51,905] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000046.mp4

--------------------------------------
| % time spent exploring  | 89       |
| episodes                | 50       |
| mean 100 episode reward | 22.5     |
| steps                   | 1101     |
--------------------------------------


[2017-11-22 15:47:56,453] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000050.mp4
[2017-11-22 15:47:57,138] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000051.mp4
[2017-11-22 15:47:58,510] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000052.mp4
[2017-11-22 15:48:00,922] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000053.mp4
[2017-11-22 15:48:01,799] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000054.mp4
[2017-11-22 15:48:02,317] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000055.mp4
[2017-11-22 15:48:02,979] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000056.mp4

--------------------------------------
| % time spent exploring  | 87       |
| episodes                | 60       |
| mean 100 episode reward | 22       |
| steps                   | 1298     |
--------------------------------------


[2017-11-22 15:48:06,360] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000060.mp4
[2017-11-22 15:48:07,143] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000061.mp4
[2017-11-22 15:48:08,864] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000062.mp4
[2017-11-22 15:48:10,412] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000063.mp4
[2017-11-22 15:48:11,671] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000064.mp4
[2017-11-22 15:48:12,568] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000065.mp4
[2017-11-22 15:48:13,464] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000066.mp4

--------------------------------------
| % time spent exploring  | 85       |
| episodes                | 70       |
| mean 100 episode reward | 21.4     |
| steps                   | 1479     |
--------------------------------------


[2017-11-22 15:48:17,040] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000070.mp4
[2017-11-22 15:48:18,207] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000071.mp4
[2017-11-22 15:48:19,432] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000072.mp4
[2017-11-22 15:48:20,279] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000073.mp4
[2017-11-22 15:48:21,303] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000074.mp4
[2017-11-22 15:48:22,379] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000075.mp4
[2017-11-22 15:48:23,563] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000076.mp4

--------------------------------------
| % time spent exploring  | 83       |
| episodes                | 80       |
| mean 100 episode reward | 21.1     |
| steps                   | 1665     |
--------------------------------------


[2017-11-22 15:48:27,381] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000080.mp4
[2017-11-22 15:48:28,643] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000081.mp4
[2017-11-22 15:48:29,201] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000082.mp4
[2017-11-22 15:48:30,234] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000083.mp4
[2017-11-22 15:48:30,929] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000084.mp4
[2017-11-22 15:48:31,871] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000085.mp4
[2017-11-22 15:48:32,494] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000086.mp4

--------------------------------------
| % time spent exploring  | 81       |
| episodes                | 90       |
| mean 100 episode reward | 20.8     |
| steps                   | 1850     |
--------------------------------------


[2017-11-22 15:48:36,372] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000090.mp4
[2017-11-22 15:48:36,921] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000091.mp4
[2017-11-22 15:48:37,571] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000092.mp4
[2017-11-22 15:48:38,240] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000093.mp4
[2017-11-22 15:48:39,335] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000094.mp4
[2017-11-22 15:48:40,171] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000095.mp4
[2017-11-22 15:48:40,728] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000096.mp4

--------------------------------------
| % time spent exploring  | 80       |
| episodes                | 100      |
| mean 100 episode reward | 19.9     |
| steps                   | 1974     |
--------------------------------------


[2017-11-22 15:48:43,828] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000100.mp4
[2017-11-22 15:48:45,033] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000101.mp4
[2017-11-22 15:48:45,841] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000102.mp4
[2017-11-22 15:48:46,555] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000103.mp4
[2017-11-22 15:48:47,403] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000104.mp4
[2017-11-22 15:48:48,031] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000105.mp4
[2017-11-22 15:48:48,875] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000106.mp4

--------------------------------------
| % time spent exploring  | 79       |
| episodes                | 110      |
| mean 100 episode reward | 19.5     |
| steps                   | 2142     |
--------------------------------------


[2017-11-22 15:48:52,817] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000110.mp4
[2017-11-22 15:48:53,678] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000111.mp4
[2017-11-22 15:48:54,883] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000112.mp4
[2017-11-22 15:48:55,480] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000113.mp4
[2017-11-22 15:48:56,304] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000114.mp4
[2017-11-22 15:48:57,091] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000115.mp4
[2017-11-22 15:48:57,709] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000116.mp4

--------------------------------------
| % time spent exploring  | 76       |
| episodes                | 120      |
| mean 100 episode reward | 19.3     |
| steps                   | 2353     |
--------------------------------------


[2017-11-22 15:49:03,163] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000120.mp4
[2017-11-22 15:49:03,735] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000121.mp4
[2017-11-22 15:49:04,352] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000122.mp4
[2017-11-22 15:49:05,014] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000123.mp4
[2017-11-22 15:49:06,194] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000124.mp4
[2017-11-22 15:49:06,903] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000125.mp4
[2017-11-22 15:49:07,870] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000126.mp4

--------------------------------------
| % time spent exploring  | 75       |
| episodes                | 130      |
| mean 100 episode reward | 18       |
| steps                   | 2488     |
--------------------------------------


[2017-11-22 15:49:12,162] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000130.mp4
[2017-11-22 15:49:12,712] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000131.mp4
[2017-11-22 15:49:13,955] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000132.mp4
[2017-11-22 15:49:15,037] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000133.mp4
[2017-11-22 15:49:16,530] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000134.mp4
[2017-11-22 15:49:17,986] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000135.mp4
[2017-11-22 15:49:18,889] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000136.mp4

--------------------------------------
| % time spent exploring  | 73       |
| episodes                | 140      |
| mean 100 episode reward | 18.2     |
| steps                   | 2726     |
--------------------------------------


[2017-11-22 15:49:23,723] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000140.mp4
[2017-11-22 15:49:26,144] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000141.mp4
[2017-11-22 15:49:27,524] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000142.mp4
[2017-11-22 15:49:28,612] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000143.mp4
[2017-11-22 15:49:29,383] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000144.mp4
[2017-11-22 15:49:30,132] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000145.mp4
[2017-11-22 15:49:30,713] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000146.mp4

--------------------------------------
| % time spent exploring  | 71       |
| episodes                | 150      |
| mean 100 episode reward | 18.5     |
| steps                   | 2950     |
--------------------------------------


[2017-11-22 15:49:34,454] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000150.mp4
[2017-11-22 15:49:36,326] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000151.mp4
[2017-11-22 15:49:37,902] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000152.mp4
[2017-11-22 15:49:41,364] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000153.mp4
[2017-11-22 15:49:42,571] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000154.mp4
[2017-11-22 15:49:43,736] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000155.mp4
[2017-11-22 15:49:45,823] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000156.mp4

--------------------------------------
| % time spent exploring  | 67       |
| episodes                | 160      |
| mean 100 episode reward | 20.4     |
| steps                   | 3338     |
--------------------------------------


[2017-11-22 15:49:53,376] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000160.mp4
[2017-11-22 15:49:55,025] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000161.mp4
[2017-11-22 15:49:56,112] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000162.mp4
[2017-11-22 15:49:59,076] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000163.mp4
[2017-11-22 15:50:02,907] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000164.mp4
[2017-11-22 15:50:04,419] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000165.mp4
[2017-11-22 15:50:05,171] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000166.mp4

--------------------------------------
| % time spent exploring  | 62       |
| episodes                | 170      |
| mean 100 episode reward | 23.4     |
| steps                   | 3816     |
--------------------------------------


[2017-11-22 15:50:13,722] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000170.mp4
[2017-11-22 15:50:18,495] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000171.mp4
[2017-11-22 15:50:20,860] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000172.mp4
[2017-11-22 15:50:24,140] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000173.mp4
[2017-11-22 15:50:27,363] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000174.mp4
[2017-11-22 15:50:32,541] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000175.mp4
[2017-11-22 15:50:35,230] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000176.mp4

--------------------------------------
| % time spent exploring  | 54       |
| episodes                | 180      |
| mean 100 episode reward | 30.1     |
| steps                   | 4677     |
--------------------------------------


[2017-11-22 15:50:48,408] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000180.mp4
[2017-11-22 15:50:51,845] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000181.mp4
[2017-11-22 15:50:55,581] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000182.mp4
[2017-11-22 15:50:58,981] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000183.mp4
[2017-11-22 15:51:02,607] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000184.mp4
[2017-11-22 15:51:07,623] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000185.mp4
[2017-11-22 15:51:09,541] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000186.mp4

--------------------------------------
| % time spent exploring  | 44       |
| episodes                | 190      |
| mean 100 episode reward | 38.5     |
| steps                   | 5699     |
--------------------------------------


[2017-11-22 15:51:26,818] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000190.mp4
[2017-11-22 15:51:29,255] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000191.mp4
[2017-11-22 15:51:32,255] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000192.mp4
[2017-11-22 15:51:34,841] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000193.mp4
[2017-11-22 15:51:38,059] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000194.mp4
[2017-11-22 15:51:42,204] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000195.mp4
[2017-11-22 15:51:46,429] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000196.mp4

--------------------------------------
| % time spent exploring  | 34       |
| episodes                | 200      |
| mean 100 episode reward | 47.1     |
| steps                   | 6686     |
--------------------------------------


[2017-11-22 15:52:09,090] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000200.mp4
[2017-11-22 15:52:14,531] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000201.mp4
[2017-11-22 15:52:20,361] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000202.mp4
[2017-11-22 15:52:26,250] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000203.mp4
[2017-11-22 15:52:31,311] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000204.mp4
[2017-11-22 15:52:35,580] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000205.mp4
[2017-11-22 15:52:40,103] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000206.mp4

--------------------------------------
| % time spent exploring  | 20       |
| episodes                | 210      |
| mean 100 episode reward | 59.3     |
| steps                   | 8071     |
--------------------------------------


[2017-11-22 15:53:00,172] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000210.mp4
[2017-11-22 15:53:05,609] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000211.mp4
[2017-11-22 15:53:11,272] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000212.mp4
[2017-11-22 15:53:16,622] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000213.mp4
[2017-11-22 15:53:22,523] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000214.mp4
[2017-11-22 15:53:28,249] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000215.mp4
[2017-11-22 15:53:34,481] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000216.mp4

--------------------------------------
| % time spent exploring  | 6        |
| episodes                | 220      |
| mean 100 episode reward | 71.7     |
| steps                   | 9523     |
--------------------------------------


[2017-11-29 00:27:16,391] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000220.mp4
[2017-11-29 00:27:23,016] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000221.mp4
[2017-11-29 00:27:28,570] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000222.mp4


Saving model due to mean reward increase: None -> 75.8


[2017-11-29 00:27:35,781] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000223.mp4
[2017-11-29 00:27:42,420] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000224.mp4
[2017-11-29 00:27:49,782] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000225.mp4
[2017-11-29 00:27:55,546] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000226.mp4
[2017-11-29 00:28:01,042] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000227.mp4
[2017-11-29 00:28:06,161] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000228.mp4
[2017-11-29 00:28:12,102] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000229.mp4

--------------------------------------
| % time spent exploring  | 2        |
| episodes                | 230      |
| mean 100 episode reward | 85.5     |
| steps                   | 11040    |
--------------------------------------


[2017-11-29 00:28:16,898] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000230.mp4
[2017-11-29 00:28:22,360] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000231.mp4
[2017-11-29 00:28:26,648] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000232.mp4
[2017-11-29 00:28:31,562] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000233.mp4
[2017-11-29 00:28:50,252] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000234.mp4
[2017-11-29 00:29:00,017] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000235.mp4
[2017-11-29 00:29:05,696] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000236.mp4

--------------------------------------
| % time spent exploring  | 2        |
| episodes                | 240      |
| mean 100 episode reward | 96.7     |
| steps                   | 12392    |
--------------------------------------


[2017-11-29 00:29:24,713] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000240.mp4
[2017-11-29 00:29:28,808] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000241.mp4
[2017-11-29 00:29:35,413] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000242.mp4
[2017-11-29 00:29:39,779] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000243.mp4
[2017-11-29 00:29:45,647] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000244.mp4
[2017-11-29 00:29:51,262] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000245.mp4
[2017-11-29 00:29:55,712] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000246.mp4

--------------------------------------
| % time spent exploring  | 2        |
| episodes                | 250      |
| mean 100 episode reward | 111      |
| steps                   | 14084    |
--------------------------------------


[2017-11-29 00:30:14,899] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000250.mp4
[2017-11-29 00:30:21,490] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000251.mp4
[2017-11-29 00:30:27,385] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000252.mp4
[2017-11-29 00:30:33,381] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000253.mp4
[2017-11-29 00:30:39,704] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000254.mp4
[2017-11-29 00:30:45,358] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000255.mp4
[2017-11-29 00:30:51,762] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000256.mp4

--------------------------------------
| % time spent exploring  | 2        |
| episodes                | 260      |
| mean 100 episode reward | 125      |
| steps                   | 15866    |
--------------------------------------


[2017-11-29 00:31:18,430] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000260.mp4
[2017-11-29 00:31:24,742] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000261.mp4
[2017-11-29 00:31:30,801] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000262.mp4
[2017-11-29 00:31:37,123] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000263.mp4
[2017-11-29 00:31:43,219] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000264.mp4
[2017-11-29 00:31:50,371] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000265.mp4
[2017-11-29 00:31:57,473] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000266.mp4

--------------------------------------
| % time spent exploring  | 2        |
| episodes                | 270      |
| mean 100 episode reward | 139      |
| steps                   | 17751    |
--------------------------------------


[2017-11-29 00:32:25,673] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000270.mp4
[2017-11-29 00:32:32,262] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000271.mp4
[2017-11-29 00:32:37,788] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000272.mp4
[2017-11-29 00:32:43,310] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000273.mp4
[2017-11-29 00:32:49,773] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000274.mp4
[2017-11-29 00:32:55,032] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000275.mp4
[2017-11-29 00:32:59,530] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000276.mp4

--------------------------------------
| % time spent exploring  | 2        |
| episodes                | 280      |
| mean 100 episode reward | 146      |
| steps                   | 19267    |
--------------------------------------


[2017-11-29 00:33:19,269] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000280.mp4
[2017-11-29 00:33:24,827] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000281.mp4
[2017-11-29 00:33:31,235] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000282.mp4
[2017-11-29 00:33:36,829] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000283.mp4


Saving model due to mean reward increase: 75.8 -> 148.8


[2017-11-29 00:33:44,699] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000284.mp4
[2017-11-29 00:33:50,894] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000285.mp4
[2017-11-29 00:33:56,584] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000286.mp4
[2017-11-29 00:34:03,006] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000287.mp4
[2017-11-29 00:34:10,048] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000288.mp4
[2017-11-29 00:34:16,811] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000289.mp4


--------------------------------------
| % time spent exploring  | 2        |
| episodes                | 290      |
| mean 100 episode reward | 153      |
| steps                   | 21039    |
--------------------------------------


[2017-11-29 00:34:22,517] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000290.mp4
[2017-11-29 00:34:27,919] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000291.mp4
[2017-11-29 00:34:32,956] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000292.mp4
[2017-11-29 00:34:37,885] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000293.mp4
[2017-11-29 00:34:43,660] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000294.mp4
[2017-11-29 00:34:49,193] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000295.mp4
[2017-11-29 00:34:56,097] Starting new video recorder writing to /bonsai/baselines/tutorials/cartpole/openaigym.video.0.bonsai.video000296.mp4

--------------------------------------
| % time spent exploring  | 2        |
| episodes                | 300      |
| mean 100 episode reward | 160      |
| steps                   | 22703    |
--------------------------------------
Restored model with mean reward: 148.8
INFO:tensorflow:Restoring parameters from /tmp/tmp78rcksef/model


[2017-11-29 00:35:14,411] Restoring parameters from /tmp/tmp78rcksef/model
[2017-11-29 00:35:14,621] Finished writing results. You can upload them to the scoreboard via gym.upload('/bonsai/baselines/tutorials/cartpole')
