In [1]:
import os
import sys

# env relative imports
import gymnasium as gym
import gym_idsgame

# Setting up the env

In [2]:
# Building blocks of the environment id that is later handed to gym.make.
env_prefix = 'idsgame'

# Selectable scenario options; the empty string selects the id without an
# option part.
env_options = ['minimal_defense', 'random_defense', 'maximal_attack', 'random_attack']
env_options.append('')  # 2 agents

# Candidate version numbers 0..21 (inclusive).
versions = range(22)

In [3]:
# Choose which scenario and version to instantiate.
# NOTE(review): the saved output of the print cell that follows reads
# 'idsgame-maximal_attack-v21', which is not what env_options[0] produces —
# re-run the notebook or confirm which option is intended.
env_option = env_options[0]
version = versions[-1]  # latest

# A non-empty option is followed by a dash; an empty option contributes
# nothing, giving "<prefix>-v<version>".
option_part = f"{env_option}-" if env_option else ""
env_name = f"{env_prefix}-{option_part}v{version}"

env = gym.make(env_name)

In [4]:
# Show the environment id that was assembled for gym.make.
print(env_name)

idsgame-maximal_attack-v21


In [5]:
# Smoke-test the environment: play a single episode in which both players
# pick uniformly random actions, printing what every step returns.
done = False
env.reset()
while not done:
    attack_action = env.attacker_action_space.sample()
    defense_action = env.defender_action_space.sample()
    # step() is called with the (attacker, defender) action pair.
    a = (attack_action, defense_action)
    # Gymnasium's step() returns (obs, reward, terminated, truncated, info).
    # The episode is over when EITHER flag is set; looking only at
    # `terminated` would keep stepping a truncated episode forever.
    obs, reward, terminated, truncated, info = env.step(a)
    done = terminated or truncated
    print(f'reward: {reward}')
    print(f'attacker_action: {attack_action}')
    print(f'attacker_action shape: {attack_action.shape}')
    print(f'defense_action: {defense_action}')
    print(f'defense_action shape: {defense_action.shape}')
    print(f'obs {obs}')
    print(f'obs shape {obs.shape}')

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
reward: (0, 0)
attacker_action: 17
attacker_action shape: ()
defense_action: 2
defense_action shape: ()
obs [[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
obs shape (4, 10)
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.

  logger.warn(
  logger.deprecation(
  logger.warn(
  logger.warn(f"{pre} is not within the observation space.")
  logger.warn(
  logger.warn(
  logger.warn(
  logger.warn(f"{pre} is not within the observation space.")
  logger.warn(


# Setting up the agent

In [6]:
# Identifier of this run; the cells below use it to name the per-run output
# sub-directories.
# NOTE(review): in the visible cells this value is never passed to an RNG
# (random / numpy / torch) — confirm whether the run is meant to be seeded.
random_seed = 0

In [7]:
# Agent and configuration classes used to set up the DQN agent.
# NOTE(review): these imports sit in the middle of the notebook; consider
# moving them to the first (imports) cell so dependencies are visible up front.
from gym_idsgame.agents.training_agents.q_learning.q_agent_config import QAgentConfig
from gym_idsgame.agents.training_agents.q_learning.dqn.dqn import DQNAgent
from gym_idsgame.agents.training_agents.q_learning.dqn.dqn_config import DQNConfig

# Project-local experiment helpers (resolved relative to the working directory / sys.path).
from experiments.util import util

# Presumably creates the ./output/results/... directory tree for this run's
# seed — confirm against experiments.util.create_artefact_dirs.
util.create_artefact_dirs('./output', random_seed)

In [8]:
# DQN-specific settings.
# NOTE(review): input_dim=88 is a magic number — confirm it matches the size
# of the input the agent builds from this environment's observations.
dqn_config = DQNConfig(input_dim=88)

# Output locations of this run: ./output/results/<kind>/<random_seed>.
output_root = './output'
seed_dir = str(random_seed)
video_dir = output_root + "/results/videos/" + seed_dir
gif_dir = output_root + "/results/gifs/" + seed_dir
save_dir = output_root + "/results/data/" + seed_dir

q_agent_config = QAgentConfig(
    # learning / exploration settings
    gamma=0.999,
    alpha=0.0005,
    epsilon=1,
    min_epsilon=0.01,
    epsilon_decay=0.9999,
    # training and evaluation schedule
    num_episodes=20001,
    train_log_frequency=100,
    eval_frequency=1000,
    eval_episodes=100,
    eval_log_frequency=1,
    eval_sleep=0.9,
    # rendering and recording
    render=False,
    eval_render=False,
    video=True,
    video_fps=5,
    video_frequency=101,
    video_dir=video_dir,
    gifs=True,
    gif_dir=gif_dir,
    # where results are saved
    save_dir=save_dir,
    # which player flags are enabled
    attacker=True,
    defender=False,
    # network configuration
    dqn_config=dqn_config,
)

# NOTE(review): the config enables attacker=True / defender=False while this
# variable is called `defender_agent` — confirm which side is meant to be
# trained. The name is kept as-is because other cells may refer to it.
defender_agent = DQNAgent(env, q_agent_config)

# Launch training.
defender_agent.train()

# Keep the result objects exposed by the agent for later inspection.
train_result = defender_agent.train_result
eval_result = defender_agent.eval_result


  logger.warn(
  logger.warn(
  logger.warn(
  logger.warn(
  logger.warn(
  logger.warn(
  logger.warn(
[Warmup] step:0, buffer_size: 0:   1%|          | 81/10000 [00:00<00:24, 401.88it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:100, buffer_size: 100:   2%|▏         | 169/10000 [00:00<00:23, 423.67it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:200, buffer_size: 200:   2%|▏         | 212/10000 [00:00<00:25, 377.21it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 3.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 3.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [1. 1. 2. 1. 3.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 

[Warmup] step:200, buffer_size: 200:   3%|▎         | 288/10000 [00:00<00:27, 350.97it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 2. 2. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  2.  2.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 2. 1. 1.]
 [1. 2. 2. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  2.  2.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:300, buffer_size: 300:   4%|▎         | 367/10000 [00:00<00:26, 368.27it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:400, buffer_size: 400:   4%|▍         | 449/10000 [00:01<00:25, 375.20it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [2. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 

[Warmup] step:500, buffer_size: 500:   5%|▌         | 532/10000 [00:01<00:24, 392.00it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [2. 2. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [2. 2. 1. 2. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [2. 2. 1. 2. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:600, buffer_size: 600:   6%|▌         | 618/10000 [00:01<00:23, 401.98it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:700, buffer_size: 700:   7%|▋         | 700/10000 [00:01<00:24, 380.02it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 3. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:800, buffer_size: 800:   8%|▊         | 800/10000 [00:02<00:26, 345.70it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 4.  0.  0.  0.  1.  4.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [3. 1. 1. 1. 1.]
 [2. 1. 2. 2. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 4.  0.  0.  0.  1.  4.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [3. 1. 1. 1. 1.]
 [2. 1. 3. 2. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 4.  0.  0.  0.  1.  4.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [3. 1. 1. 1. 1.]
 [2. 1. 3. 2. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 4.  0.  0.  0.  0.  4.  1.  1.  1.  1.]
 

[Warmup] step:800, buffer_size: 800:   9%|▊         | 860/10000 [00:02<00:24, 379.01it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 3.  0.  0.  0.  1.  3.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [2. 1. 1. 2. 2.]
 [2. 1. 1. 3. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 3.  0.  0.  0.  1.  3.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [2. 1. 1. 2. 2.]
 [2. 1. 1. 3. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 3.  0.  0.  0.  0.  3.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 2. 1.]
 [2. 1. 1. 2. 2.]
 [2. 1. 1. 3. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:900, buffer_size: 900:   9%|▉         | 941/10000 [00:02<00:24, 368.35it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:1000, buffer_size: 1000:  10%|█         | 1019/10000 [00:02<00:23, 376.71it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 1. 2. 1.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 2. 1.]
 [1. 1. 1. 2. 1.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  2.  1.  2.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 2. 1.]
 [1. 1. 1. 2. 1.]
 [1. 2. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:1100, buffer_size: 1100:  11%|█         | 1100/10000 [00:02<00:23, 371.53it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [2. 2. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:1200, buffer_size: 1200:  12%|█▏        | 1200/10000 [00:03<00:23, 380.00it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 2. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 2. 2. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  2.  2.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:1300, buffer_size: 1300:  13%|█▎        | 1300/10000 [00:03<00:22, 383.21it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 2. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 2. 1.]
 [2. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 

[Warmup] step:1300, buffer_size: 1300:  14%|█▍        | 1399/10000 [00:03<00:19, 435.34it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:1400, buffer_size: 1400:  15%|█▍        | 1487/10000 [00:03<00:19, 426.69it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:1500, buffer_size: 1500:  15%|█▌        | 1530/10000 [00:03<00:21, 385.61it/s]

In function: attacker obs[[ 0.  1.  0.  0.  0.  3.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 1. 1. 1. 1.]
 [1. 3. 1. 1. 1.]
 [1. 2. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 

[Warmup] step:1600, buffer_size: 1600:  16%|█▌        | 1611/10000 [00:04<00:21, 382.34it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [2. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [2. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:1700, buffer_size: 1700:  17%|█▋        | 1703/10000 [00:04<00:19, 417.08it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [2. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  0.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [2. 2. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 3.  0.  0.  0.  1.  3.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [2. 3. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  2.  1.  2.  1.]
 [ 3.  0.  0.  0.  1.  3.  2.  1.  1.  1.]
 

[Warmup] step:1800, buffer_size: 1800:  18%|█▊        | 1800/10000 [00:04<00:19, 415.75it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:1800, buffer_size: 1800:  19%|█▊        | 1874/10000 [00:04<00:21, 379.80it/s]

In function: attacker obs[[ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [2. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 2. 1. 1.]
 [2. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:1900, buffer_size: 1900:  20%|█▉        | 1951/10000 [00:05<00:22, 357.33it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 3. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:2000, buffer_size: 2000:  20%|██        | 2023/10000 [00:05<00:23, 332.38it/s]

In function: attacker obs[[ 0.  1.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 2. 1.]
 [1. 1. 1. 2. 1.]
 [2. 1. 1. 2. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  2.  0.  0.  0.  2.  2.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 2. 1. 2. 1.]
 [1. 1. 1. 2. 1.]
 [2. 1. 1. 2. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  3.  0.  0.  1.  2.  3.  1.  1.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 2. 1. 2. 1.]
 [1. 1. 1. 2. 1.]
 [2. 1. 2. 2. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:2100, buffer_size: 2100:  21%|██        | 2100/10000 [00:05<00:22, 347.51it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:2200, buffer_size: 2200:  22%|██▏       | 2200/10000 [00:05<00:20, 387.12it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  3.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 3. 1. 1.]
 [1. 1. 1. 2. 1.]
 [1. 2. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  3.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 3. 1. 1.]
 [1. 1. 2. 2. 1.]
 [1. 2. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  3.  1.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 3. 2. 1.]
 [1. 1. 2. 2. 1.]
 [1. 2. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:2200, buffer_size: 2200:  23%|██▎       | 2260/10000 [00:05<00:21, 358.06it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:2300, buffer_size: 2300:  23%|██▎       | 2333/10000 [00:06<00:23, 332.56it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 3. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 4. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 4. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  4.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:2400, buffer_size: 2400:  24%|██▍       | 2405/10000 [00:06<00:25, 303.06it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:2400, buffer_size: 2400:  25%|██▍       | 2468/10000 [00:06<00:25, 295.46it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 2. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:2500, buffer_size: 2500:  25%|██▌       | 2536/10000 [00:06<00:23, 312.03it/s]

In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  2.  1.  1.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 3. 2. 2.]
 [1. 2. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:2600, buffer_size: 2600:  26%|██▌       | 2605/10000 [00:07<00:23, 315.04it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [1. 2. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 2. 1. 1. 1.]
 [1. 2. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:2700, buffer_size: 2700:  27%|██▋       | 2708/10000 [00:07<00:22, 330.00it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 4.  0.  0.  0.  1.  4.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [3. 2. 2. 1. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  3.  1.  1.]
 [ 4.  0.  0.  0.  1.  4.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 3. 1. 1.]
 [3. 2. 2. 1. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  3.  1.  1.]
 [ 4.  0.  0.  0.  1.  4.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 3. 1. 1.]
 [3. 2. 2. 1. 2.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  0.  2.  1.  3.  1.  1.]
 [ 4.  0.  0.  0.  1.  4.  1.  2.  1.  1.]
 

[Warmup] step:2700, buffer_size: 2700:  27%|██▋       | 2742/10000 [00:07<00:22, 328.49it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:2800, buffer_size: 2800:  28%|██▊       | 2806/10000 [00:07<00:25, 277.46it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [2. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:2800, buffer_size: 2800:  29%|██▊       | 2867/10000 [00:07<00:24, 287.75it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:2900, buffer_size: 2900:  29%|██▉       | 2937/10000 [00:08<00:22, 314.61it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  0.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:3000, buffer_size: 3000:  30%|███       | 3000/10000 [00:08<00:25, 279.48it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  3.  3.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 3. 3. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  3.  3.  1.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 3. 3. 2. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 

[Warmup] step:3000, buffer_size: 3000:  31%|███       | 3059/10000 [00:08<00:24, 280.68it/s]

In function: attacker obs[[ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [2. 1. 2. 1. 1.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:3100, buffer_size: 3100:  32%|███▏      | 3151/10000 [00:08<00:23, 293.70it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:3200, buffer_size: 3200:  32%|███▏      | 3210/10000 [00:09<00:24, 274.69it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 3. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 2. 1.]
 [1. 1. 1. 3. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  2.  2.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 2. 1.]
 [1. 1. 1. 3. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  2.  2.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  2.  1.]
 

[Warmup] step:3200, buffer_size: 3200:  33%|███▎      | 3282/10000 [00:09<00:21, 315.57it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  2.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [1. 2. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [1. 2. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  3.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 3. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [1. 2. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  3.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:3300, buffer_size: 3300:  33%|███▎      | 3346/10000 [00:09<00:23, 288.84it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:3400, buffer_size: 3400:  34%|███▍      | 3400/10000 [00:09<00:22, 291.58it/s]

In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 3. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:3400, buffer_size: 3400:  34%|███▍      | 3434/10000 [00:09<00:25, 260.26it/s]

In function: attacker obs[[ 2.  0.  0.  0.  0.  2.  1.  1.  2.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 2. 1.]
 [1. 2. 1. 1. 1.]
 [2. 2. 1. 1. 3.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 3.  0.  0.  0.  1.  3.  1.  1.  2.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 3. 1.]
 [1. 2. 1. 1. 1.]
 [2. 2. 1. 1. 3.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:3500, buffer_size: 3500:  35%|███▌      | 3500/10000 [00:10<00:23, 280.26it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [2. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  1.  0.  0.  0.  2.  1.  1.  1.  1.]
 

[Warmup] step:3500, buffer_size: 3500:  36%|███▌      | 3560/10000 [00:10<00:21, 301.78it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 2. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 2. 2. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:3600, buffer_size: 3600:  36%|███▋      | 3630/10000 [00:10<00:21, 302.62it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 2.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:3700, buffer_size: 3700:  37%|███▋      | 3700/10000 [00:10<00:22, 277.76it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 3. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 3. 2. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  2.  1.  1.]
 

[Warmup] step:3700, buffer_size: 3700:  37%|███▋      | 3749/10000 [00:11<00:23, 271.52it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:3800, buffer_size: 3800:  38%|███▊      | 3804/10000 [00:11<00:23, 268.53it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 2. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 2. 1.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:3800, buffer_size: 3800:  39%|███▊      | 3865/10000 [00:11<00:22, 275.94it/s]

In function: attacker obs[[ 0.  2.  0.  0.  1.  2.  2.  2.  2.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 2. 2. 1.]
 [1. 1. 3. 1. 1.]
 [1. 2. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:3900, buffer_size: 3900:  39%|███▉      | 3919/10000 [00:11<00:24, 245.78it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  2.  1.  3.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 3. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  1.  0.  0.  0.  2.  1.  3.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 3. 1. 1.]
 [2. 1. 1. 1. 2.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:3900, buffer_size: 3900:  40%|███▉      | 3968/10000 [00:11<00:26, 231.25it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 2. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:4000, buffer_size: 4000:  40%|████      | 4022/10000 [00:12<00:26, 226.92it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  2.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 2. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:4000, buffer_size: 4000:  41%|████      | 4073/10000 [00:12<00:25, 228.24it/s]

In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 2. 2. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: a

[Warmup] step:4100, buffer_size: 4100:  41%|████      | 4124/10000 [00:12<00:24, 235.92it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:4200, buffer_size: 4200:  42%|████▏     | 4200/10000 [00:12<00:21, 272.41it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [2. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 3. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [2. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  3.  1.  2.  1.]
 [ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 

[Warmup] step:4200, buffer_size: 4200:  43%|████▎     | 4283/10000 [00:13<00:18, 304.14it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 3. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 3. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  4.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 4. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  4.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:4300, buffer_size: 4300:  43%|████▎     | 4314/10000 [00:13<00:18, 304.51it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:4300, buffer_size: 4300:  44%|████▎     | 4374/10000 [00:13<00:20, 268.91it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:4400, buffer_size: 4400:  45%|████▍     | 4469/10000 [00:13<00:18, 293.00it/s]

In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  4.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 5. 2.]
 [1. 3. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:4500, buffer_size: 4500:  45%|████▌     | 4530/10000 [00:14<00:18, 291.28it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:4600, buffer_size: 4600:  46%|████▌     | 4603/10000 [00:14<00:16, 325.92it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:4600, buffer_size: 4600:  47%|████▋     | 4668/10000 [00:14<00:18, 291.99it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 3.  0.  0.  0.  1.  3.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [3. 1. 2. 1. 1.]
 [1. 1. 2. 1. 3.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 3.  0.  0.  0.  1.  3.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [3. 1. 2. 1. 1.]
 [1. 1. 3. 1. 3.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 3.  0.  0.  0.  0.  3.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [3. 1. 2. 1. 1.]
 [1. 2. 3. 1. 3.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:4700, buffer_size: 4700:  47%|████▋     | 4727/10000 [00:14<00:20, 261.31it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 2. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 

[Warmup] step:4800, buffer_size: 4800:  48%|████▊     | 4800/10000 [00:14<00:17, 295.50it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:4800, buffer_size: 4800:  49%|████▊     | 4859/10000 [00:15<00:17, 287.75it/s]

In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  2.  1.  1.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 3. 1. 1. 2.]
 [2. 1. 1. 1. 2.]
 [1. 1. 1. 2. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  1.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:4900, buffer_size: 4900:  49%|████▉     | 4928/10000 [00:15<00:16, 310.23it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  2.  2.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 2. 1. 1.]
 [2. 1. 1. 1. 1.]
 [1. 2. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:5000, buffer_size: 5000:  50%|█████     | 5000/10000 [00:15<00:17, 284.33it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [2. 1. 1. 1. 2.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:5000, buffer_size: 5000:  51%|█████     | 5086/10000 [00:15<00:16, 292.66it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  2.  2.  2.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 3. 2. 2. 1.]
 [1. 1. 2. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  2.  2.  2.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 3. 2. 2. 1.]
 [1. 1. 2. 1. 1.]
 [1. 3. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 

[Warmup] step:5100, buffer_size: 5100:  51%|█████▏    | 5148/10000 [00:16<00:16, 289.62it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [2. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 2.]
 [1. 1. 1. 1. 2.]
 [2. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 2.]
 [1. 1. 1. 1. 2.]
 [2. 2. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  2.  1.  1.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 

[Warmup] step:5200, buffer_size: 5200:  52%|█████▏    | 5209/10000 [00:16<00:16, 295.06it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:5200, buffer_size: 5200:  52%|█████▏    | 5239/10000 [00:16<00:16, 291.25it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 3.  0.  0.  0.  1.  3.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [2. 2. 2. 1. 2.]
 [3. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 3.  0.  0.  0.  1.  3.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [2. 2. 2. 1. 2.]
 [3. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 3.  0.  0.  0.  0.  3.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [2. 2. 3. 1. 2.]
 [3. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:5300, buffer_size: 5300:  53%|█████▎    | 5305/10000 [00:16<00:15, 297.73it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 2. 1. 1.]
 [2. 1. 2. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  2.  1.  2.  1.  1.]
 [ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 2. 1. 2.]
 [2. 1. 2. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  1.  0.  0.  0.  2.  1.  2.  1.  1.]
 [ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 2. 1. 2.]
 [2. 1. 3. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  2.  0.  0.  1.  2.  2.  2.  1.  1.]
 [ 3.  0.  0.  0.  0.  3.  1.  1.  1.  1.]
 

[Warmup] step:5300, buffer_size: 5300:  54%|█████▎    | 5369/10000 [00:16<00:16, 274.91it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 

[Warmup] step:5400, buffer_size: 5400:  54%|█████▍    | 5400/10000 [00:17<00:19, 236.89it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:5400, buffer_size: 5400:  55%|█████▍    | 5481/10000 [00:17<00:17, 251.95it/s]

In function: attacker obs[[ 0.  0.  1.  0.  0.  2.  2.  1.  2.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 2. 1. 2. 1.]
 [1. 1. 2. 1. 1.]
 [2. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  2.  0.  1.  2.  2.  2.  2.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 2. 1. 2. 1.]
 [2. 1. 2. 1. 1.]
 [2. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:5500, buffer_size: 5500:  55%|█████▌    | 5512/10000 [00:17<00:16, 266.40it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  2.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 2. 2. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [1. 2. 2. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 1. 2. 1.]
 [1. 2. 2. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:5500, buffer_size: 5500:  56%|█████▌    | 5567/10000 [00:17<00:17, 251.46it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 2. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 2. 1. 2.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:5600, buffer_size: 5600:  56%|█████▌    | 5624/10000 [00:17<00:16, 266.76it/s]

In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 2. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 

[Warmup] step:5600, buffer_size: 5600:  57%|█████▋    | 5680/10000 [00:18<00:16, 256.94it/s]

In function: attacker obs[[ 2.  0.  0.  0.  0.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 3.  0.  0.  0.  0.  3.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 2. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 4.  0.  0.  0.  1.  4.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 2. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:5700, buffer_size: 5700:  57%|█████▋    | 5732/10000 [00:18<00:17, 237.91it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 3. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:5800, buffer_size: 5800:  58%|█████▊    | 5800/10000 [00:18<00:16, 249.60it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:5800, buffer_size: 5800:  58%|█████▊    | 5842/10000 [00:18<00:16, 245.18it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:5900, buffer_size: 5900:  59%|█████▉    | 5900/10000 [00:19<00:15, 260.29it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:5900, buffer_size: 5900:  60%|█████▉    | 5962/10000 [00:19<00:16, 244.32it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 2. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:6000, buffer_size: 6000:  60%|██████    | 6017/10000 [00:19<00:15, 252.55it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 2. 1. 1. 2.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  3.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:6000, buffer_size: 6000:  60%|██████    | 6050/10000 [00:19<00:14, 272.10it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 3.  0.  0.  0.  0.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 4.  0.  0.  0.  1.  4.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:6100, buffer_size: 6100:  61%|██████▏   | 6138/10000 [00:19<00:13, 276.83it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 3. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:6200, buffer_size: 6200:  62%|██████▏   | 6208/10000 [00:20<00:12, 308.48it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:6200, buffer_size: 6200:  62%|██████▏   | 6243/10000 [00:20<00:11, 319.18it/s]

In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  2.  2.  1.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 2. 1. 1.]
 [1. 2. 1. 2. 1.]
 [2. 1. 2. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:6300, buffer_size: 6300:  63%|██████▎   | 6304/10000 [00:20<00:16, 230.07it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [2. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [2. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:6300, buffer_size: 6300:  64%|██████▎   | 6360/10000 [00:20<00:14, 248.44it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 3.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:6400, buffer_size: 6400:  64%|██████▍   | 6425/10000 [00:20<00:12, 282.41it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  3.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:6500, buffer_size: 6500:  65%|██████▌   | 6500/10000 [00:21<00:11, 293.35it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [2. 1. 2. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 3. 1. 1.]
 [2. 1. 2. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  3.  1.  1.]
 [ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 3. 1. 1.]
 [2. 1. 2. 2. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  3.  1.  1.]
 [ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 

[Warmup] step:6500, buffer_size: 6500:  65%|██████▌   | 6545/10000 [00:21<00:12, 270.10it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 2. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 2. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:6600, buffer_size: 6600:  66%|██████▌   | 6606/10000 [00:21<00:12, 276.38it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:6600, buffer_size: 6600:  67%|██████▋   | 6695/10000 [00:21<00:11, 284.86it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:6700, buffer_size: 6700:  67%|██████▋   | 6724/10000 [00:22<00:12, 271.75it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [2. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  2.  1.  2.  2.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 2. 2. 1.]
 [1. 1. 1. 1. 1.]
 [2. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:6700, buffer_size: 6700:  68%|██████▊   | 6778/10000 [00:22<00:13, 240.21it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:6800, buffer_size: 6800:  68%|██████▊   | 6834/10000 [00:22<00:12, 256.82it/s]

In function: attacker obs[[ 0.  0.  3.  0.  0.  3.  3.  3.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 3. 3. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  4.  0.  1.  3.  3.  4.  1.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 3. 3. 1. 1.]
 [1. 1. 2. 1. 2.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:6800, buffer_size: 6800:  69%|██████▉   | 6891/10000 [00:22<00:12, 256.67it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 2. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  3.  1.  1.  2.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 2. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  1.  0.  0.  0.  3.  1.  1.  2.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 1. 1. 2. 1.]
 [1. 1. 1. 2. 1.]
 [1. 1. 1. 2. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  2.  0.  0.  1.  3.  2.  1.  2.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 

[Warmup] step:6900, buffer_size: 6900:  69%|██████▉   | 6949/10000 [00:22<00:11, 268.25it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:7000, buffer_size: 7000:  70%|███████   | 7003/10000 [00:23<00:12, 239.02it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:7000, buffer_size: 7000:  71%|███████   | 7069/10000 [00:23<00:10, 279.78it/s]

In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  2.  1.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 2.]
 [2. 1. 1. 2. 2.]
 [2. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:7100, buffer_size: 7100:  71%|███████▏  | 7139/10000 [00:23<00:10, 277.56it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  4.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 4. 1.]
 [1. 1. 2. 1. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:7200, buffer_size: 7200:  72%|███████▏  | 7206/10000 [00:23<00:09, 302.38it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 3. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:7200, buffer_size: 7200:  73%|███████▎  | 7269/10000 [00:24<00:10, 261.95it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 2. 3.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 2. 3.]
 [1. 1. 2. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 2. 4.]
 [1. 1. 2. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:7300, buffer_size: 7300:  73%|███████▎  | 7300/10000 [00:24<00:10, 249.75it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:7300, buffer_size: 7300:  74%|███████▎  | 7352/10000 [00:24<00:10, 245.48it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 2.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 2.]
 [1. 1. 2. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:7400, buffer_size: 7400:  74%|███████▍  | 7414/10000 [00:24<00:10, 253.91it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 

[Warmup] step:7400, buffer_size: 7400:  75%|███████▍  | 7468/10000 [00:24<00:10, 243.41it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  1.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  2.  0.  0.  1.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:7500, buffer_size: 7500:  75%|███████▌  | 7500/10000 [00:25<00:10, 244.26it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 2. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:7500, buffer_size: 7500:  75%|███████▌  | 7541/10000 [00:25<00:12, 200.90it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  1.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:7600, buffer_size: 7600:  76%|███████▌  | 7600/10000 [00:25<00:11, 211.81it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [2. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 

[Warmup] step:7600, buffer_size: 7600:  76%|███████▋  | 7649/10000 [00:25<00:09, 238.84it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 

[Warmup] step:7600, buffer_size: 7600:  77%|███████▋  | 7699/10000 [00:25<00:10, 213.25it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [2. 2. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [2. 2. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:7700, buffer_size: 7700:  77%|███████▋  | 7725/10000 [00:26<00:10, 222.85it/s]

In function: attacker obs[[ 0.  1.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 3. 1.]
 [2. 1. 1. 3. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  2.  0.  0.  1.  2.  2.  1.  1.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 2.]
 [1. 1. 1. 3. 1.]
 [2. 1. 1. 3. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:7700, buffer_size: 7700:  78%|███████▊  | 7770/10000 [00:26<00:11, 197.84it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  3.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  1.  0.  0.  0.  3.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [3. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  2.  0.  0.  1.  3.  2.  1.  1.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 

[Warmup] step:7800, buffer_size: 7800:  78%|███████▊  | 7821/10000 [00:26<00:10, 208.78it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 2. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:7800, buffer_size: 7800:  79%|███████▊  | 7874/10000 [00:26<00:09, 217.47it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [2. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [2. 1. 1. 1. 2.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:7900, buffer_size: 7900:  79%|███████▉  | 7926/10000 [00:26<00:08, 230.91it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:7900, buffer_size: 7900:  80%|███████▉  | 7973/10000 [00:27<00:09, 210.42it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:8000, buffer_size: 8000:  80%|████████  | 8024/10000 [00:27<00:08, 227.02it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [3. 2. 1. 1. 1.]
 [2. 1. 2. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 3.  0.  0.  0.  0.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [3. 2. 1. 1. 1.]
 [2. 1. 2. 1. 3.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 

[Warmup] step:8000, buffer_size: 8000:  81%|████████  | 8069/10000 [00:27<00:09, 200.78it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 3. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:8100, buffer_size: 8100:  81%|████████  | 8121/10000 [00:27<00:08, 224.23it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  2.  0.  0.  1.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [2. 2. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  1.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  2.  0.  0.  1.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [2. 1. 1. 2. 1.]
 [2. 2. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  2.  0.  0.  1.  2.  2.  1.  1.  1.]
 [ 0.  2.  0.  0.  0.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 1. 1. 1. 1.]
 [2. 1. 1. 2. 1.]
 [2. 2. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:8100, buffer_size: 8100:  82%|████████▏ | 8175/10000 [00:28<00:07, 248.15it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 3.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 

[Warmup] step:8200, buffer_size: 8200:  82%|████████▏ | 8224/10000 [00:28<00:08, 218.99it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:8200, buffer_size: 8200:  83%|████████▎ | 8271/10000 [00:28<00:07, 217.00it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  2.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 2. 2. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  1.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:8300, buffer_size: 8300:  83%|████████▎ | 8300/10000 [00:28<00:08, 204.23it/s]

In function: attacker obs[[ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 2.]
 [2. 2. 1. 1. 1.]
 [2. 2. 1. 2. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 [ 3.  0.  0.  0.  0.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 2.]
 [2. 2. 1. 1. 1.]
 [2. 3. 1. 2. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:8300, buffer_size: 8300:  83%|████████▎ | 8334/10000 [00:28<00:09, 178.02it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  3.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 3. 1.]
 [2. 1. 1. 1. 2.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  3.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 3. 1.]
 [2. 2. 1. 1. 2.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  3.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 3. 2.]
 [2. 2. 1. 1. 2.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:8300, buffer_size: 8300:  84%|████████▍ | 8378/10000 [00:29<00:08, 195.05it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 2. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 2. 1. 1. 1.]
 [1. 2. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:8400, buffer_size: 8400:  84%|████████▍ | 8400/10000 [00:29<00:08, 195.20it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 2. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 2. 1. 2. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  2.  1.]
 

[Warmup] step:8400, buffer_size: 8400:  84%|████████▍ | 8436/10000 [00:29<00:09, 167.27it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:8400, buffer_size: 8400:  85%|████████▍ | 8474/10000 [00:29<00:08, 173.20it/s]

In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  2.  2.  1.]
 [ 3.  0.  0.  0.  0.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 2. 3.]
 [2. 1. 1. 1. 1.]
 [1. 1. 2. 3. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:8500, buffer_size: 8500:  85%|████████▌ | 8519/10000 [00:29<00:07, 196.07it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:8600, buffer_size: 8600:  86%|████████▌ | 8600/10000 [00:30<00:05, 247.37it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:8600, buffer_size: 8600:  86%|████████▋ | 8639/10000 [00:30<00:05, 268.28it/s]

In function: attacker obs[[ 0.  1.  0.  0.  0.  2.  1.  2.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 2. 1. 3.]
 [2. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  2.  0.  0.  1.  2.  2.  2.  1.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 2. 1. 3.]
 [2. 1. 1. 1. 2.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:8700, buffer_size: 8700:  87%|████████▋ | 8700/10000 [00:30<00:04, 279.47it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 2. 1. 1.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  0.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [2. 2. 2. 1. 1.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 3.  0.  0.  0.  1.  3.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [2. 2. 2. 1. 1.]
 [2. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 3.  0.  0.  0.  1.  3.  2.  1.  1.  1.]
 

[Warmup] step:8700, buffer_size: 8700:  87%|████████▋ | 8729/10000 [00:30<00:04, 270.93it/s]

In function: attacker obs[[ 2.  0.  0.  0.  0.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:8700, buffer_size: 8700:  88%|████████▊ | 8781/10000 [00:31<00:05, 205.62it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 2. 1. 1.]
 [1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  2.  1.  2.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:8800, buffer_size: 8800:  88%|████████▊ | 8803/10000 [00:31<00:06, 198.37it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [2. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [3. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [4. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:8800, buffer_size: 8800:  89%|████████▊ | 8870/10000 [00:31<00:05, 195.49it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 1. 1.]
 [1. 1. 1. 2. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:8900, buffer_size: 8900:  89%|████████▉ | 8902/10000 [00:31<00:04, 225.98it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 3.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:8900, buffer_size: 8900:  89%|████████▉ | 8947/10000 [00:31<00:05, 193.79it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 3. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  2.  1.  1.  1.]
 

[Warmup] step:9000, buffer_size: 9000:  90%|█████████ | 9000/10000 [00:32<00:05, 188.24it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  2.  2.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 2. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  2.  2.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 2. 1. 3.]
 [1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  2.  2.  1.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 

[Warmup] step:9000, buffer_size: 9000:  90%|█████████ | 9043/10000 [00:32<00:04, 224.61it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:9100, buffer_size: 9100:  91%|█████████ | 9100/10000 [00:32<00:04, 222.89it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 2. 1.]
 [1. 1. 2. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 3. 1. 2. 1.]
 [1. 1. 2. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 3. 1. 2. 2.]
 [1. 1. 2. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  0.  2.  2.  1.  1.  1.]
 

[Warmup] step:9100, buffer_size: 9100:  91%|█████████▏| 9143/10000 [00:32<00:03, 217.03it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 3. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:9100, buffer_size: 9100:  92%|█████████▏| 9189/10000 [00:33<00:04, 194.25it/s]

In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [2. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:9200, buffer_size: 9200:  92%|█████████▏| 9246/10000 [00:33<00:03, 233.91it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 2.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:9300, buffer_size: 9300:  93%|█████████▎| 9300/10000 [00:33<00:02, 237.45it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 2.]
 [1. 1. 2. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 2.]
 [1. 1. 2. 1. 1.]
 [2. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:9300, buffer_size: 9300:  94%|█████████▎| 9358/10000 [00:33<00:02, 259.34it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 2. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 3. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  2.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:9400, buffer_size: 9400:  94%|█████████▍| 9450/10000 [00:33<00:01, 277.64it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 3.  0.  0.  0.  1.  3.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:9500, buffer_size: 9500:  95%|█████████▌| 9519/10000 [00:34<00:01, 292.64it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 3. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 3. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 3. 1. 1. 1.]
 [1. 2. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  2.  3.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:9500, buffer_size: 9500:  95%|█████████▌| 9549/10000 [00:34<00:01, 282.95it/s]

In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  2.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 2. 2. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:9600, buffer_size: 9600:  96%|█████████▋| 9645/10000 [00:34<00:01, 300.63it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [1. 1. 2. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 2. 1.]
 [1. 1. 2. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  2.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 2. 2. 1.]
 [1. 1. 2. 1. 3.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 

[Warmup] step:9700, buffer_size: 9700:  97%|█████████▋| 9717/10000 [00:34<00:00, 307.45it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 2. 1. 2.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  2.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 2. 1.]
 [1. 1. 2. 1. 3.]
 [1. 1. 1. 2. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 

[Warmup] step:9700, buffer_size: 9700:  98%|█████████▊| 9778/10000 [00:35<00:00, 289.18it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  1.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  2.  0.  0.  1.  2.  2.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[2. 1. 1. 1. 1.]
 [1. 2. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:9800, buffer_size: 9800:  98%|█████████▊| 9808/10000 [00:35<00:00, 276.30it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 1. 1. 1.]
 [2. 1. 1. 2. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 2.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:9800, buffer_size: 9800:  99%|█████████▉| 9895/10000 [00:35<00:00, 262.28it/s]

In function: attacker obs[[ 0.  1.  0.  0.  0.  3.  1.  1.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 1. 1. 1. 1.]
 [1. 2. 2. 2. 2.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  2.  0.  0.  1.  3.  2.  1.  1.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[3. 1. 1. 1. 1.]
 [1. 2. 2. 2. 2.]
 [1. 2. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 

[Warmup] step:9900, buffer_size: 9900: 100%|█████████▉| 9958/10000 [00:35<00:00, 269.15it/s]

In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [2. 1. 1. 1. 1.]
 [1. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 

[Warmup] step:9900, buffer_size: 9900: 100%|█████████▉| 9986/10000 [00:35<00:00, 267.72it/s]Error when trying to add network graph to tensorboard
[Warmup] step:9900, buffer_size: 9900: 100%|██████████| 10000/10000 [00:35<00:00, 278.01it/s]
[Train] epsilon:1.00,avg_a_R:0.00,avg_d_R:0.00,avg_t:0.00,avg_h:0.00,acc_A_R:0.00,acc_D_R:0.00:   0%|          | 0/20001 [00:37<?, ?it/s]

In function: attacker obs[[ 1.  0.  0.  0.  0.  1.  2.  2.  1.  1.]
 [ 2.  0.  0.  0.  1.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 2. 1. 2.]
 [1. 1. 1. 2. 1.]
 [2. 1. 2. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 2.  0.  0.  0.  1.  2.  2.  2.  1.  1.]
 [ 2.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0.  1.  1.  1.  1.  1.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 2. 2. 1. 2.]
 [1. 1. 1. 2. 1.]
 [2. 1. 2. 1. 2.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  1. 10. 10. 10. 10.  0.]]
In function: defender obs[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [0. 0. 0. 0. 0.]]
In function: attacker obs[[ 0.  0.  0.  0.  0. 10. 10. 10. 10.  0.]
 [ 0.  0.  0.  0.  0.  2.  1.  1.  1.  1.]
 

ValueError: setting an array element with a sequence. The requested array has an inhomogeneous shape after 1 dimensions. The detected shape was (64,) + inhomogeneous part.

ValueError: setting an array element with a sequence. The requested array has an inhomogeneous shape after 2 dimensions. The detected shape was (2, 3) + inhomogeneous part.