In [1]:
import gym
import wandb
import torch
import numpy as np
from tqdm import tqdm
import torch.nn as nn
import torch.optim as optim
import torch.nn.functional as F

# Define Policy and REINFORCE classes

class Policy(nn.Module):
    def __init__(self, state_dim, hidden_dim, action_dim):
        super(Policy, self).__init__()
        self.fc1 = torch.nn.Linear(state_dim, hidden_dim)
        self.fc2 = torch.nn.Linear(hidden_dim, action_dim)

    def forward(self, x):
        x = F.relu(self.fc1(x))
        return F.softmax(self.fc2(x), dim=1)

class REINFORCE:
    def __init__(self, state_dim, hidden_dim, action_dim, learning_rate, gamma, device, optimizer_type):
        self.policy_net = Policy(state_dim, hidden_dim, action_dim).to(device)
        self.optimizer_type = optimizer_type
        if optimizer_type == 'adam':
            self.optimizer = torch.optim.Adam(self.policy_net.parameters(), lr=learning_rate)
        elif optimizer_type == 'sgd':
            self.optimizer = torch.optim.SGD(self.policy_net.parameters(), lr=learning_rate)
        else:
            raise ValueError("Unsupported optimizer type")
        self.gamma = gamma
        self.device = device

    def take_action(self, state):
        state = torch.tensor(state.reshape(1, -1), dtype=torch.float).to(self.device) 
        probs = self.policy_net(state)
        action_dist = torch.distributions.Categorical(probs) 
        action = action_dist.sample()
        return action.item()  

    def update(self, transition_dict):
        reward_list = transition_dict['rewards']
        state_list = transition_dict['states']
        action_list = transition_dict['actions']

        G = 0
        self.optimizer.zero_grad()
        for i in reversed(range(len(reward_list))):
            reward = reward_list[i]
            state = torch.tensor(state_list[i].reshape(1, -1), dtype=torch.float).to(self.device)
            action = torch.tensor(action_list[i]).view(-1, 1).to(self.device)
            log_prob = torch.log(self.policy_net(state).gather(1, action))
            G = self.gamma * G + reward
            loss = -log_prob * G
            loss.backward()
        self.optimizer.step()

# Hyperparameters
learning_rate = 1e-3
gamma = 0.99
hidden_dim = 128
num_episodes = 300
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
env_name = "CartPole-v1"

# Define the sweep configuration
sweep_config = {
    "method": "bayes",
    "metric": {"name": "regret", "goal": "minimize"},
    "parameters": {
        "learning_rate": {"min": 1e-5, "max": 1e-2},
        "hidden_dim": {"values": [32, 64, 128, 256]},
        "optimizer_type": {"values": ["adam", "sgd"]}
    },'project':'cartpole_without_baseline_new',
    "early_terminate": {
        "type": "hyperband",
        "min_iter": 3,
        "max_iter": 100
    }
}
# Initialize the sweep
sweep_id = wandb.sweep(sweep_config)

def train(learning_rate, hidden_dim, optimizer_type):
    env = gym.make(env_name)
    env.reset(seed=0)
    state_dim = env.observation_space.shape[0]
    action_dim = env.action_space.n
    agent = REINFORCE(state_dim, hidden_dim, action_dim, learning_rate, gamma, device, optimizer_type)
    return_list = []

    for i_episode in range(num_episodes):
        episode_return = 0
        transition_dict = {
            "states": [],
            "actions": [],
            "next_states": [],
            "rewards": [],
            "dones": []
        }
        state, _ = env.reset()
        terminated, truncated = False, False
        while not terminated and not truncated:
            action = agent.take_action(state)
            next_state, reward, terminated, truncated, _ = env.step(action)
            transition_dict["states"].append(state)
            transition_dict["actions"].append(action)
            transition_dict["next_states"].append(next_state)
            transition_dict["rewards"].append(reward)
            transition_dict["dones"].append(terminated)
            state = next_state
            episode_return += reward
        return_list.append(episode_return)
        agent.update(transition_dict)


    avg = []
    for i in range(num_episodes):
        if i < 100:
            avg_return = np.mean(return_list[:i+1])
        else:
            avg_return = np.mean(return_list[i-100:i+1])
        wandb.log({"avg_scores": avg_return})
        avg.append(avg_return)


    regret = 0
    for i in avg:
        if i < 475:
            regret += 475 - i

    return regret

def run_training():
    config_defaults = {
        "learning_rate": 1e-3,
        "hidden_dim": 128,
        "optimizer_type": "adam"
    }
    config = wandb.init(config=config_defaults)
    learning_rate = config.config["learning_rate"]
    hidden_dim = config.config["hidden_dim"]
    optimizer_type = config.config["optimizer_type"]
    regret = train(learning_rate, hidden_dim, optimizer_type)

    wandb.log({"regret": regret})

# Run the sweep
wandb.agent(sweep_id, function=run_training)


Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Create sweep with ID: 76xlzgsh
Sweep URL: https://wandb.ai/rl_shobhith/cartpole_without_baseline_new/sweeps/76xlzgsh


[34m[1mwandb[0m: Agent Starting Run: yp6oq89k with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0016396303816840869
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
[34m[1mwandb[0m: Currently logged in as: [33mshobhith-v[0m ([33mrl_shobhith[0m). Use [1m`wandb login --relogin`[0m to force relogin


  if not isinstance(terminated, (bool, np.bool8)):


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▂▂▂▂▃▂▂▂▂▃▃▃▃▃▃▃▃▃▃▃▄▄▄▄▄▄▄▅▅▆▇████
regret,▁

0,1
avg_scores,122.32673
regret,122818.66113


[34m[1mwandb[0m: Agent Starting Run: shetyvci with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.000624658239765813
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▅▄▂▁▁▁▁▁▁▁▁▁▂▂▁▁▂▂▂▃▃▃▃▃▄▄▄▄▅▅▆▆▆▆▆▇▇███
regret,▁

0,1
avg_scores,55.0297
regret,131740.00156


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 7vc9ankm with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.007707530481611629
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▄▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139674.95642


[34m[1mwandb[0m: Agent Starting Run: ty7mvngs with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0012502067821338564
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▂▂▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▆▆▆▆▇▇███
regret,▁

0,1
avg_scores,58.35644
regret,132128.94931


[34m[1mwandb[0m: Agent Starting Run: 2x3akhce with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0022745714316541156
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▆██▇▆▅▅▄▄▄▄▃▃▃▂▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▃▃▃▃▃▃▃▃
regret,▁

0,1
avg_scores,22.10891
regret,135945.03135


[34m[1mwandb[0m: Agent Starting Run: 19he1x1i with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0020262370406098607
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▂▂▂▂▃▃▃▄▄▅▅▆▆▇▇▇▇██████▇▇▇▆▆▆▅▅▄▄▄▃
regret,▁

0,1
avg_scores,39.37624
regret,127430.96561


[34m[1mwandb[0m: Agent Starting Run: 1wxyddbg with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.005090131807389067
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▄▅█▅▃▃▂▂▂▁▁▁▂▂▂▁▂▃▃▃▃▃▃▃▃▃▄▅▅▅▅▆▆▇▇▇███▇
regret,▁

0,1
avg_scores,25.64356
regret,136849.82217


[34m[1mwandb[0m: Agent Starting Run: s5ggxjzk with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0012420546908991502
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▂▂▂▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▇▇███
regret,▁

0,1
avg_scores,61.20792
regret,131417.95477


[34m[1mwandb[0m: Agent Starting Run: wpgkl8ga with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.005275040354292142
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▄▄▄▅▅▆▆▆▆▇▇▇▇▇██████▇
regret,▁

0,1
avg_scores,165.37624
regret,114638.68622


[34m[1mwandb[0m: Agent Starting Run: 3buu4chi with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.00040026094302339537
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▃▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇██▇▇▇███
regret,▁

0,1
avg_scores,56.70297
regret,131650.4782


[34m[1mwandb[0m: Agent Starting Run: 5ke6duef with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.002752863739965303
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1952671994985112, max=1.0…

0,1
avg_scores,███▆▅▄▃▃▃▃▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,138804.57379


[34m[1mwandb[0m: Agent Starting Run: x7gh4atn with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.003766331512947806
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.35644
regret,139254.47596


[34m[1mwandb[0m: Agent Starting Run: m9qlv0iw with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.005056795078041388
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19554649521718676, max=1.…

0,1
avg_scores,▄▃▂▄▅▇█▇▆▆▆▅▅▄▄▄▄▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,138824.20063


[34m[1mwandb[0m: Agent Starting Run: etfs677u with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0010560621839581243
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▄▃▃▃▂▂▂▂▂▂▂▂▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.57426
regret,139142.08429


[34m[1mwandb[0m: Agent Starting Run: kau18q0l with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0005388996533453981
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19536268212439292, max=1.…

0,1
avg_scores,▁▂▃▃▃▃▄▄▄▄▄▄▅▅▅▆▆▇█▇▇▇▇▆▆▅▅▄▄▃▃▃▂▃▅▅▅▅▅▅
regret,▁

0,1
avg_scores,31.44554
regret,133072.25523


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: xmqb1k37 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.008569234246789776
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19551583568516775, max=1.…

0,1
avg_scores,█▄▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139572.6237


[34m[1mwandb[0m: Agent Starting Run: kv2h783i with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.009873004126744297
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.20074050225370252, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▇█
regret,▁

0,1
avg_scores,235.56436
regret,120404.84811


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: dnl0saqg with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.00933208598251259
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▄▃▃▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139532.90374


[34m[1mwandb[0m: Agent Starting Run: 288ffgs9 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.008675043611247466
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953590467231107, max=1.0…

0,1
avg_scores,█▄▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139611.60147


[34m[1mwandb[0m: Agent Starting Run: fjqatkyy with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0014916342500754384
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▅▆▆▆▇▇▇█
regret,▁

0,1
avg_scores,76.77228
regret,130308.27388


[34m[1mwandb[0m: Agent Starting Run: v1oktm46 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0029284227626168967
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▇▇██
regret,▁

0,1
avg_scores,300.44554
regret,111956.27273


[34m[1mwandb[0m: Agent Starting Run: xw3q9tag with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0004988841659989362
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▄▄▅▅▅▅▆▆▇▇▇█
regret,▁

0,1
avg_scores,58.92079
regret,133853.26126


[34m[1mwandb[0m: Agent Starting Run: qwirhx4n with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.004744469560393682
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▅▄▃▃▂▂▂▁▁▁▂▂▂▁▁▁▁▁▁▁▂▂▂▃▄▄▆▆▆▆▆▆▇▇███▆
regret,▁

0,1
avg_scores,23.41584
regret,137175.39212


[34m[1mwandb[0m: Agent Starting Run: acm83im5 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.001150422740499447
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▁▁▁▂▃▃▄▄▄▄▄▅▅▆▇▇████▇▇████▇▆▆▅▅▅▅▆▆▆▆▆▆▆
regret,▁

0,1
avg_scores,29.71287
regret,134421.37494


[34m[1mwandb[0m: Agent Starting Run: dl0x8syu with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.00395049725582574
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▅▁▅▁▁▂▃▃▃▃▃▄▄▄▄▄▅▆▆▆▇▇███▇▇▇▇▇▆▆▅▆▅▆▆▆▆▇
regret,▁

0,1
avg_scores,9.40594
regret,139721.00693


[34m[1mwandb[0m: Agent Starting Run: 2g6zrgm9 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.00443076349781637
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▄▄▅▅▅▅▅▆▆▅▅▅▅▅▅▅▅▆▆▇▇█
regret,▁

0,1
avg_scores,307.93069
regret,103868.43766


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 4upfgq87 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.009481162411146042
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▁▁▂▁▁▁▂▂▂▂▂▃▃▃▄▄▅▅▆▆▆▆▆▆▆▆▅▆▆▅▅▅▅▅▆▆▇▇██
regret,▁

0,1
avg_scores,75.9604
regret,128159.09817


[34m[1mwandb[0m: Agent Starting Run: grdoz439 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0014058725475968189
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▆█▆▄▄▄▄▄▃▃▃▃▃▃▃▃▃▃▂▂▁▂▃▂▃▂▂▂▁▂▂▃▄▅▅▅▆▆▆▆
regret,▁

0,1
avg_scores,43.63366
regret,132134.25076


[34m[1mwandb[0m: Agent Starting Run: ora2quto with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0023769321685458153
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▅▃▆██▇▆▆▅▄▄▄▄▄▃▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▃▃▃▅▆██
regret,▁

0,1
avg_scores,17.50495
regret,138862.42491


[34m[1mwandb[0m: Agent Starting Run: 1iejb3vb with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.00442967804318147
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▂▁▂▂▂▂▂▂▃▃▃▃▄▅▅▆▆▇▇▇▇▇▇▇▇▇▆▅▅▅▆▆▇█
regret,▁

0,1
avg_scores,189.10891
regret,112449.96347


[34m[1mwandb[0m: Agent Starting Run: coy5nvqo with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.004549855796388878
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▅▅▆▆▆▆▇▇▇████▇▇▇
regret,▁

0,1
avg_scores,154.09901
regret,117682.83963


[34m[1mwandb[0m: Agent Starting Run: 55gjzrxs with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.004398366643997907
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19533208020050125, max=1.…

0,1
avg_scores,▁▁▁▁▂▂▂▃▃▃▃▄▅▅▆▇▇▇▇███▇▇▇▆▅▄▄▄▄▃▃▂▂▂▂▂▂▂
regret,▁

0,1
avg_scores,31.72277
regret,125934.1142


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 1p9a16r6 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.005201085217508244
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19548518576579402, max=1.…

0,1
avg_scores,██▄▃▃▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139307.61411


[34m[1mwandb[0m: Agent Starting Run: vsxkc1fw with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.007434129814533388
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▁▁▁▁▁▂▂▃▃▃▃▄▄▃▄▄▅▅▅▆▆▇██▇▇███████▇▇▆▆▆▆█
regret,▁

0,1
avg_scores,99.0099
regret,123246.47719


[34m[1mwandb[0m: Agent Starting Run: 5rirwyle with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.005272753327013269
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▆▆▄▇▇▆▅▅▄▄▄▄▄▅▅▇█▇██████▇▇▆▅▄▂▁▁▁▁▁▁▂▂▂▂
regret,▁

0,1
avg_scores,9.40594
regret,139558.79117


[34m[1mwandb[0m: Agent Starting Run: 8s0fzc58 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.006342199727853958
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▃▅▆▅▅▄▄▃▃▃▃▃▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,138923.99039


[34m[1mwandb[0m: Agent Starting Run: jp2ypwww with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.008843031254498257
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▃▅▂▁▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▆▆▆▆▅▅▅▅▆▅▅▅▄▄▄▄▅▆▆▇
regret,▁

0,1
avg_scores,9.39604
regret,139728.16609


[34m[1mwandb[0m: Agent Starting Run: 445y4177 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.005899828065804922
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▃▄▄▄▄▄▅▅▆▆▇▇██████▇
regret,▁

0,1
avg_scores,328.06931
regret,96653.36939


[34m[1mwandb[0m: Agent Starting Run: 27m6y8a2 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0069714669939476715
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▄▄▅▅▅▅▅▆▆▇▇███▇▇▇▇▇▇▆▆▆
regret,▁

0,1
avg_scores,227.08911
regret,92574.82668


[34m[1mwandb[0m: Agent Starting Run: yfv1hrc6 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.008933091171439589
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▂▂▂▂▂▃▃▃▃▃▃▃▄▄▄▄▄▄▄▄▄▄▃▃▃▂▂▂▂▂▃▄▅▆▆▇██
regret,▁

0,1
avg_scores,263.42574
regret,110459.61545


[34m[1mwandb[0m: Agent Starting Run: xh5ga6pw with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.007692029463677434
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▅▆▇▇█
regret,▁

0,1
avg_scores,326.06931
regret,115205.38132


[34m[1mwandb[0m: Agent Starting Run: j92n4doz with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0021695817607620517
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▆▅▄▄▃▃▃▃▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,138468.22047


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: beowjh9n with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.004512537740256537
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▄▄▅▅▆▆▇▇▇██
regret,▁

0,1
avg_scores,340.30693
regret,110850.62478


[34m[1mwandb[0m: Agent Starting Run: zo6a5u5o with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0038252220723659185
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▂▂▂▂▃▃▃▃▃▃▃▄▄▅▅▆▆▆▆▆▆▆▆▆▇▇▇▆▇▇▇▇▇███
regret,▁

0,1
avg_scores,111.50495
regret,122396.80016


[34m[1mwandb[0m: Agent Starting Run: n67cngo9 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.001390359657058051
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▃▄▄▄▅▅▅▅▆▆▆▆▇▇██
regret,▁

0,1
avg_scores,250.21782
regret,115814.84031


[34m[1mwandb[0m: Agent Starting Run: uoom5kht with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.009863853749599544
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▃▃▄▄▄▅▅▅▅▅▇████▇▇▇▆▇▇▇▇▆
regret,▁

0,1
avg_scores,73.51485
regret,124955.10097


[34m[1mwandb[0m: Agent Starting Run: fgjquxb2 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0070406146199077
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▆▆█▇▅▅▄▅▅▅▅▅▄▄▄▄▃▃▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,138407.02253


[34m[1mwandb[0m: Agent Starting Run: cl9fo3cd with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.008327128834248174
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▄▅▆▆▆▆▇▇▇▇▇▇██▇▆▆
regret,▁

0,1
avg_scores,160.67327
regret,115814.13923


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: oaxp1osv with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.007717551260576001
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▄▄▄▅▇▇▇▇▇▇▇▇███▇▇▆▅▅▅
regret,▁

0,1
avg_scores,115.9901
regret,115350.80659


[34m[1mwandb[0m: Agent Starting Run: mfy1tnzx with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.005486753380785276
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▅▆▆▇▇▇██
regret,▁

0,1
avg_scores,341.57426
regret,109847.81387


[34m[1mwandb[0m: Agent Starting Run: frzzky2x with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0009365201022600468
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▃▁▃▄▃▄▅▅▅▅▅▅▅▆▇▇▇▇▆▇▇▇▇▇▇█▇▆▆▆▆▆▆▅▅▅▆▇▇█
regret,▁

0,1
avg_scores,39.45545
regret,132587.39359


[34m[1mwandb[0m: Agent Starting Run: 1wly2t6t with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.007423146840341542
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▄▄▄▅▅▆▆▇▇██
regret,▁

0,1
avg_scores,171.67327
regret,125358.98232


[34m[1mwandb[0m: Agent Starting Run: ehor06q0 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.004793921815946731
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▃▃▃▃▄▄▅▆▇▇███
regret,▁

0,1
avg_scores,252.06931
regret,116708.87022


[34m[1mwandb[0m: Agent Starting Run: wpe0ir8t with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.004305046325746628
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▇▅▆██▆▅▅▄▄▄▄▃▃▃▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.37624
regret,138474.00124


[34m[1mwandb[0m: Agent Starting Run: d9vbwkz0 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.003228937514696818
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▅▅▆▆▆▆▇▇█████
regret,▁

0,1
avg_scores,261.94059
regret,110163.77793


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: ewlx6kac with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.003142311340053154
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▄▅█▇▆▅▆▆▅▅▄▄▄▃▃▂▁▁▁▁▁▂▂▃▃▄▄▄▅▅▅▅▅▄▄▃▃▂▂
regret,▁

0,1
avg_scores,14.56436
regret,137511.80806


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: iphvma68 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0035723481396258147
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▂▂▂▃▃▃▃▃▃▃▃▄▄▅▅▆▇▇▇██████▇▇▇▇▆▅▅▅▅▅▆█
regret,▁

0,1
avg_scores,128.28713
regret,117423.63606


[34m[1mwandb[0m: Agent Starting Run: bkprofa1 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.003910694508158939
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▅▅▅▆▇▇▇████
regret,▁

0,1
avg_scores,266.24752
regret,109297.34127


[34m[1mwandb[0m: Agent Starting Run: fp0rje12 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.007897593402935405
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▅▃▃▃▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.46535
regret,139583.89856


[34m[1mwandb[0m: Agent Starting Run: er6a5jy5 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.002544688506302802
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▆▇▇▇▇███
regret,▁

0,1
avg_scores,74.51485
regret,130691.1883


[34m[1mwandb[0m: Agent Starting Run: 4nqecpjf with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.004883463918937782
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▄▁█▅▃▄▄▄▄▃▄▄▄▄▄▃▄▄▄▄▅▅▅▅▅▄▄▅▅▄▄▄▃▄▃▄▄▅▅▅
regret,▁

0,1
avg_scores,9.39604
regret,139716.60673


[34m[1mwandb[0m: Agent Starting Run: 5ly5f42d with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 5.2939428744018365e-05
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▅▁▃▄▆▇▇▇▇▆▇▇▇▇█▇▇▆▆▅▅▅▄▃▃▃▃▂▃▃▃▂▂▁▁▃▂▂▂
regret,▁

0,1
avg_scores,18.43564
regret,136538.43692


[34m[1mwandb[0m: Agent Starting Run: 8vh506qr with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.004746471223302573
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▄▄▅▆▆▇▇█████▇▇▇▇▆▆▆▆▆▆▆▇
regret,▁

0,1
avg_scores,305.45545
regret,84764.86024


[34m[1mwandb[0m: Agent Starting Run: 3rrh5n2a with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.006360666196752822
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▂▃▄▄▃▃▃▃▃▂▂▂▂▂▂▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▄▅▅▆▆██
regret,▁

0,1
avg_scores,86.31683
regret,128461.13692


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 7xhg1yix with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.008178765426725956
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▅▃▂▁▁▁▁█▇▆▆▆▅▅▅▅▅▅▅▅▅▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139392.71999


[34m[1mwandb[0m: Agent Starting Run: filfqb5d with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.009959720159601584
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▅▄▃▃▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.50495
regret,139433.25484


[34m[1mwandb[0m: Agent Starting Run: m1v26wu9 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.009104447471836304
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▇▅▅▅▄▃▃▃▃▃▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139580.29765


[34m[1mwandb[0m: Agent Starting Run: miqh8rth with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.005246992715205427
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▃▃▄▄▄▄▄▄▄▄▄▅▅▅▅▅▅▅▆▆▇▇██
regret,▁

0,1
avg_scores,324.9802
regret,103067.6344


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 4uv898qn with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.009794644035757106
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▇▆▅▄▃▃▃▃▃▂▂▂▂▁▁▁▁▁▁▁▁▃▃▃▃▃▃▃▃▃▃▃▃▃▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139232.49775


[34m[1mwandb[0m: Agent Starting Run: zn2o8gc0 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.009628680375395132
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▄▅▆▆▇▇██████▇▆▅▄▄
regret,▁

0,1
avg_scores,18.84158
regret,137213.89572


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: ewjuksqr with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.002986913280104253
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▅▅▆▆▆▇▇██
regret,▁

0,1
avg_scores,351.63366
regret,107404.75737


[34m[1mwandb[0m: Agent Starting Run: i2o0az9s with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.006895428820104657
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▄▄▄▅▅▅▆▆▇▇▇█████
regret,▁

0,1
avg_scores,443.0
regret,92322.00612


[34m[1mwandb[0m: Agent Starting Run: e6jew0ew with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.003348186980876342
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▃▅▄▄▅▅▄▄▆███▇▇▇▇▇▆▇▇▇▆▅▄▃▃▃▃▃▂▂▂▂▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,10.89109
regret,137761.27176


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: yo9kiqzz with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.006499216248165961
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▄▃▂▁▁▁▁▁▁▁▂▆▅▅▅▅▅▅▅▅▅▅▅▅▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂
regret,▁

0,1
avg_scores,9.40594
regret,139532.97684


[34m[1mwandb[0m: Agent Starting Run: rlvepp7r with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.004293260112342862
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▅█▅▃▃▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,10.0
regret,139299.38332


[34m[1mwandb[0m: Agent Starting Run: 0t194wlg with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.003614957843180072
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▄▄▄▅▅▆▆▇▇▇██
regret,▁

0,1
avg_scores,363.0396
regret,110694.18912


[34m[1mwandb[0m: Agent Starting Run: w910vcij with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.008118664235449675
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▄▅▆▇█████▇▇▇▇▆▅▄▃▂▂▂▂▂▂
regret,▁

0,1
avg_scores,42.12871
regret,115699.8994


[34m[1mwandb[0m: Agent Starting Run: zatn9vb6 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0014422288508653066
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▆▆▆▆▇▇█
regret,▁

0,1
avg_scores,251.60396
regret,116410.02581


[34m[1mwandb[0m: Agent Starting Run: ehlyi9h6 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0016032657776974663
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▂▁▁▄▅▅▆▆▆▇▇▇█████▇▇▇▇▆▅▅▄▃▃▃▃▃▂▂▂▂▂▃▃▃▃▅
regret,▁

0,1
avg_scores,25.34653
regret,135079.81499


[34m[1mwandb[0m: Agent Starting Run: dzu3ddrs with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0033771420334738817
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▃▄▄▄▅▅▆▇█████▇██▇▇▇▆▆▆▆
regret,▁

0,1
avg_scores,200.09901
regret,101033.15805


[34m[1mwandb[0m: Agent Starting Run: we6g74nq with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.009844257985663322
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▄▄▃▃▃▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139600.94822


[34m[1mwandb[0m: Agent Starting Run: jo8sdymc with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.00018355010248713983
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▂▁▁▁▂▂▂▂▂▂▃▃▃▃▄▄▅▅▅▆▆▇▇███▇▇▇▇▇▇▇▇▇▆▆▅▅▅
regret,▁

0,1
avg_scores,61.45545
regret,125177.77432


[34m[1mwandb[0m: Agent Starting Run: kt64c9e0 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.006544131647340199
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▅▅▅▆▇▇█████▇▇▇▇▇▆
regret,▁

0,1
avg_scores,160.91089
regret,111433.94608


[34m[1mwandb[0m: Agent Starting Run: hfwgjd5u with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.004456098323041694
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▃▃▃▄▄▄▄▅▆▆▇▇██
regret,▁

0,1
avg_scores,159.89109
regret,123583.03731


[34m[1mwandb[0m: Agent Starting Run: z5cpojal with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0007365952720659039
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▂▂▂▃▃▃▃▄▄▄▄▄▅▅▅▆▆▆▆▆▆▆▇▇██████▇▇█▇▇▆▆▆
regret,▁

0,1
avg_scores,45.17822
regret,129733.50231


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: h24kwipa with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.003998682064259884
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▂▁▂▃▆██▇▇▇▆▆▆▆▆▆▆▄▄▃▂▂▂▂▂▂▂▁▁▁▁▂▂▂▁▂▃▄
regret,▁

0,1
avg_scores,17.43564
regret,137678.83551


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 7z243f20 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0040100672773069335
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▂▂▂▂▁▁▁▁▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▃▃▄▄▄▄▅▅▆▇▇██▇
regret,▁

0,1
avg_scores,31.63366
regret,137320.36914


[34m[1mwandb[0m: Agent Starting Run: 0eze3pi7 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.009418452723140352
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▄▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂
regret,▁

0,1
avg_scores,9.39604
regret,139671.47075


[34m[1mwandb[0m: Agent Starting Run: t3nnfluf with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.005665739349068273
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▄▃▆▇▆▆▅▅▄▄▄▃▃▃▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,138716.59111


[34m[1mwandb[0m: Agent Starting Run: 9rmu5qqc with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.008687913928096713
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139209.61442


[34m[1mwandb[0m: Agent Starting Run: vmxntwaf with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.001971082465410321
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▅▅▅▆▇▇██
regret,▁

0,1
avg_scores,169.71287
regret,125178.13043


[34m[1mwandb[0m: Agent Starting Run: s2mlj7rw with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.003516363433538108
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▂▃▄▄▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁▂▃▄▄▄▅▆▇▇▇████▆▆▆▆▆
regret,▁

0,1
avg_scores,22.0297
regret,137081.29632


[34m[1mwandb[0m: Agent Starting Run: 4mam0yfg with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.007740185970964823
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▃▃▄▄▄▄▄▅▅▅▆▆▆▆▆▆▆▆▇▇▇███
regret,▁

0,1
avg_scores,381.40594
regret,89761.10921


[34m[1mwandb[0m: Agent Starting Run: 9zli40u6 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.006418403429565747
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▄▄▅▅▆▇▇▇▇▇▇▇▇▇▇██▇
regret,▁

0,1
avg_scores,225.9802
regret,108424.36597


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 5t5qo1re with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0027474774126336142
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▃▃▄▄▄▄▄▄▅▅▆▆▇██
regret,▁

0,1
avg_scores,81.75248
regret,134199.6764


[34m[1mwandb[0m: Agent Starting Run: tgujwq2r with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.00908499840036976
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▅█▆▅▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139572.53803


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: fq0a9s6v with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0010086232685716525
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▆▆▇▇████
regret,▁

0,1
avg_scores,262.17822
regret,111584.83302


[34m[1mwandb[0m: Agent Starting Run: ute880rl with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.00163840660491219
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▄▄▅▅▆▆▇██
regret,▁

0,1
avg_scores,141.07921
regret,127918.29456


[34m[1mwandb[0m: Agent Starting Run: tf2qqebj with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.007145243721769772
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▂▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▄▄▄▅▅▆▇▇▇█████▇▇▆▆▆▆▇
regret,▁

0,1
avg_scores,100.59406
regret,122532.78333


[34m[1mwandb[0m: Agent Starting Run: ibjc2rci with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.005833873504236181
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▇█▄▃▂▂▂▂▁▁▂▂▃▄▄▄▅▆▆▆▆▇██▇▇▆▆▆▅▅▄▄▄▃▂▂▂▁▁
regret,▁

0,1
avg_scores,10.53465
regret,137648.20389


[34m[1mwandb[0m: Agent Starting Run: os3fl7cy with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.009815991518854322
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▄▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139597.80993


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: w0ucdqc1 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.005237089406766094
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888844262, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅█▆▅▄▃▃▃▃▃▃▄▄▄▃▃▃▄▄▅▅▆▆▆▅▄▄▄▄▄▃▃▂▂▁▁▁▁▁
regret,▁

0,1
avg_scores,9.70297
regret,138300.74589


[34m[1mwandb[0m: Agent Starting Run: f3my471p with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.006843048014244778
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▄▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139536.25175


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 5wddha6l with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.005715987673196202
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▇▄▃▃▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.48515
regret,138855.6921


[34m[1mwandb[0m: Agent Starting Run: 92uz0qma with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.002883091675461624
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▄█▆▆▅▇▆▆▇▇▆▆▅▅▄▄▄▄▃▃▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,10.26733
regret,138658.35526


[34m[1mwandb[0m: Agent Starting Run: 2badpmiz with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.007024200833049853
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▂▂▂▂▃▃▄▅▅▆▆▆▆▆▇███▇▇▆▅▅▅▅▅▅▅▄▄▄
regret,▁

0,1
avg_scores,60.0198
regret,126059.61192


[34m[1mwandb[0m: Agent Starting Run: a4fxopua with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.00785424169128689
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▄▄▅▆▆▆▇▇▇▇▇▇██▇▇▇▇▇▇▆
regret,▁

0,1
avg_scores,250.93069
regret,92924.07944


[34m[1mwandb[0m: Agent Starting Run: racigogu with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.005626984422391721
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▄▄▄▄▄▄▄▅▆▆▇▇▇█
regret,▁

0,1
avg_scores,271.93069
regret,114170.87224


[34m[1mwandb[0m: Agent Starting Run: f64d0sf6 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.007082929392749546
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▄▅▅▅▆▆▆▆▆▇█████▇▇▆▆▆▆▆
regret,▁

0,1
avg_scores,146.0297
regret,111482.61309


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: w0mkei1o with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.009966061564705867
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888844262, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▄▅▆▇▇▇██
regret,▁

0,1
avg_scores,215.37624
regret,120454.62185


[34m[1mwandb[0m: Agent Starting Run: bpi9vhng with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.005800828959557478
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▄▅▄▃▃▇▆▆█▇▇▆▆▆▅▅▅▅▄▃▃▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,138916.26347


[34m[1mwandb[0m: Agent Starting Run: h19l8rn5 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.004376912175701112
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▄▅▆▆▇█
regret,▁

0,1
avg_scores,257.46535
regret,124244.33317


[34m[1mwandb[0m: Agent Starting Run: 66k8389t with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0004627871291844659
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▂▂▁▄▃▄▃▂▂▂▁▁▁▁▁▃▃▄▄▄▅▆▇████▇▆▅▅▇█▇▇▇▆▇▇▇
regret,▁

0,1
avg_scores,50.10891
regret,129790.09928


[34m[1mwandb[0m: Agent Starting Run: vkrsuj8h with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0003047155649461232
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▂▂▂▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▅▆▅▅▅▆▆▆▇▇▇▇▇▇▇██
regret,▁

0,1
avg_scores,70.06931
regret,129858.64477


[34m[1mwandb[0m: Agent Starting Run: imjskwev with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.009561574937160163
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▄▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.40594
regret,139471.69041


[34m[1mwandb[0m: Agent Starting Run: 8n2fabvg with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.008276713993526362
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▂▂▂▃▃▄▅▅▅▅▄▄▄▄▄▅▆▇▇█████▇▇▇▇▆▅▅▄▂▂▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.92079
regret,103716.2715


[34m[1mwandb[0m: Agent Starting Run: kvfbt239 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.005935121321394175
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▂▃▃▃▃▃▃▃▃▄▅▆▆▇█
regret,▁

0,1
avg_scores,200.60396
regret,125067.42758


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 7smdt9w6 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.003508564911435288
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▄▄▄▄▅▅▆▆▆▇▇██████▇▇▇▆▆▆▆
regret,▁

0,1
avg_scores,149.40594
regret,106343.16466


[34m[1mwandb[0m: Agent Starting Run: e8n4pkd1 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0034030819073366937
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▅▅▆▆▆▇▇█
regret,▁

0,1
avg_scores,288.75248
regret,114511.14096


[34m[1mwandb[0m: Agent Starting Run: sxkje2a2 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0058215054183812865
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▅▆▆▇▇██
regret,▁

0,1
avg_scores,321.54455
regret,115434.75081


[34m[1mwandb[0m: Agent Starting Run: mqb5uc4y with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.001099299672537282
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▄▃▄▃▂▂▃▂▂▂▂▂▃▃▃▃▂▂▃▃▂▃▃▄▄▄▃▃▃▃▃▂▂▂▁▂▂▂▁
regret,▁

0,1
avg_scores,25.72277
regret,133218.34241


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: u6ip7j2q with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.00486125100809408
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▄▅▆▆▆▆▆▇▇███▇▇
regret,▁

0,1
avg_scores,255.9802
regret,107093.20915


[34m[1mwandb[0m: Agent Starting Run: hks6mzrp with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.004821662513083066
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▃▃▃▄▄▄▅▅▆▆▆▆▇███▇▇▆▆▆▅▅▅
regret,▁

0,1
avg_scores,115.0495
regret,116214.95092


[34m[1mwandb[0m: Agent Starting Run: ere7hyqs with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.007516756598611427
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▂▂▂▂▂▂▃▄▅▅▆▆▇▆▆▆▆▆▆▅▅▅▄▄▄▄▅▆▆▇▇▇█
regret,▁

0,1
avg_scores,139.54455
regret,120637.00229


[34m[1mwandb[0m: Agent Starting Run: yfv9xmud with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 2.2428271551911473e-05
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▆▄▄▃▂▂▁▁▁▂▂▂▂▂▂▂▃▃▃▃▄▄▃▃▃▄▄▄▄▄▄▄▄▄▄▄▅▄▃
regret,▁

0,1
avg_scores,18.37624
regret,136919.99937


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: qksur904 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.00053460721545854
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▃▄▄▄▅▅▅▆▆▆▇▇███
regret,▁

0,1
avg_scores,120.34653
regret,127389.68744


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: cghcyc0f with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.003981030331446277
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▇█▆▅▆▆▆▆▅▅▅▅▅▅▄▄▄▄▃▃▃▃▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,11.32673
regret,136948.36577


[34m[1mwandb[0m: Agent Starting Run: otnr1c5f with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.005678013883549015
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▄▃▁▁▁▁▂▃▂▂▂▃▃▃▃▄▅▅▅▅▅▇██▇▇▇██▇▇▇▇▇▆▆▆▆▇▆
regret,▁

0,1
avg_scores,19.34653
regret,137381.40609


[34m[1mwandb[0m: Agent Starting Run: 87z8t8o1 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0035387363680852973
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▂▂▅█▆▆▆▅▅▄▄▄▄▄▄▄▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.35644
regret,139088.67451


[34m[1mwandb[0m: Agent Starting Run: spfbgcyi with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0010274134585138736
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▅▆▆▇▇██
regret,▁

0,1
avg_scores,225.87129
regret,112855.93923


[34m[1mwandb[0m: Agent Starting Run: w3i4y8zs with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.004691558115590192
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▆▆▇▇██
regret,▁

0,1
avg_scores,407.58416
regret,107960.16137


[34m[1mwandb[0m: Agent Starting Run: xv6k6b7s with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.00572720682735994
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▄▄▄▄▅▅▅▅▆▇███▇▆▆
regret,▁

0,1
avg_scores,123.44554
regret,119316.78863


[34m[1mwandb[0m: Agent Starting Run: abo9dgck with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.005492333995986304
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▃▃▄▅▅▆▆▆▇█████▇▆▆▆▆▆▆
regret,▁

0,1
avg_scores,16.33663
regret,138354.87207


[34m[1mwandb[0m: Agent Starting Run: 4l3i7xb2 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.002404937150791826
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▃▃▄▄▅▅▅▅▅▆▇▇██
regret,▁

0,1
avg_scores,211.76238
regret,121341.37572


[34m[1mwandb[0m: Agent Starting Run: 322rd0lt with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.003829430192249449
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▄▆█████████▇▇▆▆▅
regret,▁

0,1
avg_scores,85.0198
regret,124874.77704


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: vgfd887p with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.009369014097171157
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▇▅▄▄▃▃▃▃▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.42574
regret,139379.19024


[34m[1mwandb[0m: Agent Starting Run: t2v2vdm6 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.004430497234748227
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▃▃▃▃▄▄▄▅▅▆▆▆▇▇▇▇▇██████
regret,▁

0,1
avg_scores,452.11881
regret,79123.09866


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 4jv2ujwo with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.008886450947145196
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,██▇▅▄▄▃▃▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,10.83168
regret,138239.79817


[34m[1mwandb[0m: Agent Starting Run: j9cw5751 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.003640950233522389
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▇▇▆▅▅▄▄▄▄▄▄▅▅▄▄▃▃▃▄▄▄▄▄▄▃▃▃▃▃▃▃▃▂▂▂▂▂▁▁
regret,▁

0,1
avg_scores,9.52475
regret,137640.35602


[34m[1mwandb[0m: Agent Starting Run: vbwot3yg with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.007863843228922775
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▅▄▂▂▂▂▅█▇▆▆▆▅▅▅▅▅▅▅▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139436.0669


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: zeq0x1kt with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 7.78476553693953e-05
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▂▁▂▃▃▃▃▄▄▃▄▃▄▄▄▄▅▅▅▅▅▅▆▆▇▇▇▇▇▇▇▇█████▇
regret,▁

0,1
avg_scores,28.56436
regret,134993.16


[34m[1mwandb[0m: Agent Starting Run: r6ubhnp3 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0067717505448382734
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▄▃▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▃▃▃▃▂▂▂▂▂▂▂▂▁▂▂▂▂▂▂▂
regret,▁

0,1
avg_scores,9.40594
regret,139692.07915


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: bmrbbg7y with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.006298410285162798
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▄▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139413.57458


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: ntmsp3re with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.007541703662505528
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▆█▅▇█▇▆▆▅▅▅▄▄▄▃▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,138680.42085


[34m[1mwandb[0m: Agent Starting Run: x949ctyh with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.006370249061941923
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▇▅▆█▆▅▅▄▄▃▃▃▃▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂
regret,▁

0,1
avg_scores,9.48515
regret,139541.68072


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 5nvt1pzy with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.009067296769609988
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▂▄▂▂▂▁▁▁▁▁▁▁▁▁▁▂▂▂▃▃▄▄▅▆▆▆▆██████▇▆▆▅▄▄▄
regret,▁

0,1
avg_scores,13.50495
regret,138336.86511


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: w3e89ljr with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0018984041052528123
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▄▄▅▅▆▆▇▇▇██
regret,▁

0,1
avg_scores,136.42574
regret,126357.12515


[34m[1mwandb[0m: Agent Starting Run: n19822cd with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.00520246703341275
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▄▅▇█▆▅▄▄▄▃▃▃▃▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂
regret,▁

0,1
avg_scores,11.28713
regret,138462.24716


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 050xgk9h with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0097344691567407
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▂▂▂▂▂▂▂▃▃▃▄▄▄▄▄▄▅▅▆▇▇▇▆▆▅▅▅▅▅▆▆▇██████
regret,▁

0,1
avg_scores,158.43564
regret,112191.53693


[34m[1mwandb[0m: Agent Starting Run: nm6thtqo with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.008571711617376417
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▄▄▅▅▅▅▆▆▇█
regret,▁

0,1
avg_scores,280.93069
regret,115383.18094


[34m[1mwandb[0m: Agent Starting Run: xx7hfmsv with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.003054231582201762
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▅▅▅▆▇▇████
regret,▁

0,1
avg_scores,223.80198
regret,118305.73593


[34m[1mwandb[0m: Agent Starting Run: 95cs4dmj with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.004874317856387692
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▃▅▇▇▇██
regret,▁

0,1
avg_scores,54.38614
regret,137670.92288


[34m[1mwandb[0m: Agent Starting Run: jgqq69m6 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0033683254815116905
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▄█▇▅▃▃▂▂▃▄▄▅▆▅▅▄▄▄▄▄▄▄▃▃▂▁▃▃▄▄▄▄▄▅▇▇▇▇▆▅
regret,▁

0,1
avg_scores,18.11881
regret,137275.09404


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: me14f6f3 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0028857596332665975
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▅▅▆▇▇▇▇████▇▇▇▇▇
regret,▁

0,1
avg_scores,331.85149
regret,87451.04568


[34m[1mwandb[0m: Agent Starting Run: 9i9p2tuk with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.008099772821328701
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▂▂▂▂▂▃▃▃▃▂▂▂▂▂▃▃▃▄▄▅▅▅▆▆▇████▇▆▅▅▄▄▄▃▃
regret,▁

0,1
avg_scores,30.08911
regret,130433.78974


[34m[1mwandb[0m: Agent Starting Run: vrqpb1p1 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0006708094543974918
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▂▂▂▂▂▃▃▃▄▄▄▅▆▆▇▆▆▆▇▇██▇██▇▇▇▇▇█▇▇▆▆▇▇
regret,▁

0,1
avg_scores,48.0
regret,130171.79925


[34m[1mwandb[0m: Agent Starting Run: 9pojrrwy with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.006152943770166117
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▄▄▅▅▆▇▇▇█
regret,▁

0,1
avg_scores,382.51485
regret,109151.49123


[34m[1mwandb[0m: Agent Starting Run: hpurxwyh with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.002257403653510993
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▄█▄▂▂▁▁▂▂▂▂▂▂▂▁▁▁▁▂▂▂▂▃▃▃▃▃▃▄▄▅▅▅▅▅▄▄▄▃▃
regret,▁

0,1
avg_scores,28.81188
regret,134188.6953


[34m[1mwandb[0m: Agent Starting Run: 3pzxv99r with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.003477140737536793
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▄▄▄▅▅▆▆▆▇▇▇▇██████▇▇▆▆▆
regret,▁

0,1
avg_scores,189.20792
regret,102589.95143


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: mq1e0t2p with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.008513478755668444
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▄▅▄▄▃▃▃▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139557.21834


[34m[1mwandb[0m: Agent Starting Run: vhjxlr1k with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0004312010715919605
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▄▆▆▆▇▇▇▇▇▇▆▆▆▆▆▅▅▅▆▆▆▆▇███████▇▇▆▆▆▅▅▅▆
regret,▁

0,1
avg_scores,30.93069
regret,132338.94478


[34m[1mwandb[0m: Agent Starting Run: 25drvfp0 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0036113040030771575
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▅▅▅▅▅▅▅▅▆▆▇████
regret,▁

0,1
avg_scores,166.89109
regret,121276.6581


[34m[1mwandb[0m: Agent Starting Run: sqsnchhy with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.002503009898327084
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888844262, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▁▂▃▂▂▂▂▂▂▂▂▂▂▂▂▃▃▄▄▆▆▅▆▆▆▆▇▇█▇▇▇█████▇▇█
regret,▁

0,1
avg_scores,26.0198
regret,136707.15721


[34m[1mwandb[0m: Agent Starting Run: aa00sk7y with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0023828811040033497
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.34653
regret,139458.94652


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 6302sn6f with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0014544924170997368
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▁▂▁▂▂▃▄▅▄▄▄▄▄▅▅▆▆▆▆▆▆▇▇▇███▇▇▆▆▆▅▅▄▄▃▃▃▄
regret,▁

0,1
avg_scores,26.88119
regret,133021.0516


[34m[1mwandb[0m: Agent Starting Run: s844w4kt with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.006065168438256567
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▃▄▄▅▅▆▆▆▆▆▇▇████▇
regret,▁

0,1
avg_scores,381.47525
regret,94311.76623


[34m[1mwandb[0m: Agent Starting Run: d3bu9q8c with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.002131120432988236
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▃▃▄▄▅▅▅▅▆▆▇▇▇████▇▇▇▇
regret,▁

0,1
avg_scores,257.90099
regret,102569.61813


[34m[1mwandb[0m: Agent Starting Run: 0d1joe5w with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.004758797587502772
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▇▅▅█▇▅▅▄▄▄▃▃▃▃▃▃▂▂▂▂▂▂▂▂▃▃▃▃▃▂▂▂▃▂▂▂▂▂▁▁
regret,▁

0,1
avg_scores,10.26733
regret,138512.0443


[34m[1mwandb[0m: Agent Starting Run: b113d5u8 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.007279214834025053
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▂▂▂▃▃▃▃▃▃▃▄▅▆▇█████▇▇▇▇▆▅▄▄▂▂▂▂▂▂▃▃▄
regret,▁

0,1
avg_scores,72.0495
regret,120681.19806


[34m[1mwandb[0m: Agent Starting Run: ooz6r7op with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.008479384378346711
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▆██▆▅▄▄▄▄▃▃▃▃▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,138379.94469


[34m[1mwandb[0m: Agent Starting Run: q1nlmmbb with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.001299928603556825
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▃▃▃▃▄▄▄▄▅▆▆▆▇▇▇▇▇███
regret,▁

0,1
avg_scores,213.30693
regret,114679.19765


[34m[1mwandb[0m: Agent Starting Run: r1tyvh6b with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.009006832791608172
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▂▂▂▂▃▃▃▃▃▄▄▅▆▆▆▇██████▇▇▇▇▇▆▆▅▅▅▅▅▅
regret,▁

0,1
avg_scores,114.87129
regret,108378.33907


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 0ry4demn with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0020064330301899714
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▃▄▃▃▃▃▄▃▄▄▄▄▄▃▃▄▄▄▄▃▃▃▃▃▄▄▅▅▅▅▆▇▇▇████
regret,▁

0,1
avg_scores,29.33663
regret,136364.6351


[34m[1mwandb[0m: Agent Starting Run: gccyuzz2 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.00474275563732855
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▃▄▄▅▅▆▆▆▆▆▆▇▇▇▇▇▇▇▇▇▇▇███
regret,▁

0,1
avg_scores,155.65347
regret,115758.40848


[34m[1mwandb[0m: Agent Starting Run: qtu9710b with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.004411200988499444
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▃▂▁▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▃▃▃▃▃▄▅▅▅▆▆▆▇▇████▇▆▅
regret,▁

0,1
avg_scores,19.38614
regret,137466.54153


[34m[1mwandb[0m: Agent Starting Run: voga6lz9 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.00934970035501912
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▂▂▂▃▃▄▅▆▆▆▆▇▇▇█████▇▇▆▆▇▇▇▇▆▇
regret,▁

0,1
avg_scores,114.35644
regret,118538.67414


[34m[1mwandb[0m: Agent Starting Run: dqmv3ycp with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.005361972682387592
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▂▂█▄▃▅▅▇▇▇▇██▇▇▇▆▆▆▅▄▄▃▃▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,13.73267
regret,137496.28194


[34m[1mwandb[0m: Agent Starting Run: fxe6uxoh with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.002839599213234842
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▃▂▂▁▁▁▁▂▂▁▁▁▁▁▁▁▂▂▃▃▃▃▃▃▄▄▄▄▅▇▇▇▇▇▇▇████
regret,▁

0,1
avg_scores,33.88119
regret,136465.30066


[34m[1mwandb[0m: Agent Starting Run: qnswuqlw with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.005771837380497962
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▆▃▃▃▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▄▅▆▆▆
regret,▁

0,1
avg_scores,12.26733
regret,139454.12353


[34m[1mwandb[0m: Agent Starting Run: x3kw5uia with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.001313647414139755
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▂▃▅▄▄▄▄▄▄▅▅▅▅▇▇▇▇▇█████▇▇▇▇▇▇▇▇▇▆▆▆▅▅▅▄
regret,▁

0,1
avg_scores,20.29703
regret,135479.46079


[34m[1mwandb[0m: Agent Starting Run: g80wl5mv with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.003230657260167698
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▂▂▂▁▁▁▁▁▂▂▃▃▃▃▄▅▅▆▇▇████████▇▇▇▆▆▆▆▆
regret,▁

0,1
avg_scores,150.31683
regret,108302.64085


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: pbsl6fy7 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.006742335565553793
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▄▄▅▅▅▆▆▆▆▆▇▇▇▇▇▇▇▇▇██
regret,▁

0,1
avg_scores,350.81188
regret,93104.31504


[34m[1mwandb[0m: Agent Starting Run: cic1xryc with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0022255804198577614
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▄▄▄▄▄▅▅▅▆▆▆▆▇▇██
regret,▁

0,1
avg_scores,205.52475
regret,119104.38948


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: rb2nhn1z with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.007350891727790795
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▂▂▂▂▂▃▄▅▅▅▅▄▄▄▄▄▄▄▄▄▄▃▃▄▄▄▄▅▅▅▅▆▅▅▅▆▇█
regret,▁

0,1
avg_scores,177.85149
regret,113980.71376


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 797mqa6n with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0047782743277375314
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.48515
regret,139494.74835


[34m[1mwandb[0m: Agent Starting Run: ovh6zh8o with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.006479847245044044
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▇▆█▆▄▄▃▃▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.40594
regret,139107.09862


[34m[1mwandb[0m: Agent Starting Run: 6ou9jy55 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0015937547445719414
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▅▅▅▅▄▄▄▃▃▃▃▃▃▄▃▃▃▃▃▃▃▃▃▃▂▂▁▁▁▁▁▁▁▁▁▁▁▂
regret,▁

0,1
avg_scores,11.13861
regret,138669.95546


[34m[1mwandb[0m: Agent Starting Run: cj96e8s2 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.009344393747600375
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▅▅▆▆▆▇▇▇▇████
regret,▁

0,1
avg_scores,469.89109
regret,90194.58451


[34m[1mwandb[0m: Agent Starting Run: o4ty6y0r with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0004648436041141235
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▄▅▆▆▅▄▄▃▃▃▃▃▃▂▂▂▁▁▁▁▁▁▁▂▂▃▄▅▅▆▇████▇▇▆▅▅
regret,▁

0,1
avg_scores,18.80198
regret,137271.32327


[34m[1mwandb[0m: Agent Starting Run: bi6od4qq with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0009180945262451562
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▅▃▃▄▄▆▇▆▆▅▄▄▄▃▃▃▃▃▃▁▂▂▃▄▅▅▆▆▆▆▇▆▆▆▅▅▄▄
regret,▁

0,1
avg_scores,24.45545
regret,134423.1526


[34m[1mwandb[0m: Agent Starting Run: 4blzrhjg with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.00422191080862467
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▄▄▄▄▅▅▅▆▆▆▇▇▇▇███
regret,▁

0,1
avg_scores,437.72277
regret,92671.12362


[34m[1mwandb[0m: Agent Starting Run: b8ot2r5a with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.005772139077341473
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▃▃▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,138942.20796


[34m[1mwandb[0m: Agent Starting Run: 8qhonx78 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.003959965614598252
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▃▂▁▁▄▅▆▅▇▇▆▆▆▆▇██▇▇▆▆▆▅▅▆▆▆▆▅▅▅▅▅▅▆▆▆▆▆▆
regret,▁

0,1
avg_scores,21.0297
regret,136440.31388


[34m[1mwandb[0m: Agent Starting Run: pm0s9pp8 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.004392745822577008
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▅▅▆▇▇▇█
regret,▁

0,1
avg_scores,215.35644
regret,123563.91147


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 0pzt2hmy with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0007067016081231835
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▃▅▄▅▄▄▅▄▅▅▇▇▇▇▆▇▇▇▇▇▇▇▇▆▆▆▇▇▆▆▅▅▅▆▇████
regret,▁

0,1
avg_scores,37.90099
regret,132841.27597


[34m[1mwandb[0m: Agent Starting Run: kqa0lit9 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0034208128633492927
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▃█▅▄▃▂▂▁▁▂▂▁▁▁▁▃▃▄▄▄▅▅▅▅▅▅▅▅▄▃▃▂▂▂▂▂▁▁▁▁
regret,▁

0,1
avg_scores,16.0495
regret,136817.7193


[34m[1mwandb[0m: Agent Starting Run: xmjzbkay with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0012048920642783025
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▂▁▂▃▃▃▄▅▇▇▇▇▆▆▆▆▆▇▇▇▆▅▅▅▅▅▅▅▅▆▆▆▆▇▇▇▇▇▇█
regret,▁

0,1
avg_scores,33.60396
regret,134490.51319


[34m[1mwandb[0m: Agent Starting Run: 09nze2re with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.009484705365668797
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▂▂▂▁▁▁▂▂▂▂▃▃▃▄▄▅▅▅▅▆▆▆▇▇██▇▇▆▆▅▅▅▄
regret,▁

0,1
avg_scores,193.34653
regret,88365.34076


[34m[1mwandb[0m: Agent Starting Run: 0xirdvgf with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0037978013900060816
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▄▇█▆▆▅▅▇▆▅▅▅▄▄▄▃▃▃▂▂▂▁▁▁▁▁▁▁▂▂▃▄▄▅▆▆▇▇▇▇
regret,▁

0,1
avg_scores,21.38614
regret,137920.96385


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: g8l1c435 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0016371147963022904
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▅▆█▆▆█▆▆▅▅▄▄▄▄▃▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.41584
regret,138272.76778


[34m[1mwandb[0m: Agent Starting Run: wf6ad0p6 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0010019564907082555
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▄▄▃▄▃▃▃▃▃▃▃▃▃▃▃▃▃▄▄▄▄▄▃▃▃▃▃▃▂▂▂▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,16.73267
regret,134060.63225


[34m[1mwandb[0m: Agent Starting Run: 0zs4qzwj with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.008170818554640882
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▂▃▄▅▅▅▅▅▆▇▇████▇▇▇███▇▆▅▅▅▅▆▆▆▆▆▆▆▇██
regret,▁

0,1
avg_scores,75.28713
regret,124921.27296


[34m[1mwandb[0m: Agent Starting Run: ouedakya with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.007963880384832136
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▆█▇▅▄▄▃▃▃▃▂▂▂▂▂▁▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139040.14902


[34m[1mwandb[0m: Agent Starting Run: ckspqfcf with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.002868510997460331
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▃▃▅▄▅▇█▇▇▆▆▆▆▆▆▅▅▅▄▃▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,136921.64993


[34m[1mwandb[0m: Agent Starting Run: w5rydmxb with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.009983141577719772
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▅▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.35644
regret,139311.88569


[34m[1mwandb[0m: Agent Starting Run: qegg2d87 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0021610923553000154
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▇▄▄▄▃▃▃▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.35644
regret,138859.46243


[34m[1mwandb[0m: Agent Starting Run: skg8fcoh with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.004461389991929581
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▆█▆▅▅▅▄▄▄▃▃▃▃▃▃▂▂▂▁▁▁▁▁▁▁▂▂▁▁▂▂▂▂▂▂▂▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139593.51909


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 0mlijjzk with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.007497028246316635
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▃▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139381.11047


[34m[1mwandb[0m: Agent Starting Run: cj93ql3u with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0024584982735876685
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▃▂▁▁▂▃▄▄▅▅▆▆▆▆▆▆▇▆▆▆▅▅▅▄▄▅▆▆▆▆▆▆▇▇▇█▇█▇
regret,▁

0,1
avg_scores,32.85149
regret,134032.1744


[34m[1mwandb[0m: Agent Starting Run: ma7t26hb with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.004595539246825281
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▂▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▄▄▆▇█
regret,▁

0,1
avg_scores,214.59406
regret,121348.23406


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 2jye0v33 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0069744243331273
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▃▂▇█▆▅▅▄▄▃▃▃▃▃▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.37624
regret,139263.14486


[34m[1mwandb[0m: Agent Starting Run: m51kcvla with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.005965549265112954
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▄▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139673.16389


[34m[1mwandb[0m: Agent Starting Run: 5j2hkvqa with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.005739515617303861
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▂▂▂▂▂▃▃▃▃▃▃▃▃▃▄▄▄▄▄▄▄▄▅▆███▇▇▇▆▆▆▆▆▅▃▂▁▁
regret,▁

0,1
avg_scores,9.42574
regret,115845.45601


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: zpwpix9y with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.002179925564734639
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▅██▇█▇▆▅▄▄▄▄▄▃▃▄▄▄▄▄▄▄▄▄▄▄▄▄▂▁▁▁▁▁▁▁▁▂▂▂
regret,▁

0,1
avg_scores,16.40594
regret,136423.97507


[34m[1mwandb[0m: Agent Starting Run: 0rg1ixrx with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.007298489428637275
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▄█▆▅▆▅▄▄▃▃▃▃▃▃▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139354.50982


[34m[1mwandb[0m: Agent Starting Run: bs0zrbom with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0015692563226060836
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▂▂▂▂▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▅▅▆▆▆▆▇▇███
regret,▁

0,1
avg_scores,63.78218
regret,131259.76636


[34m[1mwandb[0m: Agent Starting Run: ro9twezw with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0036327157610307743
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▄▄▅▅▆▇█
regret,▁

0,1
avg_scores,201.06931
regret,125116.53292


[34m[1mwandb[0m: Agent Starting Run: 02xenelm with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.004428527966560021
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▆▆▆▆▆▇▇█
regret,▁

0,1
avg_scores,191.66337
regret,119510.75375


[34m[1mwandb[0m: Agent Starting Run: 5tx0n132 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0031393516595627138
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▄▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▂▃▄▄▄▄▄▄▅▅▅▆▆▆▄▃▃▃▃▃▃▃▂
regret,▁

0,1
avg_scores,12.18812
regret,138556.3642


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 1wvvqac5 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.005206862185642037
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▃▄▃▂▃▄▄▅▅▅▅▅▆▆███▇▇▇▆▆▆▅▅▄▃▁▁▁▁▁▁▁▁▂▂▂▃▃
regret,▁

0,1
avg_scores,14.76238
regret,137532.05965


[34m[1mwandb[0m: Agent Starting Run: 3ouf01mr with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.002240771890167816
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01128888888876342, max=1.0)…

VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▇▅▆▅▅▅▄▄▅▅▅▅▅▅▅▄▄▄▄▄▄▃▃▂▂▁▁▁▁▁▁▁▁▁▂▂▂▂▂
regret,▁

0,1
avg_scores,15.60396
regret,134802.66683


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 9f6bv8kf with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.006017425887659266
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,██▅▄▃▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139356.2632


[34m[1mwandb[0m: Agent Starting Run: v355lo97 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0007496955926466867
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▂▁▁▁▂▂▃▃▃▃▃▃▃▃▃▄▄▄▄▄▄▄▄▅▅▅▅▅▅▅▆▆▆▇▇▇▇▇██
regret,▁

0,1
avg_scores,35.82178
regret,134583.21459


[34m[1mwandb[0m: Agent Starting Run: gjvfogxp with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.007515572872793128
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▃▃▃▂▂▂▃▃▃▄▄▅▅▆▆▇████▇▇▇▆▅▅▅▅▄▃▃▃▄▄▆▇▇
regret,▁

0,1
avg_scores,50.36634
regret,131272.66779


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: fk6tjioq with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.006392770812443366
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▄▃▅▄▆█▇▆▆▅▅▆▆▆▆▆▅▅▄▃▄▃▃▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,138809.34372


[34m[1mwandb[0m: Agent Starting Run: a0boky7m with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.008811792967267234
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▄▃▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139619.41693


[34m[1mwandb[0m: Agent Starting Run: n1g4t4hn with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.002660112768535982
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19536268212439292, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▂▂▂▂▂▂▃▃▃▃▄▄▄▅▅▅▅▅▅▅▅▅▅▅▅▄▄▄▅▆▇▇▇█
regret,▁

0,1
avg_scores,110.72277
regret,126739.00639


[34m[1mwandb[0m: Agent Starting Run: bb54z74b with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0054728007303826865
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▄▄▄▄▅▅▆▆▇▇██
regret,▁

0,1
avg_scores,296.9802
regret,114408.20732


[34m[1mwandb[0m: Agent Starting Run: q4pz2uyz with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.007871335941926806
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19542391474690488, max=1.…

0,1
avg_scores,▇▇▄▃▃▂▃▅▆▆▅▅▅▆▆▇▇████▇▆▇▇▇▆▅▅▅▄▄▃▃▃▂▂▂▁▁
regret,▁

0,1
avg_scores,10.23762
regret,137045.80644


[34m[1mwandb[0m: Agent Starting Run: qg9qiqlr with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0044053429577168126
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19542391474690488, max=1.…

0,1
avg_scores,█▇▄▄▄▃▃▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▃
regret,▁

0,1
avg_scores,10.25743
regret,139540.13133


[34m[1mwandb[0m: Agent Starting Run: 03up2e3d with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.009813070405371743
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▁▁▁▁▁▁▁▁▂▂▂▂▃▃▄▅▅▆▆▆▆▇▇████▇▇▇▇▇███▇▇▇▇▇
regret,▁

0,1
avg_scores,186.92079
regret,105688.46277


[34m[1mwandb[0m: Agent Starting Run: l3lklmmc with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0064712028384463095
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19529780564263322, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▄▄▅▅▅▆▆▇▇▇███
regret,▁

0,1
avg_scores,409.26733
regret,97915.83803


[34m[1mwandb[0m: Agent Starting Run: fouddt7b with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.009662971816398178
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▄▅▆▇▇████▇
regret,▁

0,1
avg_scores,242.32673
regret,116924.55207


[34m[1mwandb[0m: Agent Starting Run: 1veh248l with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0040496122171101686
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19520601597994675, max=1.…

0,1
avg_scores,▁▁▁▁▂▂▂▂▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▂▂▃▃▃▃▃▂▃▄▅▆▇█
regret,▁

0,1
avg_scores,204.84158
regret,125380.14628


[34m[1mwandb[0m: Agent Starting Run: rd8xkxkn with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0027531968998444367
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19533208020050125, max=1.…

0,1
avg_scores,▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▂▃▃▄▄▄▄▄▄▄▄▄▅▅▆▇█▇▇▇▇███
regret,▁

0,1
avg_scores,181.24752
regret,115183.99606


[34m[1mwandb[0m: Agent Starting Run: 0jq7avgu with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0029407001643807443
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▃▃▃▄▄▄▄▄▄▄▅▅▅▆▇▇█
regret,▁

0,1
avg_scores,220.72277
regret,120209.95225


[34m[1mwandb[0m: Agent Starting Run: 2cahwo36 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.008637082509563103
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▄▄▄▅▅▆▇▇██████▇▇▇▆▅▅▅▅
regret,▁

0,1
avg_scores,78.65347
regret,120916.58263


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: kfzhmv5f with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.009607166023301576
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▃▃▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139098.2101


[34m[1mwandb[0m: Agent Starting Run: dynuoeny with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.006338618814869905
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▄▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,11.35644
regret,138672.69879


[34m[1mwandb[0m: Agent Starting Run: 1s59s6c9 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.008631442187839535
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19542391474690488, max=1.…

0,1
avg_scores,▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▄▄▅▅▅▅▆▆▇▇█████▇▇▇▇▇▇▇▆▆
regret,▁

0,1
avg_scores,114.13861
regret,117569.35175


[34m[1mwandb[0m: Agent Starting Run: hwcl0kp7 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.003617790622618096
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▂▂▂▂▂▂▃▄▄▄▄▅▅▅▅▅▅▅▆▆▅▆▆▇███▇▇▇▇▆▆▅▅▄▃▂▁▁
regret,▁

0,1
avg_scores,9.39604
regret,137394.31433


[34m[1mwandb[0m: Agent Starting Run: 7q5d7yk2 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.008442438481702721
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01128888888876342, max=1.0)…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▄▂▂▅▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▁▁▁
regret,▁

0,1
avg_scores,9.47525
regret,139549.98701


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 7t0oxswz with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.00868652909797042
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▃▃▇▆█▇▆▆▅▅▅▅▅▅▅▄▄▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139143.01269


[34m[1mwandb[0m: Agent Starting Run: 300uja4o with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.008972526546852677
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▃▄▅▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂
regret,▁

0,1
avg_scores,9.41584
regret,139593.76639


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: xif6ibdc with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.004807526646874359
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▂▂▂▂▃▃▄▄▄▅▅▆▆▇████▇▇▆▆▆▆▅▄▃▂▂▁▁▂
regret,▁

0,1
avg_scores,34.73267
regret,111910.56627


[34m[1mwandb[0m: Agent Starting Run: 3wsdq6vu with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.005140822195371239
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19520601597994675, max=1.…

0,1
avg_scores,▁▁▁▁▂▂▂▃▃▄▄▄▄▅▅▆▇▇▇███████▇▇▆▆▆▆▇▇▇▆▆▆▇█
regret,▁

0,1
avg_scores,104.29703
regret,121038.16314


[34m[1mwandb[0m: Agent Starting Run: jmvwqykq with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0004259065049031786
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▂▂▁▁▂▂▃▃▃▃▄▄▄▄▄▄▅▆▆▇▇████▇███▇▇▆▅▅▅▄▅▅▅▄
regret,▁

0,1
avg_scores,28.08911
regret,133292.04815


[34m[1mwandb[0m: Agent Starting Run: q5mi6yni with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.001265046618224674
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▄▅▆▅▇▇▇▇▇▇▇████▇▇▆▆▅▅▅▄▄▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.85149
regret,137722.48575


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 71380zmj with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.008445538491211919
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▇▄▄▃▃▃▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139586.7633


[34m[1mwandb[0m: Agent Starting Run: o0x2yie6 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.003578615509754604
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▄▄▅▆▆▆▆▆▆▇▇▇▇██
regret,▁

0,1
avg_scores,187.19802
regret,117114.17613


[34m[1mwandb[0m: Agent Starting Run: s97s7i18 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.008054879058409695
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▃▄▄▆▆▆▆▆▆▆▆██▇▇
regret,▁

0,1
avg_scores,128.46535
regret,122334.19721


[34m[1mwandb[0m: Agent Starting Run: 0xy61ssi with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.007309585615778597
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19533208020050125, max=1.…

0,1
avg_scores,▁▁▁▁▁▂▂▃▃▄▄▅▆▆▆▆▆▆▆▇▇▇▇▇▆▄▄▅▅▅▅▅▅▅▅▅▆▆▇█
regret,▁

0,1
avg_scores,115.18812
regret,119206.17628


[34m[1mwandb[0m: Agent Starting Run: hgpsauk6 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.002851625214333008
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▄▄▄▅▅▅▅▆▆▇████
regret,▁

0,1
avg_scores,191.18812
regret,119211.6951


[34m[1mwandb[0m: Agent Starting Run: p3xfzzdt with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.00554249622901733
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▃▄▄▄▅▅▆▆▇██████
regret,▁

0,1
avg_scores,247.86139
regret,110852.8757


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 808sxiq1 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0030388101774079016
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19545454545454546, max=1.…

0,1
avg_scores,█▆▇▆▅▄▄▃▃▃▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,138742.36788


[34m[1mwandb[0m: Agent Starting Run: f9yr440e with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.00988088942437981
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▅▇█████████▇▇▆▄▃
regret,▁

0,1
avg_scores,43.14851
regret,125486.7497


[34m[1mwandb[0m: Agent Starting Run: rx2b84f3 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.008837518630311816
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▄▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139663.79874


[34m[1mwandb[0m: Agent Starting Run: 6f888ezt with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.003787899979847084
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139457.39642


[34m[1mwandb[0m: Agent Starting Run: bwv9el5l with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.004813533238281616
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▄▄▅▆▆▇███████▇▇▇▇▇▇▇
regret,▁

0,1
avg_scores,276.13861
regret,95532.73141


[34m[1mwandb[0m: Agent Starting Run: jetiqr65 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0007994114088578846
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▁▁▁▂▃▄▅▅▅▅▅▆▆▆▇███▇▇▇▇█▇▆▆▅▄▃▃▂▂▂▂▂▁▁▂▂▂
regret,▁

0,1
avg_scores,20.20792
regret,133655.50767


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: ppgy3yx3 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.009204838067283134
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19542391474690488, max=1.…

0,1
avg_scores,▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▄▄▆▆▆▆▆▆▇██████▇▆▆▆▇▇▇▇▆▆
regret,▁

0,1
avg_scores,127.19802
regret,113006.7151


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: kevqzajk with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0058525296369523515
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▁▂▂▃▃▃▃▂▂▂▂▂▂▂▃▃▄▅▆▆▇▇▇▇███▇▇▇▇▆▅▅▅▄▄▄▄▄
regret,▁

0,1
avg_scores,19.23762
regret,136309.21157


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: t4fqs3l1 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.002238258111552105
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19542391474690488, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▆▆▆▆▆▆▆▇▇███
regret,▁

0,1
avg_scores,362.87129
regret,97681.75674


[34m[1mwandb[0m: Agent Starting Run: wc7kkmek with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.009094707019478943
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▂▁▃▂▂▂▂▂▂▂▂▃▂▂▂▂▂▂▃▃▄▃▄▄▄▅▅▆▆▇██████▇▇▇█
regret,▁

0,1
avg_scores,61.0198
regret,130308.98281


[34m[1mwandb[0m: Agent Starting Run: legavf4m with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.008525878590657196
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▇▅▃▃▃▃▃▄▄▄▄█▇▇▇▇▆▆▆▆▅▅▅▅▁▁▁▁▁▁▁▁▂▂▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.35644
regret,139459.01899


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: tkqgzjsd with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0070833533824348665
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.2006758931445124, max=1.0…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▃▃▃▄▅▅▅▆▆▇▇▇██████▇▇▇
regret,▁

0,1
avg_scores,408.9802
regret,81427.64918


[34m[1mwandb[0m: Agent Starting Run: io9esyq1 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.009780755524732648
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19545454545454546, max=1.…

0,1
avg_scores,█▇▄▃▃▂▂▂▃▃▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,138754.21392


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: j7i5yoeb with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0074645274548936
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01128888888876342, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▅▄▃▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,138552.66333


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: ev6goz7y with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.008969584680609238
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▇▅▅██▇▆▅▅▄▄▄▃▃▃▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,138729.86752


[34m[1mwandb[0m: Agent Starting Run: kg0sfzoc with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.000801515238508375
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▁▁▂▂▂▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▄▄▄▅▅▅▅▆▆▇▇██
regret,▁

0,1
avg_scores,53.58416
regret,132717.55993


[34m[1mwandb[0m: Agent Starting Run: ptr94zaa with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0006390082061284547
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▃▂▂▁▁▁▁▁▁▁▂▂▂▂▂▃▃▄▄▄▅▅▆▆▆▆▆▆▆▆▆▆▆▇▇▆▆▆
regret,▁

0,1
avg_scores,24.92079
regret,136602.0099


[34m[1mwandb[0m: Agent Starting Run: 0k3mjt9n with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.00942331545407088
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1952671994985112, max=1.0…

0,1
avg_scores,▁▁▂▂▃▃▃▃▃▃▃▃▃▃▃▃▃▄▄▅▅▆▇▇▇▇▇▆▆▆▆▅▅▅▅▆▆▇▇█
regret,▁

0,1
avg_scores,101.17822
regret,124298.99959


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 1kuom158 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.006682050914865312
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▆▅▄▄▃▃▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.38614
regret,139444.25267


[34m[1mwandb[0m: Agent Starting Run: zhsyt0e7 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.003711480635936455
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅█▆▅▅▅▅▄▄▄▄▄▃▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▃▃▄
regret,▁

0,1
avg_scores,16.06931
regret,138294.08039


[34m[1mwandb[0m: Agent Starting Run: n21eurds with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.008982332179890638
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19542391474690488, max=1.…

0,1
avg_scores,█▇▄▄▃▃▃▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139589.91299


[34m[1mwandb[0m: Agent Starting Run: 67vgu98t with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0043934816376723865
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01128888888876342, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▄▃▂▂▂▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▂▂
regret,▁

0,1
avg_scores,19.73267
regret,136525.63882


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: i155q3u5 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.005812657018547666
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▃▂▂▁▁▁▁▂▂▂▃▄▅▅▅▅▅▅▅▅▅▅▄▄▃▂▂▃▃▄▄▅▆▆▇█████
regret,▁

0,1
avg_scores,17.31683
regret,138497.3378


[34m[1mwandb[0m: Agent Starting Run: 1wv9aowi with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0007155634265115121
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19533208020050125, max=1.…

0,1
avg_scores,▂▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▇▇██
regret,▁

0,1
avg_scores,96.36634
regret,128038.05137


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: z8iveep4 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.005054313560037875
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▂▂▂▃▃▃▃▄▄▅▆▆▇▇▇██████▇▇▇▇▇▇▇▆▆▅▅▅
regret,▁

0,1
avg_scores,173.34653
regret,92579.31872


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: uaeow4cj with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.006352725170733846
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▂▂▂▂▂▂▂▃▃▃▄▄▄▄▄▄▄▅▅▅▅▅▅▅▅▆▆▆▆▆▇▇███▇▇▆
regret,▁

0,1
avg_scores,122.81188
regret,114304.37342


[34m[1mwandb[0m: Agent Starting Run: rbgtgbwt with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.003763020722647558
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▇▄▃▂▂▂▂▂▃▃▂▂▂▁▁▁▂▄▅▅▆▆▇███████▇▆▆▆▄▄▅▅▇█
regret,▁

0,1
avg_scores,19.87129
regret,137421.9185


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: tbqsw8ky with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.00907537357484407
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19542391474690488, max=1.…

0,1
avg_scores,▁▁▁▁▂▂▂▂▃▃▃▃▄▅▅▅▅▅▅▅▅▅▅▅▅▅▄▄▅▅▅▆▆▇▇▇▇███
regret,▁

0,1
avg_scores,130.68317
regret,119604.13034


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: psuokrth with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.001825758367330987
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▅▅▆▆▆▇▇██
regret,▁

0,1
avg_scores,256.31683
regret,117545.24074


[34m[1mwandb[0m: Agent Starting Run: tkhvvur7 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0023830690677128564
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▅▅▅▆▇▇███
regret,▁

0,1
avg_scores,130.44554
regret,128382.54573


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: g13ny7hk with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.005492294108251141
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▅█▅▃▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139632.03556


[34m[1mwandb[0m: Agent Starting Run: sl3uefl3 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.00428634328295296
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▄▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139195.69635


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: dxcmpebi with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.008973377757682678
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19542391474690488, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▁▂▂▂▂▂▂▃▃▄▅▅▅▅▅▄▄▄▄▄▄▃▂▂▂▂▃▄▄▅▆▇██
regret,▁

0,1
avg_scores,223.26733
regret,117146.86531


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: wncqno4j with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.00425222136059881
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▁▁▁▂▂▂▃▃▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▄▄▄▄▄▃▃▃▃▄▄▄▄▄▆▇█
regret,▁

0,1
avg_scores,71.07921
regret,132554.44215


[34m[1mwandb[0m: Agent Starting Run: 9fyrzt15 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.00997928165747363
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▆▄▄▃▅██▇▇▆▆▅▅▅▄▄▄▄▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,138967.48395


[34m[1mwandb[0m: Agent Starting Run: z3g2ufjy with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.004531092665912529
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19529780564263322, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▃▃▄▄▄▄▄▅▅▅▅▆▆▅▅▅▅▅▆▇▇▇███
regret,▁

0,1
avg_scores,283.40594
regret,103566.20348


[34m[1mwandb[0m: Agent Starting Run: 00vqi9et with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.008561838180638935
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▄▄▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,138948.64806


[34m[1mwandb[0m: Agent Starting Run: mv0o9lhw with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0014089638061245873
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19536268212439292, max=1.…

0,1
avg_scores,▂▂▂▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▃▄▄▄▄▄▄▄▄▄▄▅▄▅▅▅▆▆▇▇█
regret,▁

0,1
avg_scores,60.59406
regret,132568.14829


[34m[1mwandb[0m: Agent Starting Run: l8v645bc with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.00671186739376011
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▇▄▄▄▄▃▃▄▄▄▃▄▄▃▃▃▃▂▂▂▂▂▂▁▁▁▁▁▁▂▂▂▃▃▃▃▃▃▂
regret,▁

0,1
avg_scores,15.63366
regret,137527.75339


[34m[1mwandb[0m: Agent Starting Run: 0h5ledya with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0066035301343964296
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19545454545454546, max=1.…

0,1
avg_scores,▇█▆▆▆▅▄▄▄▃▃▃▃▃▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.46535
regret,139191.87499


[34m[1mwandb[0m: Agent Starting Run: q7kk8qtf with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.004601919967175708
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▄▄▄▄▄▄▄▄▄▄▄▄▄▅▅▆█████▇▇▇
regret,▁

0,1
avg_scores,113.59406
regret,124752.01538


[34m[1mwandb[0m: Agent Starting Run: 663s8tad with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0015829397305661631
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▂▂▁▂▃▄▅▅▆▆▆▇██▇▇▇▇▆▆▆▅▅▄▃▂▂▂▂▂▃▃▃▃▄▄▃▃▃▃
regret,▁

0,1
avg_scores,23.61386
regret,134679.12235


[34m[1mwandb[0m: Agent Starting Run: 54t0pnou with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.004496220656318507
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01128888888876342, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▄▄▅▅▅▅▆▆▆▇▇███▇
regret,▁

0,1
avg_scores,285.26733
regret,108099.21063


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: o93pq8g5 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.007166047226512027
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▂▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▄▄▄▄▅▆█████▇▇▇▇▆▆▅▄▂▃▄▄
regret,▁

0,1
avg_scores,92.62376
regret,113639.79701


[34m[1mwandb[0m: Agent Starting Run: rk4cdkgb with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0036033295132389337
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▅▅▅▅▅▅▆▆▆▇▇████
regret,▁

0,1
avg_scores,161.72277
regret,121115.39443


[34m[1mwandb[0m: Agent Starting Run: bx95o78h with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.002994546469965442
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▂▂▂▂▂▂▂▃▃▃▄▄▄▄▅▅▅▅▅▅▄▄▄▃▃▃▄▄▅▆▇▇▇▇██
regret,▁

0,1
avg_scores,199.66337
regret,112669.65669


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: kxxxccau with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.006165136881539584
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
[34m[1mwandb[0m: W&B API key is configured. Use [1m`wandb login --relogin`[0m to force relogin


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▃▃▃▄▄▅▅▅▆▆▆▇▇▇▇▇▇▇▇███
regret,▁

0,1
avg_scores,393.65347
regret,89166.7599


[34m[1mwandb[0m: Agent Starting Run: i1r9ksjt with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0019983820226059526
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▅▆▄▃▃▄▅▇█▇▇▇▆██▇▇▇▇▆▅▅▄▄▃▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,138783.50616


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: fo1wtft1 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0012008121315794772
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19536268212439292, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▃▃▄▄▅▆▆▇▇▇▇▇▇▇▇▇▇████
regret,▁

0,1
avg_scores,188.55446
regret,113823.06066


[34m[1mwandb[0m: Agent Starting Run: d18n9gop with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.005261144942769551
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▄█▅▃▃▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.45545
regret,139410.1253


[34m[1mwandb[0m: Agent Starting Run: azcmzhx7 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0018276993577680631
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19536268212439292, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▄▄▄▄▅▅▆▆▇▇█
regret,▁

0,1
avg_scores,138.43564
regret,127427.48074


[34m[1mwandb[0m: Agent Starting Run: sh04ls12 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.003681196613608402
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1952671994985112, max=1.0…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▃▃▃▃▄▄▅▆▇▇▇██
regret,▁

0,1
avg_scores,135.50495
regret,131033.80576


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: v40mjfwf with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.007043390841409152
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.000 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▃▄▁▁▂▂▂▂▂▂▄▄▄▄▄▄▅▅▄▅▅▅▅▅▄▄▆▆▇▇▇▇▇▇▇▆▆▆▆
regret,▁

0,1
avg_scores,9.68317
regret,139638.86477


[34m[1mwandb[0m: Agent Starting Run: px3q3r65 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.005123576655315089
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01128888888876342, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▁▁▁▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▅▅▅▆▆▇▇██████▇▇▇▆▆▇▇▇
regret,▁

0,1
avg_scores,238.74257
regret,97598.41577


[34m[1mwandb[0m: Agent Starting Run: foqafngs with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0052527806748199485
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▇▄▇█▆▅▅▄▄▃▃▃▃▃▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.33663
regret,139299.55158


[34m[1mwandb[0m: Agent Starting Run: 0g85im5b with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.005674043186843707
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▄▄▅▅▆▆▆▆▆▆▇▇█████
regret,▁

0,1
avg_scores,205.9802
regret,112102.06296


[34m[1mwandb[0m: Agent Starting Run: gnamyr7u with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.005383534836247951
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▅▅▅▆███▇▇▇▇█
regret,▁

0,1
avg_scores,179.16832
regret,120430.06119


[34m[1mwandb[0m: Agent Starting Run: d2c4zqs9 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0022723873357498453
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19536268212439292, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▃▃▃▃▄▄▄▄▄▄▄▄▅▅▅▅▆▆▆▇▇███
regret,▁

0,1
avg_scores,378.0396
regret,96636.52162


[34m[1mwandb[0m: Agent Starting Run: 53l3yd58 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.00845320551352564
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▂▂▃▃▃▄▄▄▄▄▅▅▆▇████████▇▇▇▆▅▅▅▄▄▄▄▄▄▄▄
regret,▁

0,1
avg_scores,48.91089
regret,124874.28884


[34m[1mwandb[0m: Agent Starting Run: q195bw04 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0055888586498053176
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▄▃▃▃▃▃▅▆█▇▇▆▆▆▆▅▅▅▅▄▄▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,138916.25619


[34m[1mwandb[0m: Agent Starting Run: yxiy3emw with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0007479824276874249
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▂▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▅▅▆▆▇█
regret,▁

0,1
avg_scores,84.89109
regret,128070.14709


[34m[1mwandb[0m: Agent Starting Run: 51wv5xc6 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.006541107890594561
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▄▅▅▆▆▇███████▇▇▇▇▇▆▆▆▆▆▆
regret,▁

0,1
avg_scores,130.22772
regret,113719.88466


[34m[1mwandb[0m: Agent Starting Run: 36m1omxb with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0029749018265052404
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19501489261639757, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▄▄▄▄▄▅▅▅▅▅▅▅▆▆▇▇██
regret,▁

0,1
avg_scores,209.16832
regret,117051.19157


[34m[1mwandb[0m: Agent Starting Run: ysp1lx2e with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.002969552983565494
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▃▁▁▃▃▄▄▄▃▃▃▃▃▂▂▃▃▃▃▃▃▃▃▃▃▃▃▃▃▄▄▅▇█████▇▇
regret,▁

0,1
avg_scores,27.10891
regret,136411.84781


[34m[1mwandb[0m: Agent Starting Run: hpaerbe6 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.005929625740115542
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▄▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▄▄▆▆▆▆▆▇▇▇▇██▆▆▅▅▅▆
regret,▁

0,1
avg_scores,14.90099
regret,138658.31178


[34m[1mwandb[0m: Agent Starting Run: qsz712as with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.008691591579119381
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19551583568516775, max=1.…

0,1
avg_scores,▅▅█▆▅▅▄▄▃▃▃▃▃▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.41584
regret,139154.53165


[34m[1mwandb[0m: Agent Starting Run: 59kfwipv with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.006415560089160219
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▃▃▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▃▃▃▃▃▃
regret,▁

0,1
avg_scores,11.11881
regret,139469.34295


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: dzasq35o with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.007687391974918398
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19545454545454546, max=1.…

0,1
avg_scores,█▅▃▂▂▂▂▂▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▄▅████▇▇▇▇▇▆▆▆▄▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139036.37186


[34m[1mwandb[0m: Agent Starting Run: 1lu5ko42 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.009418867580779476
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▃▃▃▃▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139612.81746


[34m[1mwandb[0m: Agent Starting Run: 0tpgfndf with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.00097726286091197
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▂▁▁▁▁▁▂▂▂▂▁▂▂▂▂▃▃▃▃▃▄▄▄▅▅▅▅▅▅▅▅▆▆▆▆▇▇▇█
regret,▁

0,1
avg_scores,41.37624
regret,134702.80143


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: w5tywr3e with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.007235379393605523
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19545454545454546, max=1.…

0,1
avg_scores,█▄▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂
regret,▁

0,1
avg_scores,11.22772
regret,139287.8436


[34m[1mwandb[0m: Agent Starting Run: mcug6qfa with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0050751793741151945
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▃▃▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂
regret,▁

0,1
avg_scores,9.43564
regret,139680.38632


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: ud31iz59 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0059189143547478075
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19520601597994675, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▄▄▅▅▅▆▆▇▇▇███
regret,▁

0,1
avg_scores,255.53465
regret,113275.95581


[34m[1mwandb[0m: Agent Starting Run: 9zondao9 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.006903764270659283
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▃▄▅▅▅▆▆▇▇█
regret,▁

0,1
avg_scores,415.89109
regret,107251.85408


[34m[1mwandb[0m: Agent Starting Run: b6fyb7qz with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.009044678126568995
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▆▇▆▄▄▃▃▃▂▂▂▂▂▂▁▁▁▂▂▂▂▂▂▂▂▂▂▂▃▄▄▄▅▅▆▇███▇
regret,▁

0,1
avg_scores,17.08911
regret,138752.84292


[34m[1mwandb[0m: Agent Starting Run: mf6km06b with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.007899558223617835
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▄▂▂▁▁▁▁▁▂▂▂▂▃▃▄▄▄▄▄▄▄▅▄▄▄▄▃▂▂▂▃▂▃▂▂▂▂▁▁
regret,▁

0,1
avg_scores,10.63366
regret,138879.60105


[34m[1mwandb[0m: Agent Starting Run: qqf6a8rt with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0034743521306950156
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1952671994985112, max=1.0…

0,1
avg_scores,▁▁▁▁▁▁▂▂▃▄▄▅▆▅▆▆▆▇▇▇▇▇▇▇▇▆▇█████████▇▇▆▅
regret,▁

0,1
avg_scores,23.9802
regret,134948.64366


[34m[1mwandb[0m: Agent Starting Run: 7im7ipmk with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.00638518376691247
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19548518576579402, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▄▄▅▆▆▇██
regret,▁

0,1
avg_scores,345.59406
regret,113364.79893


[34m[1mwandb[0m: Agent Starting Run: f2agrw9t with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.002672253046710576
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▂▁▂▂▁▁▂▂▁▁▁▁▂▂▂▂▁▂▂▁▁▁▁▂▄▃▄▅▆▆▆▆▆███▇▆▅▄
regret,▁

0,1
avg_scores,25.60396
regret,135344.00538


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 26elsjxh with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.002682501444143848
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▄▄▄▃▂▂▄▆▇▇▇███▇▇▇▇▇▅▅▃▃▃▁▁▁▂▂▂▃▃▃▃▃▃▃▃▃▃
regret,▁

0,1
avg_scores,18.87129
regret,135984.85937


[34m[1mwandb[0m: Agent Starting Run: e1z630eo with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0051294032797665964
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▆█▅▄▄▆▆▆▅▅▄▄▄▄▃▃▃▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.44554
regret,138899.07461


[34m[1mwandb[0m: Agent Starting Run: vz1yfgm7 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0039343759140126715
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19530148786217696, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▂▂▂▂▃▄▅▆▇▇▇▇▇▇▇███▇
regret,▁

0,1
avg_scores,167.84158
regret,115207.13571


[34m[1mwandb[0m: Agent Starting Run: q6nraug9 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.006374622431725384
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.20061181774271453, max=1.…

0,1
avg_scores,▁▁▂▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▅▇█████▇▇▇███▇▆▆▇▇
regret,▁

0,1
avg_scores,133.09901
regret,116605.45972


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: hd40mglm with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0032510762409657472
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▄▄▄▄▄▄▄▄▅▅▅▅▆▆▆▆▇▇██
regret,▁

0,1
avg_scores,411.15842
regret,93592.25667


[34m[1mwandb[0m: Agent Starting Run: fhw7mb6d with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.009335071884442044
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19545454545454546, max=1.…

0,1
avg_scores,█▄▄▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139564.7494


[34m[1mwandb[0m: Agent Starting Run: 1f1nylrz with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.009666646745329854
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▂▂▂▃▃▄▄▄▄▄▅▅▆▇███▇▆▆▆▅▅▅▄▄▃▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.76238
regret,114245.85222


[34m[1mwandb[0m: Agent Starting Run: unntdho8 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.005819077734038537
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19545454545454546, max=1.…

0,1
avg_scores,█▄▆▅▄▃▃▃▃▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139431.28908


[34m[1mwandb[0m: Agent Starting Run: wb0vpbdi with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.00838913154428669
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19538968166849616, max=1.…

0,1
avg_scores,▆▆█▆▅▄▄▃▃▃▃▃▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▃▆▆▆▆▆
regret,▁

0,1
avg_scores,12.29703
regret,139332.98259


[34m[1mwandb[0m: Agent Starting Run: 97f9ysk0 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.009844415807770596
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▆█▅▄▃▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139197.37714


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: kqcfwl7b with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.007596615701678207
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.20074050225370252, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▄▅▆▇▇▇███████▇▇▆▆▆▇
regret,▁

0,1
avg_scores,198.0099
regret,106935.53273


[34m[1mwandb[0m: Agent Starting Run: j1u7dcqz with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0006515563279298372
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19542391474690488, max=1.…

0,1
avg_scores,▅▅▃▂▁▁▁▁▂▂▁▂▁▁▁▁▁▁▁▂▁▂▂▃▃▄▅▇▇▇▇███▇▆▆▅▄▃
regret,▁

0,1
avg_scores,20.18812
regret,136319.88757


[34m[1mwandb[0m: Agent Starting Run: c2e4894x with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0063345455832759905
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.195141065830721, max=1.0)…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▄▃▃▃▃▄▄▄▅▆▆▆▆▆▇▇█
regret,▁

0,1
avg_scores,341.40594
regret,106991.93859


[34m[1mwandb[0m: Agent Starting Run: pagijcy6 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0031391356280010964
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▃▄▄▄▄▄▄▅▅▆▇█
regret,▁

0,1
avg_scores,128.43564
regret,128419.05707


[34m[1mwandb[0m: Agent Starting Run: josiau9b with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.002464725955403844
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▄▄▄▄▅▅▆▇▇█
regret,▁

0,1
avg_scores,269.55446
regret,118416.57459


[34m[1mwandb[0m: Agent Starting Run: ae1k45hp with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0005927455323758088
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▄▂▁▁▁▁▂▃▄▄▄▄▄▃▃▃▃▃▃▄▃▃▃▃▃▃▄▅▆▆▆▆▆▅▆▇▇▇██
regret,▁

0,1
avg_scores,56.45545
regret,130456.74929


[34m[1mwandb[0m: Agent Starting Run: fuykygma with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.007127943812312918
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19542391474690488, max=1.…

0,1
avg_scores,▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▄▄▅▅▅▅▆▆▇▇███
regret,▁

0,1
avg_scores,445.15842
regret,92934.97826


[34m[1mwandb[0m: Agent Starting Run: v7nq47u8 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.005296267480680701
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19542391474690488, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▄▄▄▅▅▅▆▆▆▇█████▇▇▇▇▇▇
regret,▁

0,1
avg_scores,215.15842
regret,105978.15695


[34m[1mwandb[0m: Agent Starting Run: hzqxn61k with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.004597126467412844
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19523660294578501, max=1.…

0,1
avg_scores,▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▄▅▆▇████████▇▇▅▅▃▁▁
regret,▁

0,1
avg_scores,18.91089
regret,115023.75663


[34m[1mwandb[0m: Agent Starting Run: k33nmqjf with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 7.1631076627772e-05
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19551583568516775, max=1.…

0,1
avg_scores,▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▅▆▆▆▆▆▇▇██
regret,▁

0,1
avg_scores,65.40594
regret,131209.47481


[34m[1mwandb[0m: Agent Starting Run: 92epeuin with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0002597581196031832
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19536268212439292, max=1.…

0,1
avg_scores,▁▂▃▃▄▃▃▄▄▄▄▃▄▄▄▅▅▅▆▆▆▆▇▇██▇▇▇▇▇▇▇▇▇▇▆▆▇█
regret,▁

0,1
avg_scores,44.9802
regret,131432.04179


[34m[1mwandb[0m: Agent Starting Run: gdg3u053 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.003171954554562372
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▆▇▇███████
regret,▁

0,1
avg_scores,201.94059
regret,117284.74146


[34m[1mwandb[0m: Agent Starting Run: ofjvnot0 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.008513769488450626
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▅▄▃▅▆█▇▆▅▅▅▄▄▄▄▃▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139032.25676


[34m[1mwandb[0m: Agent Starting Run: n7x6rj2i with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.003522469290533893
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▇▆▅▄▄▃▃▂▂▂▂▃▂▂▂▃▄▄▄▄▅▅▅▅▄▅▅▅▄▃▃▃▂▂▁▁▁▁
regret,▁

0,1
avg_scores,15.60396
regret,136697.06668


[34m[1mwandb[0m: Agent Starting Run: i969qww2 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.004681626731739174
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19542391474690488, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▄▅▅▅▆▆▆▆▆▇▇▇███
regret,▁

0,1
avg_scores,489.55446
regret,79982.58607


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: w6qidthq with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.00779078766319016
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▅▆█▆▅▄▄▃▃▃▃▃▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.53465
regret,139141.55463


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: lqj0flr6 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.008836955311232296
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▄▃▂▂▂▂▂▃▄▄▅▅▅▅▅▅▅▅▅▅▅▃▃▂▂▁▁▁▁▁▁▁▁▁▁▂▂▂▂
regret,▁

0,1
avg_scores,13.53465
regret,137897.39261


[34m[1mwandb[0m: Agent Starting Run: 7f9pf5ik with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.006575798245123899
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01128888888876342, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19532842138266185, max=1.…

0,1
avg_scores,█▅▄▃▃▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.40594
regret,139335.83464


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: f2opgcdw with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0013788696242795883
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▄▄▄▄▄▅▅▅▆▆▆▇██
regret,▁

0,1
avg_scores,101.53465
regret,129088.70338


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: t682jaf3 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0030339333309635777
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19536268212439292, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▄▄▅▅▅▆▆▇▇█
regret,▁

0,1
avg_scores,352.92079
regret,110122.9752


[34m[1mwandb[0m: Agent Starting Run: 3zyoz8yy with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.004741721330174519
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19536268212439292, max=1.…

0,1
avg_scores,▁▁▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▄▅▆▆▆▆▆▆▇█
regret,▁

0,1
avg_scores,184.64356
regret,118777.24242


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: b0yljltt with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.000919709455346917
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19542391474690488, max=1.…

0,1
avg_scores,▁▁▁▁▃▃▄▄▅▆▅▆▆▆▆▆▆▆▇▇▇▇▇▆▆▆▆▇▇▇████▇▇▇███
regret,▁

0,1
avg_scores,50.28713
regret,130041.11082


[34m[1mwandb[0m: Agent Starting Run: y94p8xi7 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.004839630015987159
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19548518576579402, max=1.…

0,1
avg_scores,▃▃▄▅▆▅▅▆▆▇██▇▇▇▇▇▆▆▆▆▅▅▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,137906.60303


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: p2xa5cjt with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.003786857851955396
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19548518576579402, max=1.…

0,1
avg_scores,▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▅▆▆▆▇▇▇█████
regret,▁

0,1
avg_scores,73.55446
regret,130164.38605


[34m[1mwandb[0m: Agent Starting Run: 6i41xhuv with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.009389097693880816
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▂▂▂▄▅▅▅▆▆▇██
regret,▁

0,1
avg_scores,29.25743
regret,138385.57499


[34m[1mwandb[0m: Agent Starting Run: ajl6c4rz with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.007903368219392607
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19536268212439292, max=1.…

0,1
avg_scores,▁▁▁▂▂▂▃▃▃▂▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▅▅▆▆▆▆▅▅▅▅▆▇█
regret,▁

0,1
avg_scores,159.66337
regret,121675.03086


[34m[1mwandb[0m: Agent Starting Run: yr78j3hf with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0030062807077985447
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▄▄▅▅▅▅▆▇▇██████
regret,▁

0,1
avg_scores,214.25743
regret,115689.31239


[34m[1mwandb[0m: Agent Starting Run: 8rghn068 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.004739677436157908
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▇▅█▅▄▃▂▂▂▂▂▄▄▄▅▄▄▄▄▄▄▄▄▄▃▂▂▁▁▁▁▁▂▂▂▂▂▂▂▂
regret,▁

0,1
avg_scores,13.07921
regret,138317.37808


[34m[1mwandb[0m: Agent Starting Run: adj3vrq2 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.007417038818106106
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,██▅▅▅▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁▁▁▁▂▂▁▁▂▂▂▂▂▂▂▁▁▁▁
regret,▁

0,1
avg_scores,9.34653
regret,139603.71267


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: tmr3de74 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.003746706673682269
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.20077282241184993, max=1.…

0,1
avg_scores,▇▆▅▆▇▇▇▇▇▇▇▇█▇▇▇▆▆▅▄▅▄▃▃▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,11.25743
regret,137290.84578


[34m[1mwandb[0m: Agent Starting Run: 9imqyibk with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0011330587669012148
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01128888888876342, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19536268212439292, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▅▆▆▆▇▇██
regret,▁

0,1
avg_scores,141.0495
regret,126530.55738


[34m[1mwandb[0m: Agent Starting Run: obvczilk with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.00759329684051943
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▆▄▄▆█▇▆▆▅▅▅▄▄▄▄▃▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,138741.58064


[34m[1mwandb[0m: Agent Starting Run: g85xeoij with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.006283769234026571
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▅█▅▄▃▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.41584
regret,139500.61197


[34m[1mwandb[0m: Agent Starting Run: erbx7gy0 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0006658688951944023
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▃▂▁▁▁▂▂▂▂▂▂▂▃▃▃▃▃▄▄▅▅▆▇▇████████▇▆▆▄▄▅▅▅
regret,▁

0,1
avg_scores,36.9604
regret,131579.19776


[34m[1mwandb[0m: Agent Starting Run: wtbwhb3n with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0020751997071077988
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▂▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▄▄▅▅▆▆▇▇█
regret,▁

0,1
avg_scores,232.80198
regret,120902.42449


[34m[1mwandb[0m: Agent Starting Run: bq0knv94 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0050415070479704885
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01128888888876342, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.19523660294578501, max=1.…

0,1
avg_scores,▁▁▁▁▁▁▂▂▂▂▂▃▃▃▃▄▄▄▄▄▄▅▅▅▅▆▆▆▆▆▆▆▇▇███▇▇▆
regret,▁

0,1
avg_scores,188.93069
regret,105835.51183


[34m[1mwandb[0m: Agent Starting Run: c6fira7q with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.003185724000308891
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▇█▆▆▅▅▄▅▄▄▃▃▃▂▁▁▁▁▁▂▂▂▂▃▃▃▄▄▄▄▅▅▄▄▃▃▂▂▂
regret,▁

0,1
avg_scores,21.22772
regret,134773.13576


[34m[1mwandb[0m: Agent Starting Run: bzg75vu1 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0008278717367335692
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.11909999999997024, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.20070819249959762, max=1.…

0,1
avg_scores,▁▁▂▁▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▇▇▇▇▇▇██
regret,▁

0,1
avg_scores,56.57426
regret,131512.62989


[34m[1mwandb[0m: Agent Starting Run: u8hw0h8l with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.00669912420181783
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▇▅▄▄▃▃▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139053.30654


[34m[1mwandb[0m: Agent Starting Run: df4e2adz with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.006422815757146013
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▃▃▃▃▃▄▄▄▄▄▅▅▆▆▆▇▇██
regret,▁

0,1
avg_scores,110.72277
regret,126472.30778


[34m[1mwandb[0m: Agent Starting Run: mzwle9sg with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.007535006652382876
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▄▄▄▄▄▄▃▃▃▃▄▄▅▅▆▇▇█
regret,▁

0,1
avg_scores,324.07921
regret,102954.33722


[34m[1mwandb[0m: Agent Starting Run: 44qe3rr7 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.002814802292833221
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▃▂▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▃▃▃▃▄▄▅▅▆▆▆▆▆▆▆▇▇▇█████
regret,▁

0,1
avg_scores,34.0198
regret,135998.53285


[34m[1mwandb[0m: Agent Starting Run: knz0xl2a with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.007139138383232071
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▄▂▂▂▂▂▂▂▃▄▄▃▃▃▃▃▃▃▃▃▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂
regret,▁

0,1
avg_scores,10.0495
regret,139233.1183


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: t41gx7st with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0031545572026709288
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▃▅▁▁▂▂▃▅▆▆▆▆▅▅▅▅▅▅▄▃▃▂▁▁▁▁▁▁▂▄▅▆▆▇██████
regret,▁

0,1
avg_scores,33.22772
regret,134694.79986


[34m[1mwandb[0m: Agent Starting Run: fu48ja7i with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.008498952480262677
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▄▄▅▅▆▆▇▇█████▇▇▇▇▇▇▇▇▇▇▇▇
regret,▁

0,1
avg_scores,186.18812
regret,104845.15538


[34m[1mwandb[0m: Agent Starting Run: 9nuqhh38 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.006427903064510916
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▃▃▂▁▁▁▁▁▁▁▂▃▃▃▃▃▃▃▃▃▃▃▃▄▅▅▅▅▆▆▇█████▇▆▅▅
regret,▁

0,1
avg_scores,20.19802
regret,137322.22693


[34m[1mwandb[0m: Agent Starting Run: uecutpg4 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0017429038712935413
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.48515
regret,139465.95072


[34m[1mwandb[0m: Agent Starting Run: c9pg46uk with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.009336110792294593
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011633333333399302, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▇█▇▅▄▃▃▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.62376
regret,139507.30201


[34m[1mwandb[0m: Agent Starting Run: vgqu8q5r with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.004253333416490272
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▆▄▃▃▃▃▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139581.33221


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: ldyw1ez0 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0026122008710127
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▄▄▄▄▅▅▅▅▆▆▇▇▇▇▆▆▇▇██████
regret,▁

0,1
avg_scores,125.9604
regret,119175.75485


[34m[1mwandb[0m: Agent Starting Run: wf4cf85d with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.004176728563383955
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▃▄▅▄▄▄▄▃▃▃▃▂▂▂▂▂▂▁▁▁▁▁▁▂▂▂▂▃▄▄▄▅▆▇▇▇▇▇██
regret,▁

0,1
avg_scores,31.91089
regret,137177.9663


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 7yudh2s9 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.009877361962265511
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▄▄▄▅▅▆▆▇▇▇█████▇▇▇▆▆
regret,▁

0,1
avg_scores,334.9901
regret,82249.90888


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: zwdfbs3d with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.00900330013316739
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▅▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139401.20903


[34m[1mwandb[0m: Agent Starting Run: ze36uw9v with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.004996411861170479
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01128888888876342, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▃▃▃▄▄▄▆▇▇▇████▇▇████
regret,▁

0,1
avg_scores,168.62376
regret,118862.10346


[34m[1mwandb[0m: Agent Starting Run: fixrdwfg with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.003432528916671453
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▄█▅▄▃▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139391.438


[34m[1mwandb[0m: Agent Starting Run: 6r2nwq4j with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0018016185165038849
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▄▄▄▄▄▄▅▅▅▆▆▇▇█
regret,▁

0,1
avg_scores,118.82178
regret,128653.08637


[34m[1mwandb[0m: Agent Starting Run: t633nvbk with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.004241454110353238
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▃▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂
regret,▁

0,1
avg_scores,10.79208
regret,139361.80904


[34m[1mwandb[0m: Agent Starting Run: nwjvzhum with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.007640064524443215
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▄▃▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139309.07919


[34m[1mwandb[0m: Agent Starting Run: rfvbz1u5 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0062212974865677685
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▅▅▅▆▆▆▇▇▇▇█
regret,▁

0,1
avg_scores,315.75248
regret,110871.03898


[34m[1mwandb[0m: Agent Starting Run: sjdp4of6 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.00606988891896528
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▃▃▄▄▅▅▅▆▆▆▇▇▇█████
regret,▁

0,1
avg_scores,484.0396
regret,84655.92339


[34m[1mwandb[0m: Agent Starting Run: xnpydj64 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0034056071568887695
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▇▆▄▅▄▄▄▄▄▄▃▃▃▃▂▂▂▂▂▁▁▁▁▁▂▂▃▃▄▅▅▅▆▆▇▇████
regret,▁

0,1
avg_scores,35.47525
regret,135673.39824


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: arjumyik with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0026082419713485978
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▇▇▅▄▃▃▃▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.33663
regret,139115.57981


[34m[1mwandb[0m: Agent Starting Run: ulq0cfr4 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.007137378037161882
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▆▃▄▃▃▃▃▂▃▂▂▂▂▂▂▂▂▂▆▇▇▇▇▇▇▇▇▇▆▆▆▄▂▁▁▁▁▁▂
regret,▁

0,1
avg_scores,9.39604
regret,139446.00558


[34m[1mwandb[0m: Agent Starting Run: z28owe12 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.007463361963759563
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▄▄▄▅▅▆▆▆▇▇▇▇████
regret,▁

0,1
avg_scores,455.05941
regret,86259.80194


[34m[1mwandb[0m: Agent Starting Run: ynvge107 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.00906246174517457
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▆▆▆▇▇▇▇▇████
regret,▁

0,1
avg_scores,402.87129
regret,88510.28024


[34m[1mwandb[0m: Agent Starting Run: 7b7fkh8r with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.008551770007974947
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▅▅▆▆▇▇██████▇▇▇
regret,▁

0,1
avg_scores,292.24752
regret,100281.86045


[34m[1mwandb[0m: Agent Starting Run: f5puneeh with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.005693669628573834
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▄▅▆▆▇▇████████▇▆▆▆▆▆
regret,▁

0,1
avg_scores,145.77228
regret,110118.00293


[34m[1mwandb[0m: Agent Starting Run: 6of5k28o with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.00974514724206544
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▃▃▃▃▃▂▂▂▂▂▂▂▂▂▁▁▁▁▁▂▄▄▄▄▄▄▄▄▄▄▅▅▄▂▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,139536.02464


[34m[1mwandb[0m: Agent Starting Run: mzglyta7 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0033437711711773164
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▅▆▆▇▇█████▇▇▇▆
regret,▁

0,1
avg_scores,172.0198
regret,112903.09709


[34m[1mwandb[0m: Agent Starting Run: 468mxnvy with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0013656910729085898
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▂▁▁▁▁▁▁▁▂▁▁▂▂▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▇██
regret,▁

0,1
avg_scores,76.06931
regret,131234.88576


[34m[1mwandb[0m: Agent Starting Run: s2np35b6 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.008029873151156372
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▂▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▄▄▄▄▄▅▅▅▄▄▄▅▅▅▆▇█
regret,▁

0,1
avg_scores,195.66337
regret,119055.3616


[34m[1mwandb[0m: Agent Starting Run: htz4qabi with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.006979632748816569
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.01127777777777131, max=1.0)…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▃▄▄▅▅▆▆▇█
regret,▁

0,1
avg_scores,15.81188
regret,139378.35374


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: dc297fn8 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.004786569253088788
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▆▅▃▇▆▇▇▇▇███▇▇▇▇▇▇▇██▇▇▆▆▅▅▅▄▄▄▃▂▁▁▁▁▂▂▂
regret,▁

0,1
avg_scores,13.38614
regret,137458.43182


[34m[1mwandb[0m: Agent Starting Run: dn74o83h with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0017294842118254202
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▃▅▅▆▆▆▆▆▆▆▅▅▆▆▆▆▆▆▆▇▇▇████▇▇▇▆▆▆▅▅▄▄▄▄
regret,▁

0,1
avg_scores,27.45545
regret,132694.41169


[34m[1mwandb[0m: Agent Starting Run: s9awy4mn with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.004980542369542667
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▂▁▂▂▂▂▃▃▃▃▃▃▃▃▃▃▃▄▄▄▄▅▅▅▆▇▇██
regret,▁

0,1
avg_scores,370.39604
regret,106356.89319


[34m[1mwandb[0m: Agent Starting Run: us3mf2wz with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0030258795092558805
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▃▄▂▂▂▃▂▁▃▃▃▄▅▅▅▅▅▄▄▄▄▄▃▃▂▂▁▂▄▅▅▆▆▇▇▇████
regret,▁

0,1
avg_scores,32.62376
regret,134516.03236


[34m[1mwandb[0m: Agent Starting Run: 7o0df82i with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0003506621413859092
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▂▃▃▄▃▄▄▄▄▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▆▆▆▆▇▇▇███▇▇
regret,▁

0,1
avg_scores,51.32673
regret,131515.05836


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: n80axlp1 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0069904356010100045
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▆█▆▅▄▃▃▃▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▂▃▃▃▃▃▃▃▃▃▃▂▂▁▁▁▁
regret,▁

0,1
avg_scores,9.45545
regret,138794.124


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: w2hhod4t with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.009285128272273346
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▃▂▃▂▂▂▄█▇▇▇▆▆▆▅▅▅▅▅▄▄▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂
regret,▁

0,1
avg_scores,9.39604
regret,139541.67229


[34m[1mwandb[0m: Agent Starting Run: u0nqn6es with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0019600483935295373
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▅▃▂▃▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.42574
regret,139086.13675


[34m[1mwandb[0m: Agent Starting Run: uy7ariwd with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0026783757040482487
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▄▅▃▂▂▁▁▁▁▁▁▁▁▁▂▂▃▃▃▃▃▄▄▄▅▅▆▆▆▆▆▆▇▇▇▇▇▇██
regret,▁

0,1
avg_scores,32.48515
regret,136240.1706


[34m[1mwandb[0m: Agent Starting Run: e86c6pm4 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0034603138550018133
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▄▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▂▂▃▃▄▅▅▆▆▇▇████▇▇▇▆▆▅
regret,▁

0,1
avg_scores,25.86139
regret,136529.0247


[34m[1mwandb[0m: Agent Starting Run: 3ojr5rjq with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0048165395708397694
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▄▄▅▆▆▆▇▇█
regret,▁

0,1
avg_scores,228.49505
regret,120445.51672


[34m[1mwandb[0m: Agent Starting Run: igbrl6w9 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.00568469379537484
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,██▄▃▃▂▂▂▂▂▃▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.41584
regret,138746.32059


[34m[1mwandb[0m: Agent Starting Run: vqdy6a3x with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.003481121869468777
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▆██▆▅▄▃▃▃▃▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.33663
regret,139123.09973


[34m[1mwandb[0m: Agent Starting Run: gldwwfl9 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.008982364911177591
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▅▆▆▇█▇▇▇▇▇▇▇▇▆▆▆▆▆▇▇▇█
regret,▁

0,1
avg_scores,315.61386
regret,86918.99256


[34m[1mwandb[0m: Agent Starting Run: dn9k1ihp with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0034957405723359384
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▇█
regret,▁

0,1
avg_scores,205.34653
regret,120993.62448


[34m[1mwandb[0m: Agent Starting Run: pgz2lhad with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0044982127559935695
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▇█▅▄▃▃▃▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.46535
regret,139154.10509


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: hkqempnu with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.008515195907606127
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▆▄▅▆█▇▆▅▅▄▄▄▄▃▃▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.32673
regret,138919.00059


[34m[1mwandb[0m: Agent Starting Run: aijdq61t with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0067967740519313145
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,█▇█▅▄▃▃▃▃▃▃▃▃▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂
regret,▁

0,1
avg_scores,9.39604
regret,139583.46817


[34m[1mwandb[0m: Agent Starting Run: xqbr4uwr with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.0036647695854949854
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▃▃▃▄▄▅▅▆▆▆▇▇▇▇▇▇██
regret,▁

0,1
avg_scores,273.0495
regret,112424.99706


[34m[1mwandb[0m: Agent Starting Run: acvd5o8y with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.0070603592901344
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▃▄▄▅▆▆▆▆▇▇▇███▇▇▇▆▆▇▇█
regret,▁

0,1
avg_scores,300.33663
regret,97373.0324


[34m[1mwandb[0m: Agent Starting Run: p3vsif2w with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.001653500758197926
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▅▅▆▇██
regret,▁

0,1
avg_scores,168.92079
regret,125793.24689


[34m[1mwandb[0m: Agent Starting Run: 6vi01j35 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.009833361310456914
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.006 MB uploaded\r'), FloatProgress(value=0.1953932936383579, max=1.0…

0,1
avg_scores,▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▃▃▄▄▅▆▆▇▇▇▇████▇▇▇▆▆
regret,▁

0,1
avg_scores,293.44554
regret,88419.32559


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: lh6nzzuw with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.00159652393250352
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▆▆▆▆▆▆▇▇███
regret,▁

0,1
avg_scores,232.78218
regret,112041.73073


[34m[1mwandb[0m: Agent Starting Run: f2upf915 with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.003828068238656216
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.001 MB uploaded\r'), FloatProgress(value=0.0, max=1.0)))

0,1
avg_scores,▄▃▃▅▅▄▄▃▃▂▂▂▂▂▂▂▁▁▁▁▂▂▃▄▅▅▅▆▇▇▇▇██▇▇▇▇██
regret,▁

0,1
avg_scores,38.33663
regret,134987.08549


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: no4wnr75 with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.0050856466460309935
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▃▃▃▃▃▄▄▄▄▄▅▆▆▆▆▆▇▇█████▇▇▆▇▆▆▆▆▅▅▄▄▄▄▄▄
regret,▁

0,1
avg_scores,59.12871
regret,120109.18578


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: r6jwyv7y with config:
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 0.002067258743167658
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▂▂▂▂▂▃▃▃▃▄▄▄▅▅▅▆▆▆▆▆▆▆▇▇▇▇█████████
regret,▁

0,1
avg_scores,203.27723
regret,104863.83112


[34m[1mwandb[0m: Agent Starting Run: bi8mb2n8 with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.004619813696065738
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011288888888925108, max=1.0…

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▄▄▅▅▅▆▇▇▇██████▇▇▆▆▅▅
regret,▁

0,1
avg_scores,122.74257
regret,111707.68302


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: gov44dkl with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.006116244251641901
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,██▅▅▄▄▃▃▃▃▃▃▃▃▃▃▃▂▃▃▃▃▃▃▄▃▃▃▃▃▃▃▂▂▂▂▂▁▁▁
regret,▁

0,1
avg_scores,12.50495
regret,136927.20787


[34m[1mwandb[0m: Agent Starting Run: 9qhbqavy with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0075276242153169744
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▄▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139525.47222


[34m[1mwandb[0m: Agent Starting Run: vjd82nir with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.0012375533340293428
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▆▂▁▁▂▂▃▂▂▁▁▁▃▃▃▃▃▃▃▃▄▆▇▇▇▇▅▅▅▅▅▄▄▃▁▁▂▃▄
regret,▁

0,1
avg_scores,29.78218
regret,133838.91081


[34m[1mwandb[0m: Agent Starting Run: 4ql931gb with config:
[34m[1mwandb[0m: 	hidden_dim: 32
[34m[1mwandb[0m: 	learning_rate: 0.009484419641999654
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▆▄▅█▆▅▅▄▄▃▃▃▃▃▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139223.18885


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: uwuueivg with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.00986353765013437
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▅▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139519.12518


[34m[1mwandb[0m: Agent Starting Run: pq7p0y5v with config:
[34m[1mwandb[0m: 	hidden_dim: 128
[34m[1mwandb[0m: 	learning_rate: 0.008817995611176228
[34m[1mwandb[0m: 	optimizer_type: sgd
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011111111111111112, max=1.0…

VBox(children=(Label(value='0.000 MB of 0.000 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,█▄▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
regret,▁

0,1
avg_scores,9.39604
regret,139427.41647


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: r70y311q with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.006504200179722873
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
avg_scores,▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▃▃▄▄▄▅▅▆▆▆▅▅▅▅▅▄▅▅▆▆▆▇▇█
regret,▁

0,1
avg_scores,275.61386
regret,105417.20012


[34m[1mwandb[0m: Agent Starting Run: d7t0y9n8 with config:
[34m[1mwandb[0m: 	hidden_dim: 64
[34m[1mwandb[0m: 	learning_rate: 0.002515896865860069
[34m[1mwandb[0m: 	optimizer_type: adam
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
