# Imports and Colab Mount

In [1]:
import datetime
import seaborn as sn
import pandas as pd
import numpy as np
import matplotlib as mpl
import matplotlib.pyplot as plt
import scipy.stats as stats
import glob
from math import sqrt

from sklearn.preprocessing import StandardScaler, MinMaxScaler

import keras
from tensorflow.keras.optimizers import Adam
from keras.layers import Dense, LSTM, LeakyReLU, Dropout, GRU, SimpleRNN, Input, LSTM, Dense, Bidirectional, Concatenate, Reshape, Lambda, Bidirectional
from keras.models import Model, Sequential
from keras import backend as K
from tensorflow.keras import layers
from keras.callbacks import Callback, ReduceLROnPlateau, EarlyStopping
from sklearn.metrics import mean_squared_error, mean_absolute_error, mean_absolute_percentage_error
from sklearn.model_selection import train_test_split
import seaborn as sns

from numpy.random import seed
#from tensorflow import set_random_seed

%matplotlib inline

In [2]:
from google.colab import drive

drive.mount('/content/drive')

Mounted at /content/drive


# Load Data

In [3]:
train_h = pd.read_csv("/content/drive/MyDrive/Datasets/solar_train.csv", index_col=0, parse_dates=True)
valid_h = pd.read_csv("/content/drive/MyDrive/Datasets/solar_valid.csv", index_col=0, parse_dates=True)
test_h = pd.read_csv("/content/drive/MyDrive/Datasets/solar_test.csv", index_col=0, parse_dates=True)
hourly = pd.read_csv("/content/drive/MyDrive/Datasets/solar_all.csv", index_col=0, parse_dates=True)

resid_train = pd.read_csv("/content/drive/MyDrive/Datasets/resid_train.csv").drop("Unnamed: 0", axis=1)
resid_test = pd.read_csv("/content/drive/MyDrive/Datasets/resid_test.csv").drop("Unnamed: 0", axis=1)

In [4]:
def series_to_supervised(data, n_in=1, n_out=1, dropnan=True):
	n_vars = 1 if type(data) is list else data.shape[1]
	df = pd.DataFrame(data)
	cols, names = list(), list()
	# input sequence (t-n, ... t-1)
	for i in range(n_in, 0, -1):
		cols.append(df.shift(i))
		names += [('var%d(t-%d)' % (j+1, i)) for j in range(n_vars)]
	# forecast sequence (t, t+1, ... t+n)
	for i in range(0, n_out):
		cols.append(df.shift(-i))
		if i == 0:
			names += [('var%d(t)' % (j+1)) for j in range(n_vars)]
		else:
			names += [('var%d(t+%d)' % (j+1, i)) for j in range(n_vars)]
	# put it all together
	agg = pd.concat(cols, axis=1)
	agg.columns = names
	# drop rows with NaN values
	if dropnan:
		agg.dropna(inplace=True)
	return agg

In [5]:
def make_data(data, timestep, resid_check=False):
  values = data.values
  values = values.astype('float32')
  #scaler = MinMaxScaler(feature_range=(0, 1))
  #scaled = scaler.fit_transform(values)
  
  timestep = timestep
  n_features = 39
  n_obs = timestep * n_features
  reframed = series_to_supervised(values, timestep, 1)
  reframed = reframed.iloc[: , :-38]

  values = reframed.values
  indice1 = train_h.shape[0]
  indice2 = valid_h.shape[0]

  train = values[:indice1, :]
  valid = values[indice1:indice1+indice2, :]
  test = values[indice1+indice2:, :]

  train_X, train_y = train[:, :-1], train[:, -1]
  valid_X, valid_y = valid[:, :-1], valid[:, -1]
  test_X, test_y = test[:, :-1], test[:, -1]

  if (resid_check==True):
    train_y = resid_train.values[:2184]
    valid_y = resid_train.values[2184:]

  scaler = MinMaxScaler(feature_range=(0, 1)).fit(train_X)
  train_X = scaler.transform(train_X)
  valid_X = scaler.transform(valid_X)
  test_X = scaler.transform(test_X)

  scaler_y = MinMaxScaler(feature_range=(0, 1)).fit(train_y.reshape(-1,1))
  train_y = scaler_y.transform(train_y.reshape(-1,1))
  valid_y = scaler_y.transform(valid_y.reshape(-1,1))
  test_y = scaler_y.transform(test_y.reshape(-1,1))

  train_X = train_X.reshape((train_X.shape[0], timestep, n_features))
  valid_X = valid_X.reshape((valid_X.shape[0], timestep, n_features))
  test_X = test_X.reshape((test_X.shape[0], timestep, n_features))
  return train_X, train_y, valid_X, valid_y, test_X, test_y

In [6]:
def make_data2(data, timestep, resid_check=False):
  values = data.values
  values = values.astype('float32')
  #scaler = MinMaxScaler(feature_range=(0, 1))
  #scaled = scaler.fit_transform(values)
  
  timestep = timestep
  n_features = 39
  n_obs = timestep * n_features
  reframed = series_to_supervised(values, timestep, 1)
  reframed = reframed.iloc[: , :-38]

  values = reframed.values
  indice1 = train_h.shape[0]
  indice2 = valid_h.shape[0]

  train = values[:indice1, :]
  valid = values[indice1:indice1+indice2, :]
  test = values[indice1+indice2:, :]

  train_X, train_y = train[:, :-1], train[:, -1]
  valid_X, valid_y = valid[:, :-1], valid[:, -1]
  test_X, test_y = test[:, :-1], test[:, -1]

  if (resid_check==True):
    train_y = resid_train.values[:2184]
    valid_y = resid_train.values[2184:]

  scaler = MinMaxScaler(feature_range=(0, 1)).fit(train_X)
  train_X = scaler.transform(train_X)
  valid_X = scaler.transform(valid_X)
  test_X = scaler.transform(test_X)

  scaler_y = MinMaxScaler(feature_range=(0, 1)).fit(train_y.reshape(-1,1))
  train_y = scaler_y.transform(train_y.reshape(-1,1))
  valid_y = scaler_y.transform(valid_y.reshape(-1,1))
  test_y = scaler_y.transform(test_y.reshape(-1,1))

  train_X = train_X.reshape((train_X.shape[0], timestep, n_features))
  valid_X = valid_X.reshape((valid_X.shape[0], timestep, n_features))
  test_X = test_X.reshape((test_X.shape[0], timestep, n_features))
  return train_X, train_y, valid_X, valid_y, test_X, test_y, scaler, scaler_y

# WanDB

In [7]:
!pip install wandb -qq
import wandb
from wandb.keras import WandbCallback
!wandb login

[K     |████████████████████████████████| 1.8 MB 7.7 MB/s 
[K     |████████████████████████████████| 181 kB 45.5 MB/s 
[K     |████████████████████████████████| 144 kB 48.4 MB/s 
[K     |████████████████████████████████| 63 kB 1.6 MB/s 
[?25h  Building wheel for pathtools (setup.py) ... [?25l[?25hdone
[34m[1mwandb[0m: You can find your API key in your browser here: https://wandb.ai/authorize
[34m[1mwandb[0m: Paste an API key from your profile and hit enter, or press ctrl+c to quit: 
[34m[1mwandb[0m: Appending key for api.wandb.ai to your netrc file: /root/.netrc


# Train

# RNN

In [None]:
# Configure the sweep – specify the parameters to search through, the search strategy, the optimization metric et all.
sweep_config = {
    'name': 'RNN',
    'method': 'bayes', #grid, random
    'metric': {
      'name': 'best_val_loss',
      'goal': 'minimize'   
    },
    'parameters': {
        'batch_size': {
            'values': [256, 128, 64, 32]
        },
        'dropout': {
            'values': [0, 0.1, 0.3]
        },
        'units': {
            'values': [64, 128, 256]
        },
        'timestep': {
            'values': [3, 6, 12, 24]
        },
        'lr': {
            'values': [1e-2, 1e-1]
        },
        'layers': {
            'values': [1, 2, 4, 8]
        },
        
    }
}

In [None]:
sweep_id = wandb.sweep(sweep_config, entity="ancy", project="DF1_RESIDUAL_RNN")

Create sweep with ID: lklcsig0
Sweep URL: https://wandb.ai/ancy/DF1_SIMPLE_RNN/sweeps/lklcsig0


In [None]:
def create_rnn():
    config_defaults = {
    'batch_size': 128,
    'lr': 1e-3,
    'units': 64,
    'timestep': 3,
    'dropout': 0.3,
    'layers': 1,
    }

    wandb.init(config=config_defaults)
    config = wandb.config

    batch_size = config.batch_size
    lr         = config.lr
    num_units  = config.units
    timestep   = config.timestep
    dropout    = config.dropout
    layers     = config.layers

    train_X, train_y, valid_X, valid_y, test_X, test_y = make_data(hourly, timestep, resid_check=True)
    model = Sequential()

    if layers > 1:
      model.add(SimpleRNN(units = num_units, input_shape=(train_X.shape[1], train_X.shape[2]), dropout=dropout, return_sequences=True))

      for i in range(layers-2):
        model.add(SimpleRNN(units = num_units, dropout=dropout, return_sequences=True))

      model.add(SimpleRNN(units = num_units, dropout=dropout))

    else:
      model.add(SimpleRNN(units = num_units, input_shape=(train_X.shape[1], train_X.shape[2]), dropout=dropout))

    model.add(Dense(units = 1))

    model.compile(
        loss="mse",
        optimizer=Adam(learning_rate=lr)
    )

    model.fit(train_X, train_y, batch_size=batch_size,
              epochs=200, verbose=0, shuffle=False,
              validation_data=(valid_X, valid_y),
              callbacks=[WandbCallback(),
                          EarlyStopping(patience=10, restore_best_weights=True)])

    return model

In [None]:
wandb.agent(sweep_id, create_rnn, count=50)

[34m[1mwandb[0m: Agent Starting Run: tkzalzmc with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 128
[34m[1mwandb[0m: Currently logged in as: [33mancy[0m (use `wandb login --relogin` to force relogin)





VBox(children=(Label(value='0.667 MB of 0.667 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▁▄▅▂▁▂▅██▄▂▂▂▂▂

0,1
best_epoch,4.0
best_val_loss,0.00777
epoch,14.0
loss,0.00823
val_loss,0.00952


[34m[1mwandb[0m: Agent Starting Run: bvge0973 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='0.424 MB of 0.424 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▃▄▄▅▅▆▆▆▇▇██
loss,█▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,7.0
best_val_loss,0.00773
epoch,17.0
loss,0.00742
val_loss,0.00776


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 97p0yvxg with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='0.299 MB of 0.299 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▄▄▅▅▅▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▃▁▂▂▁▁▁▂▂▁▁▁▁▁▁▁

0,1
best_epoch,6.0
best_val_loss,0.00774
epoch,16.0
loss,0.0065
val_loss,0.00825


[34m[1mwandb[0m: Agent Starting Run: se0aanlu with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='0.276 MB of 0.276 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,19.0
best_val_loss,0.00781
epoch,29.0
loss,0.00598
val_loss,0.00978


[34m[1mwandb[0m: Agent Starting Run: 69dygjji with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='0.854 MB of 0.854 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▄▄▅▅▅▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,6.0
best_val_loss,0.00994
epoch,16.0
loss,0.00745
val_loss,0.01647


[34m[1mwandb[0m: Agent Starting Run: ftyjzjfw with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='0.900 MB of 0.900 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▁▁▁▁▁▁▂▃▄█▃▂▂▄▇

0,1
best_epoch,4.0
best_val_loss,0.00787
epoch,14.0
loss,0.02478
val_loss,0.02816


[34m[1mwandb[0m: Agent Starting Run: fjy0z9i1 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='2.998 MB of 2.998 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▄▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,19.0
best_val_loss,0.00773
epoch,29.0
loss,0.00728
val_loss,0.00973


[34m[1mwandb[0m: Agent Starting Run: pilctco5 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='0.854 MB of 0.854 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▃▄▄▅▅▅▆▆▆▇▇██
loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▂▅▂▁▂▂▁▁▁▁▁▁▁▁▁▂▂▂

0,1
best_epoch,8.0
best_val_loss,0.00774
epoch,18.0
loss,0.02361
val_loss,0.02159


[34m[1mwandb[0m: Agent Starting Run: tfy0xe64 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='0.854 MB of 0.854 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▄▄▅▅▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▁▁█▃▁▁▁▂▂▂▂▂▂▂▂▂

0,1
best_epoch,5.0
best_val_loss,0.00773
epoch,15.0
loss,0.00851
val_loss,0.009


[34m[1mwandb[0m: Agent Starting Run: 8ymg6epu with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='5.444 MB of 5.444 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▃▄▄▅▅▅▆▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▂▁▂▁▂▁▂▁▂
val_loss,▃▁▂▁▄▂▆▁▁▄▁▄▂▇█▇▁▇▁

0,1
best_epoch,8.0
best_val_loss,0.00778
epoch,18.0
loss,0.63328
val_loss,0.01449


[34m[1mwandb[0m: Agent Starting Run: waiomx1z with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='2.998 MB of 2.998 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▅▅▆▆▇▇█
loss,█▄▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▃▁▂▂▂▁▁▁▁▁▂▂

0,1
best_epoch,2.0
best_val_loss,0.00774
epoch,12.0
loss,0.03015
val_loss,0.15923


[34m[1mwandb[0m: Agent Starting Run: ua7bjrjg with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='0.667 MB of 0.667 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▁▄▂▁▃▇█▄▂▁▂▁▁▂

0,1
best_epoch,3.0
best_val_loss,0.00773
epoch,13.0
loss,0.0085
val_loss,0.00895


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: fh4oqdfx with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='1.441 MB of 1.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▅▅▆▆▇▇█
loss,█▂▂▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,2.0
best_val_loss,0.00929
epoch,12.0
loss,0.00698
val_loss,0.01045


[34m[1mwandb[0m: Agent Starting Run: 4qq5h5tn with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='2.998 MB of 2.998 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,14.0
best_val_loss,0.00773
epoch,24.0
loss,0.01233
val_loss,0.01039


[34m[1mwandb[0m: Agent Starting Run: 2z6olq04 with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='2.998 MB of 2.998 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▇▂▁▁▁▁▁▃██▂▃▃

0,1
best_epoch,3.0
best_val_loss,0.00837
epoch,13.0
loss,0.07347
val_loss,0.0784


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: rt8fpxzv with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='0.854 MB of 0.854 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▃▄▄▅▅▆▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▃▃

0,1
best_epoch,7.0
best_val_loss,0.00781
epoch,17.0
loss,0.01401
val_loss,0.02114


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: l4x01g8m with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.417 MB of 2.417 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▄▄▅▅▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂
val_loss,▁▁▁▁▁▁▃▁▃▄▁▃█▄▄▁

0,1
best_epoch,5.0
best_val_loss,0.01284
epoch,15.0
loss,0.90277
val_loss,0.0373


[34m[1mwandb[0m: Agent Starting Run: pnc593t5 with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='5.444 MB of 5.444 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃▁▂▃▁▁▁▁▁▂▂▃▄▂▁▁▁▁▁▁▁▁▂▃▄▄▆▇▇█

0,1
best_epoch,19.0
best_val_loss,0.00783
epoch,29.0
loss,0.02377
val_loss,0.04273


[34m[1mwandb[0m: Agent Starting Run: fuql7dwu with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='1.441 MB of 1.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃▄▁▆█▃▁▁▁▁▂▂▃

0,1
best_epoch,2.0
best_val_loss,0.0079
epoch,12.0
loss,0.00979
val_loss,0.0118


[34m[1mwandb[0m: Agent Starting Run: 6cut08cu with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='5.444 MB of 5.444 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▃▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃▂▁▅▃▁▁▁▁▂▃▄▆▅▃▁▁▁▁▁▁▁▂▃▄▆█

0,1
best_epoch,16.0
best_val_loss,0.00773
epoch,26.0
loss,0.02237
val_loss,0.02718


[34m[1mwandb[0m: Agent Starting Run: s6dvrsxh with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='2.998 MB of 2.998 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▄▅▅▆▆▇▇█
loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▃▁▁▁▁▁▄▆▂▂▃▅

0,1
best_epoch,3.0
best_val_loss,0.00948
epoch,13.0
loss,0.10764
val_loss,0.18377


[34m[1mwandb[0m: Agent Starting Run: qbqki3zi with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='0.854 MB of 0.854 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▄█▁▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▁▁▁▁

0,1
best_epoch,14.0
best_val_loss,0.00773
epoch,24.0
loss,0.00686
val_loss,0.00879


[34m[1mwandb[0m: Agent Starting Run: 0nzzav2g with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='0.883 MB of 0.883 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▄▄▅▅▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▁▃▄▂▁▁▂▂▂▂▂▆▆█▃▁

0,1
best_epoch,5.0
best_val_loss,0.00793
epoch,15.0
loss,0.06804
val_loss,0.01061


[34m[1mwandb[0m: Agent Starting Run: 3898zzup with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='1.441 MB of 1.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▄▄▅▅▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁
val_loss,▁▁▂▁▁▃▁▃▄█▇▇

0,1
best_epoch,1.0
best_val_loss,0.00863
epoch,11.0
loss,0.15066
val_loss,0.43809


[34m[1mwandb[0m: Agent Starting Run: 91dyrynf with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='2.998 MB of 2.998 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▁▁▁▁▁▁▂▂▃▃▂▂▂

0,1
best_epoch,4.0
best_val_loss,0.00773
epoch,14.0
loss,0.00859
val_loss,0.0156


[34m[1mwandb[0m: Agent Starting Run: cx5rrs1x with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='1.441 MB of 1.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃▅▁▁▆█▆▂▁▁▁▁▁▁▂▂▃▄▄▄▅▅▆

0,1
best_epoch,12.0
best_val_loss,0.00799
epoch,22.0
loss,0.01289
val_loss,0.01656


[34m[1mwandb[0m: Agent Starting Run: sood6bqk with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='2.998 MB of 2.998 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂█▂▁

0,1
best_epoch,20.0
best_val_loss,0.00774
epoch,30.0
loss,0.12597
val_loss,0.06336


[34m[1mwandb[0m: Agent Starting Run: i8n6420f with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='0.667 MB of 0.667 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▄▅▅▆▇▇█
loss,█▁▁▁▁▁▁▁▁▂▁
val_loss,▁▁▂▁▂▃▃▅▆█▇

0,1
best_epoch,0.0
best_val_loss,0.01675
epoch,10.0
loss,0.13089
val_loss,0.42915


[34m[1mwandb[0m: Agent Starting Run: 6qumzb6n with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='5.444 MB of 5.444 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▂▂▁▁▁▂▃▃▂▁▁▁▁▁▁▂▂▃▃▄▅▅▅█

0,1
best_epoch,14.0
best_val_loss,0.00776
epoch,24.0
loss,0.02212
val_loss,0.04253


[34m[1mwandb[0m: Agent Starting Run: 0esiw4qb with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.417 MB of 2.417 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▃▃▃▄▄▅▅▅▆▆▆▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▁▂▂▁▁▁▁▁▂▁▂▃▆█▄▂▂▁▂▁

0,1
best_epoch,10.0
best_val_loss,0.00789
epoch,20.0
loss,0.02181
val_loss,0.00849


[34m[1mwandb[0m: Agent Starting Run: ha4vto71 with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='0.667 MB of 0.667 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▃▃▃▄▄▄▅▅▅▆▆▆▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▄▅▁▁▅█▇▂▁▁▁▁▁▁▂▃▃▄▄▃▂▄

0,1
best_epoch,11.0
best_val_loss,0.00791
epoch,21.0
loss,0.01169
val_loss,0.01176


[34m[1mwandb[0m: Agent Starting Run: 65mc267j with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.417 MB of 2.417 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▃▃▃▃▄▄▄▅▅▅▆▆▆▆▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▂▂▁▁▂▃▃▄▂▁▁▁▁▁▂▃▅▆▆▆█▇▇

0,1
best_epoch,13.0
best_val_loss,0.00781
epoch,23.0
loss,0.02443
val_loss,0.02974


[34m[1mwandb[0m: Agent Starting Run: 2j3ybf5l with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='5.444 MB of 5.444 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▃▄▄▅▅▆▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃█▄▅▂▁▁▁▂▃▅▇█▆▂▁▁▂

0,1
best_epoch,7.0
best_val_loss,0.00779
epoch,17.0
loss,0.01722
val_loss,0.00888


[34m[1mwandb[0m: Agent Starting Run: qq95zr3p with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='5.444 MB of 5.444 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▄▆▁▄█▄▁▁▁▁▂▃▄

0,1
best_epoch,2.0
best_val_loss,0.00781
epoch,12.0
loss,0.01078
val_loss,0.01288


[34m[1mwandb[0m: Agent Starting Run: 9v28urxv with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.417 MB of 2.417 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▁▂▃▁▁▁▁▁▂▂▃▄▂▁▁▁▁▁▁▁▁▂▃▄▄▅▆▅█

0,1
best_epoch,19.0
best_val_loss,0.00772
epoch,29.0
loss,0.02335
val_loss,0.03983


[34m[1mwandb[0m: Agent Starting Run: 6xmupi6f with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='5.444 MB of 5.444 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃▅▁▄█▃▁▁▁▂▂▄▅

0,1
best_epoch,2.0
best_val_loss,0.00773
epoch,12.0
loss,0.01116
val_loss,0.0135


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: bnmlscfu with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='11.507 MB of 11.507 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▂▂▃▄▄▅▅▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁
val_loss,▅▁▅▆▁▁▁▂▂▄▄█

0,1
best_epoch,1.0
best_val_loss,0.00785
epoch,11.0
loss,0.01355
val_loss,0.02172


[34m[1mwandb[0m: Agent Starting Run: nsemuder with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='5.444 MB of 5.444 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▄▄▅▅▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁
val_loss,▅▁▆▇▁▁▁▂▃▅▆█

0,1
best_epoch,1.0
best_val_loss,0.00774
epoch,11.0
loss,0.01383
val_loss,0.01964


[34m[1mwandb[0m: Agent Starting Run: 8yuy5p4p with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.417 MB of 2.417 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▁▂▃▁▁▁▁▂▂▃▃▂▁▁▁▁▁▁▂▃▄▅▅▆▇█▇

0,1
best_epoch,17.0
best_val_loss,0.00776
epoch,27.0
loss,0.02508
val_loss,0.04526


[34m[1mwandb[0m: Agent Starting Run: mn0rc2kt with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='0.667 MB of 0.667 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▃▂▁▅█▆▂▁▁▁▁▁▁

0,1
best_epoch,3.0
best_val_loss,0.00786
epoch,13.0
loss,0.00869
val_loss,0.00806


[34m[1mwandb[0m: Agent Starting Run: khtjkg59 with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='5.444 MB of 5.444 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▃▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▁▃▁▁▁▁▂▂▃▃▂▁▁▁▁▁▁▁▂▂▃▃▅▅▇█

0,1
best_epoch,16.0
best_val_loss,0.00774
epoch,26.0
loss,0.0228
val_loss,0.04329


[34m[1mwandb[0m: Agent Starting Run: j166u8f7 with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.417 MB of 2.417 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▁▃▅▂▁▃▆█▃▂▁▁▁▁▂

0,1
best_epoch,4.0
best_val_loss,0.00791
epoch,14.0
loss,0.00885
val_loss,0.00901


[34m[1mwandb[0m: Agent Starting Run: x1zl22m5 with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.417 MB of 2.417 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▄▃▇▁▁▄▅▅▆▁▁▁▁▂▂▃▄▆██

0,1
best_epoch,9.0
best_val_loss,0.00786
epoch,19.0
loss,0.01412
val_loss,0.01957


[34m[1mwandb[0m: Agent Starting Run: sgknpoyt with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='5.444 MB of 5.444 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▄▄▅▅▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃▁▆▄▁▁▁▂▄▅█▅

0,1
best_epoch,1.0
best_val_loss,0.00773
epoch,11.0
loss,0.01367
val_loss,0.01553


[34m[1mwandb[0m: Agent Starting Run: asyf1876 with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='1.441 MB of 1.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▃▄▄▅▅▅▆▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▆▁█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,8.0
best_val_loss,0.00797
epoch,18.0
loss,0.00883
val_loss,0.00995


[34m[1mwandb[0m: Agent Starting Run: 8bm3c6vu with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.417 MB of 2.417 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▄▄▅▅▅▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▇▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁█

0,1
best_epoch,6.0
best_val_loss,0.00773
epoch,16.0
loss,0.14921
val_loss,0.34591


[34m[1mwandb[0m: Agent Starting Run: kogwq78w with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='5.444 MB of 5.444 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▄▄▅▅▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▁▆▃▁▁▁▂▃▅█▆

0,1
best_epoch,1.0
best_val_loss,0.00793
epoch,11.0
loss,0.01393
val_loss,0.0179


[34m[1mwandb[0m: Agent Starting Run: 0v6cxvl6 with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='5.444 MB of 5.444 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▄▄▅▅▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁
val_loss,▅▁▄▇▁▁▁▁▂▄▅█

0,1
best_epoch,1.0
best_val_loss,0.00804
epoch,11.0
loss,0.01362
val_loss,0.02033


[34m[1mwandb[0m: Agent Starting Run: up4ze921 with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='0.667 MB of 0.667 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁
val_loss,▁▁▁▁▁▁▁▁▁▁▁█▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,12.0
best_val_loss,0.00795
epoch,22.0
loss,0.01203
val_loss,0.01435


[34m[1mwandb[0m: Agent Starting Run: drbmg5z7 with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.417 MB of 2.417 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▂▁▃▅▆█▇▃▁▁▁▄

0,1
best_epoch,2.0
best_val_loss,0.00775
epoch,12.0
loss,0.01168
val_loss,0.01141


# LSTM

In [None]:
# Configure the sweep – specify the parameters to search through, the search strategy, the optimization metric et all.
sweep_config = {
    'name': 'LSTM',
    'method': 'bayes', #grid, random
    'metric': {
      'name': 'best_val_loss',
      'goal': 'minimize'   
    },
    'parameters': {
        'batch_size': {
            'values': [256, 128, 64, 32]
        },
        'dropout': {
            'values': [0, 0.1, 0.3]
        },
        'units': {
            'values': [64, 128, 256]
        },
        'timestep': {
            'values': [3, 6, 12, 24]
        },
        'lr': {
            'values': [1e-2, 1e-1]
        },
        'layers': {
            'values': [1, 2, 4, 8]
        },
        
    }
}

In [None]:
sweep_id = wandb.sweep(sweep_config, entity="ancy", project="DF1_RESIDUAL_LSTM")

Create sweep with ID: 1u1gxsbe
Sweep URL: https://wandb.ai/ancy/DF1_RESIDUAL_LSTM/sweeps/1u1gxsbe


In [None]:
def create_lstm():
    config_defaults = {
    'batch_size': 128,
    'lr': 1e-3,
    'units': 64,
    'timestep': 3,
    'dropout': 0.3,
    'layers': 1,
    }

    wandb.init(config=config_defaults)
    config = wandb.config

    batch_size = config.batch_size
    lr         = config.lr
    num_units  = config.units
    timestep   = config.timestep
    dropout    = config.dropout
    layers     = config.layers

    train_X, train_y, valid_X, valid_y, test_X, test_y = make_data(hourly, timestep, resid_check=True)
    model = Sequential()

    if layers > 1:
      model.add(LSTM(units = num_units, input_shape=(train_X.shape[1], train_X.shape[2]), dropout=dropout, return_sequences=True))

      for i in range(layers-2):
        model.add(LSTM(units = num_units, dropout=dropout, return_sequences=True))

      model.add(LSTM(units = num_units, dropout=dropout))

    else:
      model.add(LSTM(units = num_units, input_shape=(train_X.shape[1], train_X.shape[2]), dropout=dropout))

    model.add(Dense(units = 1))
    model.compile(
        loss="mse",
        optimizer=Adam(learning_rate=lr)
    )

    model.fit(train_X, train_y, batch_size=batch_size,
              epochs=200, verbose=0, shuffle=False,
              validation_data=(valid_X, valid_y),
              callbacks=[WandbCallback(),
                          EarlyStopping(patience=10, restore_best_weights=True)])

    return model

In [None]:
wandb.agent(sweep_id, create_lstm, count=50)

[34m[1mwandb[0m: Agent Starting Run: id8o6u9s with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='3.501 MB of 3.501 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▄▄▅▅▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▂▂▁▁▂▃▃▁▁▁▁▁▁▁

0,1
best_epoch,5.0
best_val_loss,0.00794
epoch,15.0
loss,0.00885
val_loss,0.00915


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: b6svucul with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='3.501 MB of 3.501 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,12.0
best_val_loss,0.00773
epoch,22.0
loss,0.01794
val_loss,0.00851


[34m[1mwandb[0m: Agent Starting Run: 6406aqud with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='11.639 MB of 11.639 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▂▂▃▃▃▄▄▅▅▅▆▆▆▇▇██
loss,▁█▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▅█▃▄▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,8.0
best_val_loss,0.00773
epoch,18.0
loss,0.00637
val_loss,0.00774


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: j9osw6ue with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▂▂▃▂▃▂▂▂▂▂▂▂▂▁▂▂▂▁▂▁▁▁▁▁▁▂▁▂▁▁

0,1
best_epoch,20.0
best_val_loss,0.00633
epoch,30.0
loss,0.00592
val_loss,0.00671


[34m[1mwandb[0m: Agent Starting Run: km73m19x with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▄▄▅▅▆▇▇█
loss,█▂▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▂▃▃▃▂▃▃▃▃▃

0,1
best_epoch,1.0
best_val_loss,0.00804
epoch,11.0
loss,0.00717
val_loss,0.0091


[34m[1mwandb[0m: Agent Starting Run: u7aj5a35 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='15.237 MB of 15.237 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▂▂▃▃▃▄▄▅▅▆▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,7.0
best_val_loss,0.00777
epoch,17.0
loss,0.00657
val_loss,0.00799


[34m[1mwandb[0m: Agent Starting Run: 5l9m4a00 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='11.639 MB of 11.639 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▆▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▄▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,4.0
best_val_loss,0.00773
epoch,14.0
loss,0.00654
val_loss,0.00779


[34m[1mwandb[0m: Agent Starting Run: 9z1bx4m2 with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▂▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,3.0
best_val_loss,0.00777
epoch,13.0
loss,0.00959
val_loss,0.00779


[34m[1mwandb[0m: Agent Starting Run: 3maa8ltn with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▁▁▁▁▁▂▅▇█▇▆▆▅▅▄

0,1
best_epoch,4.0
best_val_loss,0.00773
epoch,14.0
loss,0.00701
val_loss,0.00873


[34m[1mwandb[0m: Agent Starting Run: pghtfa2g with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='1.186 MB of 1.186 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▅█▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▂▂▁▁▂▁

0,1
best_epoch,19.0
best_val_loss,0.00645
epoch,29.0
loss,0.00531
val_loss,0.00693


[34m[1mwandb[0m: Agent Starting Run: ezn8tcor with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,19.0
best_val_loss,0.0073
epoch,29.0
loss,0.00543
val_loss,0.00818


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: qw152iwr with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='1.503 MB of 1.503 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▃▂▃▄▅▅▅▄▃▂▂▁▁▁█▁▂▁▂▂▂▃▂▂

0,1
best_epoch,14.0
best_val_loss,0.00637
epoch,24.0
loss,0.00759
val_loss,0.00837


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: hjix5l3m with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='11.639 MB of 11.639 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,4.0
best_val_loss,0.00774
epoch,14.0
loss,0.00743
val_loss,0.01141


[34m[1mwandb[0m: Agent Starting Run: erf6734r with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='1.503 MB of 1.503 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▄▁▁▁▃▇█▄▃▃▂▂

0,1
best_epoch,2.0
best_val_loss,0.00773
epoch,12.0
loss,0.00737
val_loss,0.01078


[34m[1mwandb[0m: Agent Starting Run: mbmi9kaq with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='1.503 MB of 1.503 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▆▁▂▂▁▁▁▁▁▁▃▂▁▅▁▃▂▃▂▅▅█▆

0,1
best_epoch,12.0
best_val_loss,0.00742
epoch,22.0
loss,0.00606
val_loss,0.00904


[34m[1mwandb[0m: Agent Starting Run: oyw4qs5a with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='0.014 MB of 0.014 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▂▁▁▁▁▂▂▃▄▄▃▂▁

0,1
best_epoch,4.0
best_val_loss,0.00774
epoch,14.0
loss,0.01117
val_loss,0.00851


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: btl22tsh with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='1.503 MB of 1.503 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▂▃▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,3.0
best_val_loss,0.00778
epoch,13.0
loss,0.00798
val_loss,0.00874


[34m[1mwandb[0m: Agent Starting Run: y7asi5nk with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▄▄▅▅▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁
val_loss,▅▁▁▅█▄▂▂▂▁▂▁

0,1
best_epoch,1.0
best_val_loss,0.00777
epoch,11.0
loss,0.00649
val_loss,0.00794


[34m[1mwandb[0m: Agent Starting Run: wqeucjyu with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='5.567 MB of 5.567 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▁▁▁▃▆▇▇▇▆▅▅

0,1
best_epoch,2.0
best_val_loss,0.00724
epoch,12.0
loss,0.00498
val_loss,0.01003


[34m[1mwandb[0m: Agent Starting Run: qyqcj6z1 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='11.639 MB of 11.639 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▂▂▃▃▄▄▅▅▅▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,6.0
best_val_loss,0.00773
epoch,16.0
loss,0.00659
val_loss,0.00782


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: h9ab6aiq with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='11.639 MB of 11.639 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▂▂▃▄▄▅▅▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▂▂▃▃▁▂▂▁▃▁

0,1
best_epoch,1.0
best_val_loss,0.00781
epoch,11.0
loss,0.00573
val_loss,0.00786


[34m[1mwandb[0m: Agent Starting Run: 2pk1sf7d with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='1.503 MB of 1.503 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▄▄▅▅▅▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▂▁▁▁▁▁▁▁▁▁▁▁▂▂▃▅

0,1
best_epoch,6.0
best_val_loss,0.0077
epoch,16.0
loss,0.0065
val_loss,0.01367


[34m[1mwandb[0m: Agent Starting Run: 5fgxodue with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▂▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▇▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▃▂▂▂▂▂▂▂▂▂▆▂▂▃▂▂▃█▁▃█▆▁▂▁▄▁▃▁▅▂▆▂

0,1
best_epoch,23.0
best_val_loss,0.00698
epoch,33.0
loss,0.00638
val_loss,0.00766


[34m[1mwandb[0m: Agent Starting Run: z9ov4ovx with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='5.567 MB of 5.567 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃█▂▁▁▂▂▂▂▂▂▃▃▃

0,1
best_epoch,3.0
best_val_loss,0.00776
epoch,13.0
loss,0.00732
val_loss,0.00812


[34m[1mwandb[0m: Agent Starting Run: rvm5iu89 with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='1.503 MB of 1.503 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▁▂▁▂▄▄▄▅▆▇██▆

0,1
best_epoch,2.0
best_val_loss,0.00887
epoch,12.0
loss,0.00858
val_loss,0.01393


[34m[1mwandb[0m: Agent Starting Run: 64k1b29x with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='1.503 MB of 1.503 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▅▃▃▅█▇▄▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▂▂▂▃▃▄

0,1
best_epoch,17.0
best_val_loss,0.00936
epoch,27.0
loss,0.01101
val_loss,0.01524


[34m[1mwandb[0m: Agent Starting Run: 6oax41bn with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='11.639 MB of 11.639 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▂▂▃▃▄▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▁▁▁▁▁▂▂▃▃▃▂▂

0,1
best_epoch,3.0
best_val_loss,0.00783
epoch,13.0
loss,0.00788
val_loss,0.01378


[34m[1mwandb[0m: Agent Starting Run: cq8jsy62 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▃▄▄▅▅▆▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▂▁▁▁▁▁▁▁▁▁▁▁▂▂▂▁▁

0,1
best_epoch,7.0
best_val_loss,0.00777
epoch,17.0
loss,0.00733
val_loss,0.00812


[34m[1mwandb[0m: Agent Starting Run: 35804tv6 with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
loss,█▂▂▁▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▄█▅▅▆▆▅▄▃▃▃▄▃▃▃▃▃▃▃▆▂▂▅▃▃▂▂▂▂▂▁▂▁▁▁▃▃▃▃▃

0,1
best_epoch,40.0
best_val_loss,0.00656
epoch,50.0
loss,0.00661
val_loss,0.00776


[34m[1mwandb[0m: Agent Starting Run: a2lqj25z with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▄▄▅▅▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁
val_loss,▇▁█▃▂▅▄▆▆▆▇▇

0,1
best_epoch,1.0
best_val_loss,0.00773
epoch,11.0
loss,0.00703
val_loss,0.00929


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 9k3cg0vp with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='11.639 MB of 11.639 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▂▂▃▃▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃▄▁▂▃▂▆▂▃▃▃█▂

0,1
best_epoch,2.0
best_val_loss,0.007
epoch,12.0
loss,0.0062
val_loss,0.00753


[34m[1mwandb[0m: Agent Starting Run: 5mxjnsgs with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▃▄▄▅▅▆▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▄▆▆▄▆█▄▁▃▄▄▂▃▄▄▅▅▄

0,1
best_epoch,7.0
best_val_loss,0.0066
epoch,17.0
loss,0.00685
val_loss,0.00776


[34m[1mwandb[0m: Agent Starting Run: f1eqe4gw with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='11.639 MB of 11.639 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▄▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,14.0
best_val_loss,0.00701
epoch,24.0
loss,0.0061
val_loss,0.00742


[34m[1mwandb[0m: Agent Starting Run: za8ekwv9 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇███
loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▂▂▂▂▂▂▂▂▂▂▂▂▂▂▁▂▂▂▂▂▂▂▂▂▁▁▁▂▁▂▂▂▂▁▁

0,1
best_epoch,25.0
best_val_loss,0.00665
epoch,35.0
loss,0.00591
val_loss,0.00687


[34m[1mwandb[0m: Agent Starting Run: ucu1dkdo with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▃▃▃▄▄▄▅▅▅▆▆▆▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▇▄▃█▇▃▃▃▃▅▃▁▃▄▄▃▃▁▃▁▂▂

0,1
best_epoch,11.0
best_val_loss,0.00718
epoch,21.0
loss,0.00612
val_loss,0.00746


[34m[1mwandb[0m: Agent Starting Run: whhh9w9l with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▄▄▅▅▆▇▇█
loss,█▂▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▂▃▂▂▂▂▃▃▃▃

0,1
best_epoch,1.0
best_val_loss,0.00774
epoch,11.0
loss,0.00708
val_loss,0.00903


[34m[1mwandb[0m: Agent Starting Run: vls47fbq with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='1.503 MB of 1.503 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
loss,█▃▆▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▄
val_loss,▆█▇▃▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,163.0
best_val_loss,0.00775
epoch,173.0
loss,0.00848
val_loss,0.00776


[34m[1mwandb[0m: Agent Starting Run: te2e03tl with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='5.567 MB of 5.567 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂█▂▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,4.0
best_val_loss,0.00774
epoch,14.0
loss,0.00728
val_loss,0.00785


[34m[1mwandb[0m: Agent Starting Run: k3gweqhw with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃█▄▃▃▃▂▂▂▂▂▂▂▂▂▂▃▂▂▁▂▁▁▂▂▂▁▁▁▁

0,1
best_epoch,19.0
best_val_loss,0.00628
epoch,29.0
loss,0.00529
val_loss,0.00671


[34m[1mwandb[0m: Agent Starting Run: 2n7we3vk with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇██
loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▃▃▃▃▃▃▃▃▂▃▂▃▃▂▁▂▁▁▁▁▁▁▁▂▁▂▂▂▂▁▂▁▂▂▂▂▂▂▂

0,1
best_epoch,30.0
best_val_loss,0.0061
epoch,40.0
loss,0.00586
val_loss,0.00704


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: xnsd9edu with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='1.503 MB of 1.503 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▃▃▃▃▃▃▃▃▂▂▃▂▂▁▁▂▃▃▃▃▃▄▃▃▅

0,1
best_epoch,15.0
best_val_loss,0.0068
epoch,25.0
loss,0.00542
val_loss,0.0081


[34m[1mwandb[0m: Agent Starting Run: 24q0115s with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='11.639 MB of 11.639 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▃▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,38.0
best_val_loss,0.00636
epoch,48.0
loss,0.0054
val_loss,0.00689


[34m[1mwandb[0m: Agent Starting Run: kzfu1k0e with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='1.503 MB of 1.503 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▄▅▅▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁
val_loss,▁▂▅█▃▃▂▂▂▂▃

0,1
best_epoch,0.0
best_val_loss,0.00772
epoch,10.0
loss,0.00918
val_loss,0.01315


[34m[1mwandb[0m: Agent Starting Run: 2vufsvgl with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='1.503 MB of 1.503 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇██
loss,█▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▇▇▇▇▇▆▅▂▃▄▁▂▅▅▅▃▂▅▅▃▃

0,1
best_epoch,12.0
best_val_loss,0.00613
epoch,22.0
loss,0.00605
val_loss,0.0069


[34m[1mwandb[0m: Agent Starting Run: opt3lujd with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='1.503 MB of 1.503 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
loss,█▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▅▂▂▂▂▂▁▁▁▂▃▂▁▃▁▂▁▁▁▂▂▂▁▂▁▁▁

0,1
best_epoch,17.0
best_val_loss,0.00638
epoch,27.0
loss,0.00492
val_loss,0.00685


[34m[1mwandb[0m: Agent Starting Run: fhwiyuqj with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
loss,█▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▆▇██▇▅▅▅▅▅▅▅▅▄▄▃▃▃▄▃▂▂▂▂▂▂▂▁▁▁▂▁▁▁▁▂▂▁▂▂

0,1
best_epoch,68.0
best_val_loss,0.00577
epoch,78.0
loss,0.00489
val_loss,0.00612


[34m[1mwandb[0m: Agent Starting Run: abstffs9 with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▄▄▅▅▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▅▁▁▁▁▁▁▁▁▂▃▄▅▆▇█

0,1
best_epoch,5.0
best_val_loss,0.00774
epoch,15.0
loss,0.00761
val_loss,0.00944


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: q61w2s3x with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂█▄▂▂▂▃▂▂▂▂▂▂▁▁▁▁▁▂▂▃▄▅▅▆▇

0,1
best_epoch,15.0
best_val_loss,0.00773
epoch,25.0
loss,0.0081
val_loss,0.00893


[34m[1mwandb[0m: Agent Starting Run: q5y2li0a with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▃▃▄▃▃▃▃▃▃▄▄▃▂▂▃▂▂▃▃▂▂▂▂▂▂▁▁▂▁▁▂▂▁▂▁▁▂▂▁

0,1
best_epoch,39.0
best_val_loss,0.00586
epoch,49.0
loss,0.00511
val_loss,0.00633


[34m[1mwandb[0m: Agent Starting Run: k1oplvz2 with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='3.062 MB of 3.062 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▃▃▃▃▃▄▄▄▅▅▅▅▅▆▆▆▇▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▅▆█▇▇▄▅▅▄▆▄▄▅▂▂▁▂▁▂▁▁▁▃▂▂▃▅▄

0,1
best_epoch,18.0
best_val_loss,0.00617
epoch,28.0
loss,0.00688
val_loss,0.00754


# GRU

In [None]:
# Configure the sweep – specify the parameters to search through, the search strategy, the optimization metric et all.
sweep_config = {
    'name': 'GRU',
    'method': 'bayes', #grid, random
    'metric': {
      'name': 'best_val_loss',
      'goal': 'minimize'   
    },
    'parameters': {
        'batch_size': {
            'values': [256, 128, 64, 32]
        },
        'dropout': {
            'values': [0, 0.1, 0.3]
        },
        'units': {
            'values': [64, 128, 256]
        },
        'timestep': {
            'values': [3, 6, 12, 24]
        },
        'lr': {
            'values': [1e-2, 1e-1]
        },
        'layers': {
            'values': [1, 2, 4, 8]
        },
        
    }
}

In [None]:
sweep_id = wandb.sweep(sweep_config, entity="ancy", project="DF1_RESIDUAL_GRU")

Create sweep with ID: wzwodd2r
Sweep URL: https://wandb.ai/ancy/DF1_RESIDUAL_GRU/sweeps/wzwodd2r


In [None]:
def create_gru():
    config_defaults = {
    'batch_size': 128,
    'lr': 1e-3,
    'units': 64,
    'timestep': 3,
    'dropout': 0.3,
    'layers': 1,
    }

    wandb.init(config=config_defaults)
    config = wandb.config

    batch_size = config.batch_size
    lr         = config.lr
    num_units  = config.units
    timestep   = config.timestep
    dropout    = config.dropout
    layers     = config.layers

    train_X, train_y, valid_X, valid_y, test_X, test_y = make_data(hourly, timestep, resid_check=True)
    model = Sequential()

    if layers > 1:
      model.add(GRU(units = num_units, input_shape=(train_X.shape[1], train_X.shape[2]), dropout=dropout, return_sequences=True))

      for i in range(layers-2):
        model.add(GRU(units = num_units, dropout=dropout, return_sequences=True))

      model.add(GRU(units = num_units, dropout=dropout))

    else:
      model.add(GRU(units = num_units, input_shape=(train_X.shape[1], train_X.shape[2]), dropout=dropout))

    model.add(Dense(units = 1))
    lr = config.lr
    model.compile(
        loss="mse",
        optimizer=Adam(learning_rate=lr)
    )
    
    model.fit(train_X, train_y, batch_size=config.batch_size,
              epochs=200, verbose=0, shuffle=False,
              validation_data=(valid_X, valid_y),
              callbacks=[WandbCallback(),
                          EarlyStopping(patience=10, restore_best_weights=True), ReduceLROnPlateau(monitor='val_loss',patience=5, min_lr=1e-6)])

    return model

In [None]:
wandb.agent(sweep_id, create_gru, count=50)

[34m[1mwandb[0m: Agent Starting Run: ctxhgqs5 with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='1.917 MB of 1.917 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▃▃▃▄▄▅▅▅▆▆▆▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▇█▂▂▁▁▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,10.0
best_val_loss,0.00747
epoch,20.0
loss,0.00699
val_loss,0.00859


[34m[1mwandb[0m: Agent Starting Run: 8frbp8ir with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='2.349 MB of 2.349 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃▁▁▁▂▅█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,15.0
best_val_loss,0.00773
epoch,25.0
loss,0.00637
val_loss,0.00777


[34m[1mwandb[0m: Agent Starting Run: 3zuzb2ap with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='2.349 MB of 2.349 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▃▃▃▃▄▄▄▅▅▅▆▆▆▆▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▆▃█▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,13.0
best_val_loss,0.00773
epoch,23.0
loss,0.00684
val_loss,0.00775


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: csui6mlu with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='2.349 MB of 2.349 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▇▄▁▃▇█▂▁▁▁▂▂▃

0,1
best_epoch,2.0
best_val_loss,0.00774
epoch,12.0
loss,0.0076
val_loss,0.00956


[34m[1mwandb[0m: Agent Starting Run: srvzf9l5 with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.642 MB of 2.642 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,12.0
best_val_loss,0.00665
epoch,22.0
loss,0.00588
val_loss,0.00706


[34m[1mwandb[0m: Agent Starting Run: shsrdrfz with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.642 MB of 2.642 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▄▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,24.0
best_val_loss,0.00585
epoch,34.0
loss,0.00505
val_loss,0.00703


[34m[1mwandb[0m: Agent Starting Run: ubvdjk7u with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.642 MB of 2.642 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,25.0
best_val_loss,0.00612
epoch,35.0
loss,0.00465
val_loss,0.0071


[34m[1mwandb[0m: Agent Starting Run: tk29dc0w with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.642 MB of 2.642 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▄▄▅▅▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▃▆█▂▁▁▁▂▁▂▆▅▄▃▃

0,1
best_epoch,5.0
best_val_loss,0.0065
epoch,15.0
loss,0.00493
val_loss,0.01385


[34m[1mwandb[0m: Agent Starting Run: ejbz60zx with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.642 MB of 2.642 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,22.0
best_val_loss,0.00585
epoch,32.0
loss,0.00479
val_loss,0.00683


[34m[1mwandb[0m: Agent Starting Run: mtc3ouqo with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.642 MB of 2.642 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂█▁▂▁▂▁▄▁▃▄▃▃▃▃

0,1
best_epoch,4.0
best_val_loss,0.0059
epoch,14.0
loss,0.00534
val_loss,0.01788


[34m[1mwandb[0m: Agent Starting Run: sn99d59i with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.642 MB of 2.642 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▃▃▃▃▃▄▄▄▅▅▅▅▅▆▆▆▇▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▃▃▂▁▃▁▁▂▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂

0,1
best_epoch,18.0
best_val_loss,0.00589
epoch,28.0
loss,0.00515
val_loss,0.0087


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 7waq8qv7 with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.642 MB of 2.642 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,29.0
best_val_loss,0.00734
epoch,39.0
loss,0.00557
val_loss,0.00967


[34m[1mwandb[0m: Agent Starting Run: mzph3vry with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.642 MB of 2.642 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▆▁▂▁▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,14.0
best_val_loss,0.0058
epoch,24.0
loss,0.00517
val_loss,0.00786


[34m[1mwandb[0m: Agent Starting Run: rak3i8e4 with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.642 MB of 2.642 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▃▃▃▄▄▅▅▅▆▆▆▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▄█▂▁▁▃▁▁▂▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,10.0
best_val_loss,0.00712
epoch,20.0
loss,0.00522
val_loss,0.00995


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: g0ve2s2q with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='7.170 MB of 7.170 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▄▅▅▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁
val_loss,▁▁▂▂▂▂█▇▇▇▆

0,1
best_epoch,0.0
best_val_loss,0.00757
epoch,10.0
loss,0.00571
val_loss,0.0297


[34m[1mwandb[0m: Agent Starting Run: v2tvar6w with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.642 MB of 2.642 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃█▃▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,4.0
best_val_loss,0.00661
epoch,14.0
loss,0.00543
val_loss,0.00752


[34m[1mwandb[0m: Agent Starting Run: kpqsn8ui with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▁█▄▄▁▂▁▁▁▁▇▅▄▃▃

0,1
best_epoch,4.0
best_val_loss,0.00857
epoch,14.0
loss,0.00475
val_loss,0.01784


[34m[1mwandb[0m: Agent Starting Run: vki3516i with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.642 MB of 2.642 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▃▁▁▁▁▁▁▁▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,41.0
best_val_loss,0.00743
epoch,51.0
loss,0.00594
val_loss,0.00743


[34m[1mwandb[0m: Agent Starting Run: azwb7g50 with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='7.170 MB of 7.170 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,3.0
best_val_loss,0.00811
epoch,13.0
loss,0.00786
val_loss,0.0096


[34m[1mwandb[0m: Agent Starting Run: cqib1637 with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='7.170 MB of 7.170 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▃▄▄▅▅▅▆▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▆▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,8.0
best_val_loss,0.00696
epoch,18.0
loss,0.00608
val_loss,0.0086


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: yzqs0ljs with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.642 MB of 2.642 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,199.0
best_val_loss,0.00811
epoch,199.0
loss,0.00661
val_loss,0.00811


[34m[1mwandb[0m: Agent Starting Run: zz7h13lh with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.642 MB of 2.642 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▇█▆▄▄▃▂▃▂▂▂▂▂▁▁▁▂▁▁▁▁▁▁▁▁▁▂▁▁▁▁

0,1
best_epoch,20.0
best_val_loss,0.00607
epoch,30.0
loss,0.00534
val_loss,0.00638


[34m[1mwandb[0m: Agent Starting Run: 73yeie7f with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='7.170 MB of 7.170 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▄▄▅▅▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,1.0
best_val_loss,0.00899
epoch,11.0
loss,0.006
val_loss,0.00988


[34m[1mwandb[0m: Agent Starting Run: whrk217a with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='2.642 MB of 2.642 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▆█▂▂▂▁▁▁▁▁▁▁▁▂▁▁▁▁▁▂▁▁▁▁▁▁▁▁

0,1
best_epoch,17.0
best_val_loss,0.01731
epoch,27.0
loss,0.01333
val_loss,0.039


[34m[1mwandb[0m: Agent Starting Run: ggxdh3ay with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='7.170 MB of 7.170 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▃▄▄▃▃▂▃▂▂▂▁▂▂▁▁▃▁▁▂▂▁▁▁▁

0,1
best_epoch,14.0
best_val_loss,0.00604
epoch,24.0
loss,0.0053
val_loss,0.00669


[34m[1mwandb[0m: Agent Starting Run: lo08b995 with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 256


[34m[1mwandb[0m: [32m[41mERROR[0m Error while calling W&B API: context deadline exceeded (<Response [500]>)





VBox(children=(Label(value='34.348 MB of 34.348 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▁▂▂▂▂▂▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▇▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,23.0
best_val_loss,0.00773
epoch,33.0
loss,0.00639
val_loss,0.00777


[34m[1mwandb[0m: Agent Starting Run: h2blj6id with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='4.210 MB of 4.210 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▄▄▅▅▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▄▃▃▁▁▁▁▄▂▃▆▇▇█▇

0,1
best_epoch,5.0
best_val_loss,0.00714
epoch,15.0
loss,0.00582
val_loss,0.01199


[34m[1mwandb[0m: Agent Starting Run: 19cfmz2m with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='2.349 MB of 2.349 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,17.0
best_val_loss,0.00772
epoch,27.0
loss,0.00662
val_loss,0.00776


[34m[1mwandb[0m: Agent Starting Run: ewld1aqf with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='2.349 MB of 2.349 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▃▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃█▅▃▄▃▃▃▃▃▃▄▂▂▁▁▁▁▁▁▁▂▁▁▂▂▂

0,1
best_epoch,16.0
best_val_loss,0.00605
epoch,26.0
loss,0.00451
val_loss,0.00634


[34m[1mwandb[0m: Agent Starting Run: 008unnrb with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='0.557 MB of 0.557 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▅▁▁▁▁▁▂▂▃▄▃▃▃

0,1
best_epoch,3.0
best_val_loss,0.00782
epoch,13.0
loss,0.00655
val_loss,0.01271


[34m[1mwandb[0m: Agent Starting Run: 6w907wi8 with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='4.210 MB of 4.210 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃▅▂▂▁▃▄▄▂▂▇█▇█▇

0,1
best_epoch,4.0
best_val_loss,0.00745
epoch,14.0
loss,0.00523
val_loss,0.01072


[34m[1mwandb[0m: Agent Starting Run: m6hy8n7f with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='0.773 MB of 0.773 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▁▁▁▁▅▄▅▃▂▂▂▂

0,1
best_epoch,3.0
best_val_loss,0.02001
epoch,13.0
loss,0.00669
val_loss,0.02862


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: c6aznhld with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 1
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='0.260 MB of 0.260 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▃▄▄▅▅▅▆▆▆▇▇██
loss,█▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▇█▁▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,8.0
best_val_loss,0.00991
epoch,18.0
loss,0.00555
val_loss,0.01085


[34m[1mwandb[0m: Agent Starting Run: l87mqzo5 with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='34.348 MB of 34.348 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▁▁▁▁▁▂▁▂▂▁▁▁▁▁
val_loss,▂▁▁▁▁█▁▃█▁▁▁▁▁▁

0,1
best_epoch,4.0
best_val_loss,0.00783
epoch,14.0
loss,0.00871
val_loss,0.0167


[34m[1mwandb[0m: Agent Starting Run: 71f5dcvv with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='0.557 MB of 0.557 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▅▁▂▂▂▁▁▂▂▁▂▁

0,1
best_epoch,2.0
best_val_loss,0.00883
epoch,12.0
loss,0.00741
val_loss,0.01049


[34m[1mwandb[0m: Agent Starting Run: 3phwi6xy with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='8.792 MB of 8.792 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▁▂▃▁▁█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,22.0
best_val_loss,0.00773
epoch,32.0
loss,0.00637
val_loss,0.00773


[34m[1mwandb[0m: Agent Starting Run: ruhz2nm5 with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='4.210 MB of 4.210 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▄▅▄▃▃▂▂▂▂▂▁▁▂▁▁▁▅▅▅▆▆▃▃▄▃

0,1
best_epoch,15.0
best_val_loss,0.00707
epoch,25.0
loss,0.00573
val_loss,0.0098


[34m[1mwandb[0m: Agent Starting Run: numv8adb with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='0.557 MB of 0.557 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,22.0
best_val_loss,0.00773
epoch,32.0
loss,0.00637
val_loss,0.00774


[34m[1mwandb[0m: Agent Starting Run: t61zbreu with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='8.792 MB of 8.792 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,4.0
best_val_loss,0.00753
epoch,14.0
loss,0.00807
val_loss,0.00757


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: xpmxpkjt with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='2.349 MB of 2.349 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▃▃▃▃▄▄▄▅▅▅▆▆▆▆▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▂▁▂▄▇▅▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,13.0
best_val_loss,0.00773
epoch,23.0
loss,0.00638
val_loss,0.00777


[34m[1mwandb[0m: Agent Starting Run: 4kt0z7il with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='34.348 MB of 34.348 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,█▁▁▂▆▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▇█▁▆▄▂▄▇▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,14.0
best_val_loss,0.00774
epoch,24.0
loss,0.00689
val_loss,0.00861


[34m[1mwandb[0m: Agent Starting Run: i112q5z2 with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 24
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='16.231 MB of 16.231 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▁▂▁▂█▁▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,38.0
best_val_loss,0.00736
epoch,48.0
loss,0.00598
val_loss,0.00737


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: wgwh3sfa with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='0.557 MB of 0.557 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▁▂▁▂▁▂▂▃█▆▅▄▄

0,1
best_epoch,2.0
best_val_loss,0.00746
epoch,12.0
loss,0.00432
val_loss,0.02396


[34m[1mwandb[0m: Agent Starting Run: w8t8lggx with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='1.155 MB of 1.155 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃▇▅▁▁▂▄▇█▄▁▁▁▂▂

0,1
best_epoch,4.0
best_val_loss,0.00773
epoch,14.0
loss,0.00767
val_loss,0.00901


[34m[1mwandb[0m: Agent Starting Run: tr03xm9t with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='1.155 MB of 1.155 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▃▄▄▅▅▅▆▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▅█▂▃▃▂▂▁▁▂▁▂▁▁▂▂▂▁▁

0,1
best_epoch,8.0
best_val_loss,0.00759
epoch,18.0
loss,0.00522
val_loss,0.0079


[34m[1mwandb[0m: Agent Starting Run: cxz3qpb7 with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='2.349 MB of 2.349 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▁▁▁▁▁▁▁▂▁▁▁▁▁▁
val_loss,▂▂▂▃▁▂▁▂▄█▂▂▂▂▂

0,1
best_epoch,4.0
best_val_loss,0.00774
epoch,14.0
loss,0.00708
val_loss,0.00952


[34m[1mwandb[0m: Agent Starting Run: fx4b7azi with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.01
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='2.349 MB of 2.349 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▃▃▃▃▄▄▄▅▅▅▆▆▆▆▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃▇█▃▂▂▃▃▁▁▁▁▁▁▁▁▂▃▂▃▃▃▃▃

0,1
best_epoch,13.0
best_val_loss,0.0067
epoch,23.0
loss,0.00457
val_loss,0.00814


[34m[1mwandb[0m: Agent Starting Run: 4deswr8s with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 4
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 128





VBox(children=(Label(value='4.210 MB of 4.210 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▇█▃▁▁▂▃▃▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,20.0
best_val_loss,0.00773
epoch,30.0
loss,0.00682
val_loss,0.00774


[34m[1mwandb[0m: Agent Starting Run: sysqlpdr with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 2
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 3
[34m[1mwandb[0m: 	units: 256





VBox(children=(Label(value='7.170 MB of 7.170 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▅▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,44.0
best_val_loss,0.00806
epoch,54.0
loss,0.00863
val_loss,0.0082


[34m[1mwandb[0m: Agent Starting Run: w4ebqgqv with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	layers: 8
[34m[1mwandb[0m: 	lr: 0.1
[34m[1mwandb[0m: 	timestep: 6
[34m[1mwandb[0m: 	units: 64





VBox(children=(Label(value='0.299 MB of 0.299 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▄▄▅▅▅▆▆▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▁▁▁▂▃▂▁▁▁▃▅█▁▁▁▁▁

0,1
best_epoch,6.0
best_val_loss,0.00773
epoch,16.0
loss,0.0075
val_loss,0.00776


# Transformer

In [8]:
sweep_config = {
    'name': 'New_Transformer',
    'method': 'bayes', #grid, random
    'metric': {
      'name': 'best_val_loss',
      'goal': 'minimize'   
    },
    'parameters': {
        'batch_size': {
            'values': [128, 64, 32]
        },
        'dropout': {
            'values': [0, 0.1, 0.3]
        },
        'timestep': {
            'values': [3, 6, 12, 24]
        },
        'n_heads': {
            'values': [2, 4, 8]
        },
        'ff_dim': {
            'values': [128,256]
        },
        'n_blocks': {
            'values': [2, 4, 8]
        },
        'embed_dim': {
            'values': [32, 64, 128]
        },
        'time_2_vec': {
            'values': [2,3,4]
        }
    }
}

In [9]:
sweep_id = wandb.sweep(sweep_config, entity="ancy", project="DF1_RESIDUAL_TRANS_testando")

Create sweep with ID: khvwgb24
Sweep URL: https://wandb.ai/ancy/DF1_RESIDUAL_TRANS_testando/sweeps/khvwgb24


In [10]:
class TransformerBlock(layers.Layer):
    def __init__(self, embed_dim, feat_dim, num_heads, ff_dim, rate = 0.1):
        super(TransformerBlock, self).__init__()
        self.att = layers.MultiHeadAttention(num_heads = num_heads, key_dim = embed_dim)
        self.ffn = keras.Sequential( [layers.Dense(ff_dim, activation = "gelu"), layers.Dense(feat_dim),] )
        self.layernorm1 = layers.BatchNormalization()
        self.layernorm2 = layers.BatchNormalization()
        self.dropout1 = layers.Dropout(rate)
        self.dropout2 = layers.Dropout(rate)
        self.embed_dim = embed_dim
        self.feat_dim = feat_dim
        self.num_heads = num_heads
        self.ff_dim = ff_dim
        self.rate = rate

    def call(self, inputs, training):
        attn_output = self.att(inputs, inputs)
        attn_output = self.dropout1(attn_output, training = training)
        out1 = self.layernorm1(inputs + attn_output)
        ffn_output = self.ffn(out1)
        ffn_output = self.dropout2(ffn_output, training = training)
        return self.layernorm2(out1 + ffn_output)

    def get_config(self):

        config = super().get_config()
        config.update({
            'embed_dim': self.embed_dim,
            'feat_dim': self.feat_dim,
            'num_heads': self.num_heads,
            'ff_dim': self.ff_dim,
            'rate': self.rate,
        })
        return config

In [11]:
class Time2Vec(keras.layers.Layer):
    def __init__(self, kernel_size = 1):
        super(Time2Vec, self).__init__(trainable = True, name = 'Time2VecLayer')
        self.k = kernel_size

    def build(self, input_shape):
        # trend
        self.wb = self.add_weight(name = 'wb', shape = (input_shape[1],), initializer = 'uniform', trainable = True)
        self.bb = self.add_weight(name = 'bb', shape = (input_shape[1],), initializer = 'uniform', trainable = True)
        # periodic
        self.wa = self.add_weight(name = 'wa', shape = (1, input_shape[1], self.k), initializer = 'uniform', trainable = True)
        self.ba = self.add_weight(name = 'ba', shape = (1, input_shape[1], self.k), initializer = 'uniform', trainable = True)
        super(Time2Vec, self).build(input_shape)

    def call(self, inputs, **kwargs):
        bias = self.wb * inputs + self.bb
        dp = K.dot(inputs, self.wa) + self.ba
        wgts = K.sin(dp) # or K.cos(.)
        ret = K.concatenate([K.expand_dims(bias, -1), wgts], -1)
        ret = K.reshape(ret, (-1, inputs.shape[1] * (self.k + 1)))
        return ret

    def compute_output_shape(self, input_shape):
        return (input_shape[0], input_shape[1] * (self.k + 1))

    def get_config(self):

        config = super().get_config()
        config.update({
            'kernel_size': self.k,
        })
        return config

In [12]:
EPOCHS = 50
N_HEADS = 8
N_FOLDS = 10
FF_DIM = 256
N_BLOCKS = 6
EMBED_DIM = 64
BATCH_SIZE = 16
WINDOW_SIZE = 65
DROPUT_RATE = 0.0
TIME_2_VEC_DIM = 3
TRAIN_MODEL = True
SKIP_CONNECTION_STRENGTH = 0.9

In [13]:
def get_model(input_shape, time2vec_dim = 3):
    inp = Input(input_shape)
    x = inp

    time_embedding = keras.layers.TimeDistributed(Time2Vec(time2vec_dim - 1))(x)
    x = Concatenate(axis = -1)([x, time_embedding])
    x = layers.LayerNormalization(epsilon = 1e-6)(x)

    for k in range(N_BLOCKS):
        x_old = x
        transformer_block = TransformerBlock(EMBED_DIM, input_shape[-1] + ( input_shape[-1] * time2vec_dim), N_HEADS, FF_DIM, DROPUT_RATE)
        x = transformer_block(x)
        x = ((1.0 - SKIP_CONNECTION_STRENGTH) * x) + (SKIP_CONNECTION_STRENGTH * x_old)

    x = layers.Flatten()(x)

    x = layers.Dense(128, activation = "selu")(x)
    x = layers.Dropout(DROPUT_RATE)(x)
    x = Dense(1, activation = 'linear')(x)

    out = x
    model = Model(inp, out)
    return model

In [14]:
def get_model2():

    config_defaults = {
    'batch_size': 128,
    'lr': 1e-3,
    'timestep': 3,
    'n_heads': 8,
    'ff_dim':256,
    'n_blocks':6,
    'embed_dim':64,
    'dropout':0,
    'time_2_vec':3,
    }

    wandb.init(config=config_defaults)
    config = wandb.config
    train_X, train_y, valid_X, valid_y, test_X, test_y, scaler, scaler_y = make_data2(hourly, config.timestep, resid_check=True)


    batch_size=config.batch_size
    lr=config.lr
    N_HEADS = config.n_heads
    FF_DIM = config.ff_dim
    N_BLOCKS = config.n_blocks
    EMBED_DIM = config.embed_dim
    DROPUT_RATE = config.dropout
    time2vec_dim = config.time_2_vec

    input_shape = train_X.shape[1:]
    inp = Input(input_shape)
    x = inp

    time_embedding = keras.layers.TimeDistributed(Time2Vec(time2vec_dim - 1))(x)
    x = Concatenate(axis = -1)([x, time_embedding])
    x = layers.LayerNormalization(epsilon = 1e-6)(x)

    for k in range(N_BLOCKS):
        x_old = x
        transformer_block = TransformerBlock(EMBED_DIM, input_shape[-1] + ( input_shape[-1] * time2vec_dim), N_HEADS, FF_DIM, DROPUT_RATE)
        x = transformer_block(x)
        x = ((1.0 - SKIP_CONNECTION_STRENGTH) * x) + (SKIP_CONNECTION_STRENGTH * x_old)

    x = layers.Flatten()(x)

    x = layers.Dense(128, activation = "selu")(x)
    x = layers.Dropout(DROPUT_RATE)(x)
    x = Dense(1, activation = 'linear')(x)

    out = x
    model = Model(inp, out)

    model.compile(
        loss="mse",
        optimizer=Adam(learning_rate=lr)
                  )

    model.fit(train_X, train_y, batch_size=config.batch_size,
              epochs=200, verbose=0, shuffle=False,
              validation_data=(valid_X, valid_y),
              callbacks=[WandbCallback(),
                          EarlyStopping(patience=10, restore_best_weights=True), ReduceLROnPlateau(monitor='val_loss',patience=5, min_lr=1e-6)]
              )
    
    yhat = model.predict(test_X)
    yhat_inv = scaler_y.inverse_transform(yhat)
    resid_sum = (yhat_inv+resid_test.values[config.timestep:])

    print(sqrt(mean_squared_error(resid_sum, scaler_y.inverse_transform(test_y))))
    print(mean_absolute_error(resid_sum, scaler_y.inverse_transform(test_y)))
    print(mean_absolute_percentage_error(resid_sum, scaler_y.inverse_transform(test_y)))
    
    return model

In [None]:
wandb.agent(sweep_id, get_model2, count=50)

[34m[1mwandb[0m: Agent Starting Run: 8qzth7wm with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 4
[34m[1mwandb[0m: 	n_heads: 4
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 12
[34m[1mwandb[0m: Currently logged in as: [33mancy[0m (use `wandb login --relogin` to force relogin)


2664.216767763912
2280.8695566046417
0.5153221867046072



VBox(children=(Label(value='12.965 MB of 12.965 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▁▁▁▁▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,50.0
best_val_loss,0.02972
epoch,60.0
loss,0.292
val_loss,0.04391


[34m[1mwandb[0m: Agent Starting Run: 1k8nqer3 with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embed_dim: 64
[34m[1mwandb[0m: 	ff_dim: 128
[34m[1mwandb[0m: 	n_blocks: 2
[34m[1mwandb[0m: 	n_heads: 2
[34m[1mwandb[0m: 	time_2_vec: 2
[34m[1mwandb[0m: 	timestep: 3


3356.4142545245372
2528.644908422214
3.144097363072469



VBox(children=(Label(value='2.777 MB of 2.777 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▂▂▃▃▄▄▅▅▆▆▇▇█
loss,█▅▄▃▂▂▂▁▁▁▁▁▁▁
val_loss,█▂▁▁▂▄▃▄▃▃▃▃▃▃

0,1
best_epoch,3.0
best_val_loss,0.34952
epoch,13.0
loss,0.1536
val_loss,1.16529


[34m[1mwandb[0m: Agent Starting Run: uvuxr7zy with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	embed_dim: 64
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 8
[34m[1mwandb[0m: 	n_heads: 2
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 24


2647.0222884145696
2051.266251339578
2.1352899870488824



VBox(children=(Label(value='25.876 MB of 25.876 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▁▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▆▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▂▂▂▂▂▂▃▂▂▂▄▃▃▂▂▂▂▁▁▂▁▁▁▁▁▂▁▁▁▁▁

0,1
best_epoch,21.0
best_val_loss,0.0452
epoch,31.0
loss,0.28504
val_loss,0.05223


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 9uuf7qs0 with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embed_dim: 64
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 8
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 12


1123.4124524135539
944.0940819431394
0.8697343882076959



VBox(children=(Label(value='49.980 MB of 49.980 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇▇██
loss,█▃▂▂▂▂▂▂▁▁▁▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂█▁▂▂▂▁▁▁▁▁▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,32.0
best_val_loss,0.0055
epoch,42.0
loss,0.01263
val_loss,0.00648


[34m[1mwandb[0m: Agent Starting Run: 9fx18oga with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 8
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 24


2748.613769932641
2385.9644638522645
0.4734803498558154



VBox(children=(Label(value='35.052 MB of 35.052 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▂▂▂▃▃▃▃▄▄▄▅▅▅▆▆▆▆▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃▂▂▅▄▄█▂▂▂▂▁▁▁▂▂▂▂▃▂▃▂▂▃

0,1
best_epoch,13.0
best_val_loss,0.06585
epoch,23.0
loss,0.30431
val_loss,0.12657


[34m[1mwandb[0m: Agent Starting Run: h5dbpfvg with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 8
[34m[1mwandb[0m: 	n_heads: 4
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 3


2087.787166877971
1727.162829597965
0.4681657190400313



VBox(children=(Label(value='0.326 MB of 0.326 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,█▂▁▁▁▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▃▄▂▅█▁▃▁▁▁▂▂▃▄▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,15.0
best_val_loss,0.03034
epoch,25.0
loss,0.00481
val_loss,0.04224


[34m[1mwandb[0m: Agent Starting Run: vjjblxrr with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embed_dim: 128
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 8
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 24


2222.9124638779713
1868.7695738767097
1.8347054919008632



VBox(children=(Label(value='90.111 MB of 90.111 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇██
loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▃▂▁▃▃█▁▄▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,12.0
best_val_loss,0.03374
epoch,22.0
loss,0.69505
val_loss,0.04006


[34m[1mwandb[0m: Agent Starting Run: b8aq1ptv with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 128
[34m[1mwandb[0m: 	n_blocks: 4
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 24


2430.057199921024
2018.7141907779262
3.602235415107296



VBox(children=(Label(value='18.690 MB of 18.690 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,14.0
best_val_loss,0.02595
epoch,24.0
loss,0.00478
val_loss,0.03072


[34m[1mwandb[0m: Agent Starting Run: 8gstoixd with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	embed_dim: 128
[34m[1mwandb[0m: 	ff_dim: 128
[34m[1mwandb[0m: 	n_blocks: 8
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 24


3099.338441304727
2543.2748717793365
0.46576741456025333



VBox(children=(Label(value='12.167 MB of 12.167 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▂▂▃▃▄▅▅▆▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▇▁▁▃▄▆▇▇███▇▇

0,1
best_epoch,2.0
best_val_loss,0.14461
epoch,12.0
loss,0.00468
val_loss,0.51141


[34m[1mwandb[0m: Agent Starting Run: sngt1kb1 with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 4
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 12


2629.722073908669
2073.0027449573163
0.6386603990821217



VBox(children=(Label(value='17.553 MB of 17.553 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▆▄▂▃▃▂▅▂█▅▃▂▁▁▁▁▁▂▂▁▁▁▁▂

0,1
best_epoch,14.0
best_val_loss,0.05893
epoch,24.0
loss,0.01536
val_loss,0.08595


[34m[1mwandb[0m: Agent Starting Run: ew8yf82n with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 128
[34m[1mwandb[0m: 	n_blocks: 4
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 6


2893.0172564564286
2451.2798565683634
1.5123184616473517



VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▃▃▃▄▄▅▅▅▆▆▆▇▇██
loss,█▂▂▅▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▆▅█▅▁▁▁▁▂▁▁▁▃▂▂▁▁▁

0,1
best_epoch,8.0
best_val_loss,0.0303
epoch,18.0
loss,0.08948
val_loss,0.09552


[34m[1mwandb[0m: Agent Starting Run: k7eyzp8o with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 8
[34m[1mwandb[0m: 	n_heads: 4
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 3


949.3784945267004
694.5805564980777
0.36056598509174387



VBox(children=(Label(value='19.878 MB of 19.878 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇██
loss,█▄▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▅▆▇▆▃▅▃█▄▃▁▂▂▃▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,31.0
best_val_loss,0.00527
epoch,41.0
loss,0.01263
val_loss,0.00565


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 2j7ik78h with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 2
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 24


2351.314975625149
1994.0752803422363
7.433062195886173



VBox(children=(Label(value='13.947 MB of 13.947 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▁▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▆▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,21.0
best_val_loss,0.02725
epoch,31.0
loss,0.00524
val_loss,0.0275


[34m[1mwandb[0m: Agent Starting Run: 34bdydqg with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 8
[34m[1mwandb[0m: 	n_heads: 2
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 24


2351.0772345390283
1867.040407336806
1.4927282767399026



VBox(children=(Label(value='21.281 MB of 21.281 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▂▂▃▄▄▅▅▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃▁▃▄▄▄█▆▆▆▃▃

0,1
best_epoch,1.0
best_val_loss,0.04859
epoch,11.0
loss,0.41225
val_loss,0.09003


[34m[1mwandb[0m: Agent Starting Run: nl2rzdor with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 2
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 6


1746.1209612334635
1489.306718777075
0.42360824043203327



VBox(children=(Label(value='8.805 MB of 8.805 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇████
loss,█▁▁▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▅▂█▄▂▁▁▁▁▁▁▁▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,52.0
best_val_loss,0.01133
epoch,62.0
loss,0.0051
val_loss,0.01142


[34m[1mwandb[0m: Agent Starting Run: f7e6zrny with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 4
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 6


3557.2388826503193
3024.1680719673873
1.134586409115118



VBox(children=(Label(value='15.840 MB of 15.840 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▁▁▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▇█▅▇▃▆▃▂▁▁▁▂▂▂▁▁▁▁▁

0,1
best_epoch,9.0
best_val_loss,0.18677
epoch,19.0
loss,0.04018
val_loss,0.35334


[34m[1mwandb[0m: Agent Starting Run: cuj9o646 with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 2
[34m[1mwandb[0m: 	n_heads: 4
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 12


2703.5168975222978
2154.1261617972423
2.7715493067090633



VBox(children=(Label(value='8.226 MB of 8.226 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▄▂▂▂▃██▂▄▄▁▁▆▂▂▂▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,20.0
best_val_loss,0.03316
epoch,30.0
loss,0.18685
val_loss,0.08896


[34m[1mwandb[0m: Agent Starting Run: g9dbqr0w with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 2
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 24


1943.3634176641528
1543.3931462279818
27.742297592546443



VBox(children=(Label(value='13.947 MB of 13.947 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▂▂▃▄▄▅▅▆▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▁▅▇█▇▆▃▃▄▄▄

0,1
best_epoch,1.0
best_val_loss,0.04733
epoch,11.0
loss,0.00832
val_loss,0.08398


[34m[1mwandb[0m: Agent Starting Run: at0d0lae with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 128
[34m[1mwandb[0m: 	n_blocks: 2
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 12


2210.836714671578
1726.1253519656811
2.022867372962887



VBox(children=(Label(value='9.375 MB of 9.375 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▂▂▁▁▁▂▃▄▆▃▄▄▄▃

0,1
best_epoch,4.0
best_val_loss,0.09342
epoch,14.0
loss,0.03514
val_loss,0.30534


[34m[1mwandb[0m: Agent Starting Run: z8be867f with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embed_dim: 128
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 8
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 24


1606.3483556260342
1293.5674669993991
0.600659887276636



VBox(children=(Label(value='90.111 MB of 90.111 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
loss,█▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▁█▁▂▇▃▄▁▁▂▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,17.0
best_val_loss,0.01864
epoch,27.0
loss,0.14163
val_loss,0.0741


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: ju39tvb6 with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 8
[34m[1mwandb[0m: 	n_heads: 4
[34m[1mwandb[0m: 	time_2_vec: 3
[34m[1mwandb[0m: 	timestep: 12


1059.0413837531237
786.8264748403843
0.3990560000068029



VBox(children=(Label(value='18.073 MB of 18.073 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇▇██
loss,█▄▄▃▂▂▂▂▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▅█▁▁▁▁▂▄▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,32.0
best_val_loss,0.00737
epoch,42.0
loss,0.02046
val_loss,0.01032


[34m[1mwandb[0m: Agent Starting Run: qscgzzes with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 8
[34m[1mwandb[0m: 	n_heads: 4
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 3


1550.8372370444777
1215.1064175915544
0.40766359221748694



VBox(children=(Label(value='19.878 MB of 19.878 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▂▂▃▃▃▄▄▅▅▅▆▆▆▇▇██
loss,█▄▂▂▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▃▂▁▆▂▁▁▁▁▂▁▃▂▂▂▂▂▁

0,1
best_epoch,8.0
best_val_loss,0.01521
epoch,18.0
loss,0.02225
val_loss,0.04413


[34m[1mwandb[0m: Agent Starting Run: oiiehna7 with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 128
[34m[1mwandb[0m: 	n_blocks: 8
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 24


1080.7077823245036
834.7825188861707
0.33014073357692186



VBox(children=(Label(value='30.471 MB of 30.471 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
loss,█▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▃▄▆▃▅█▅▆▄▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,58.0
best_val_loss,0.00626
epoch,68.0
loss,0.03312
val_loss,0.00675


[34m[1mwandb[0m: Agent Starting Run: 1b7yh3ng with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 128
[34m[1mwandb[0m: 	n_blocks: 4
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 24


2718.908768447552
2226.6274043945473
1.8609810176813495



VBox(children=(Label(value='18.690 MB of 18.690 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▂▂▃▃▄▄▅▅▅▆▆▇▇██
loss,█▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▂▅▂▁█▁▁▁▂▁▁▂▄▄▃▄▄

0,1
best_epoch,6.0
best_val_loss,0.08712
epoch,16.0
loss,0.91561
val_loss,0.61106


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: onkbxe9i with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embed_dim: 64
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 8
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 3
[34m[1mwandb[0m: 	timestep: 12


1410.6869137411566
1069.7461201568249
1.5802562114981784



VBox(children=(Label(value='40.113 MB of 40.113 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▂▂▂▃▃▃▄▄▄▅▅▅▆▆▆▇▇▇██
loss,█▃▂▂▂▂▂▂▁▁▁▁▁▁▁▂▁▁▁▁▁▁
val_loss,▇█▇▂▁▄▁▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,11.0
best_val_loss,0.01486
epoch,21.0
loss,0.01756
val_loss,0.04567


[34m[1mwandb[0m: Agent Starting Run: awpkvdon with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.1
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 128
[34m[1mwandb[0m: 	n_blocks: 8
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 3
[34m[1mwandb[0m: 	timestep: 6


1366.628936768744
1099.730326094772
0.6188362666855709



VBox(children=(Label(value='20.379 MB of 20.379 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
loss,█▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,▄▄█▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,55.0
best_val_loss,0.00991
epoch,65.0
loss,0.02212
val_loss,0.01167


[34m[1mwandb[0m: Agent Starting Run: 2cuzi9vg with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embed_dim: 128
[34m[1mwandb[0m: 	ff_dim: 256
[34m[1mwandb[0m: 	n_blocks: 8
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 6


899.7904937213336
667.2860520817387
0.412880247342367



VBox(children=(Label(value='84.969 MB of 84.969 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
loss,█▃▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▂▁▂▁▂▁▁▁▂▂▃▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
best_epoch,47.0
best_val_loss,0.00494
epoch,57.0
loss,0.01235
val_loss,0.00508


[34m[1mwandb[0m: Agent Starting Run: 7b99qzyp with config:
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embed_dim: 32
[34m[1mwandb[0m: 	ff_dim: 128
[34m[1mwandb[0m: 	n_blocks: 8
[34m[1mwandb[0m: 	n_heads: 8
[34m[1mwandb[0m: 	time_2_vec: 4
[34m[1mwandb[0m: 	timestep: 6
