# Text classification using TensorFlow: Sentiment on Reviews
# Hyperparameter Tuning

This notebook trains a binary classifier for sentiment analysis to classify restaurant food reviews as *negative* or *positive*, based on the text of the review where a sentiment score was previously calculated.


In [None]:
# Mount Google Drive at /content/drive so the data and results folders used
# later in the notebook are reachable from the Colab runtime.
from google.colab import drive
drive.mount('/content/drive')

Mounted at /content/drive


In [None]:
!pip install --upgrade -q wandb
import wandb
from wandb.keras import WandbCallback
import os
import random
import numpy as np
import pandas as pd
import shutil
import time
import datetime
from datetime import datetime, timedelta
from timeit import default_timer as timer
import pickle
import joblib
from sklearn.utils import shuffle
import tensorflow as tf
from tensorflow.keras import layers, losses
from tensorboard.plugins.hparams import api as hp
from tensorflow.keras.callbacks import ReduceLROnPlateau, ModelCheckpoint, Callback, EarlyStopping
from tensorflow.keras.optimizers import Adam, RMSprop, SGD, Nadam
import matplotlib
import matplotlib.pyplot as plt
import tqdm
from tensorflow import keras
from keras.utils import np_utils

[K     |████████████████████████████████| 1.8 MB 7.7 MB/s 
[K     |████████████████████████████████| 181 kB 47.4 MB/s 
[K     |████████████████████████████████| 145 kB 52.2 MB/s 
[K     |████████████████████████████████| 63 kB 1.7 MB/s 
[?25h  Building wheel for pathtools (setup.py) ... [?25l[?25hdone


In [None]:
# Report the CUDA compiler version and GPU status via shell escapes.
print('CUDA and NVIDIA GPU Information')
!/usr/local/cuda/bin/nvcc --version
!nvidia-smi

# Report the TensorFlow / Keras versions, whether eager execution is on, and
# how many GPUs TensorFlow can see.
print('\n')
print('TensorFlow version: {}'.format(tf.__version__))
print('Eager execution is: {}'.format(tf.executing_eagerly()))
print('Keras version: {}'.format(tf.keras.__version__))
print('Num GPUs Available: ', len(tf.config.list_physical_devices('GPU')))

CUDA and NVIDIA GPU Information
nvcc: NVIDIA (R) Cuda compiler driver
Copyright (c) 2005-2020 NVIDIA Corporation
Built on Mon_Oct_12_20:09:46_PDT_2020
Cuda compilation tools, release 11.1, V11.1.105
Build cuda_11.1.TC455_06.29190527_0
Wed Jul  6 02:23:01 2022       
+-----------------------------------------------------------------------------+
| NVIDIA-SMI 460.32.03    Driver Version: 460.32.03    CUDA Version: 11.2     |
|-------------------------------+----------------------+----------------------+
| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |
| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |
|                               |                      |               MIG M. |
|   0  Tesla P100-PCIE...  Off  | 00000000:00:04.0 Off |                    0 |
| N/A   39C    P0    26W / 250W |      0MiB / 16280MiB |      0%      Default |
|                               |                      |                  N/A |
+------------

In [None]:
# Reproducibility in TF
def init_seeds(seed=42):
    """Seed the RNGs used by the notebook and install a single-threaded TF session.

    Seeds Python's ``random``, NumPy's global generator and TensorFlow, sets the
    ``TF_CUDNN_DETERMINISTIC`` and ``TF_DETERMINISTIC_OPS`` environment
    variables, and registers a ``tf.compat.v1.Session`` (one intra-op and one
    inter-op thread) as the Keras backend session.

    Args:
        seed: Integer seed applied to all three generators.

    Returns:
        The ``tf.compat.v1.Session`` passed to ``set_session``.
    """
    random.seed(seed)
    np.random.seed(seed)
    tf.random.set_seed(seed)

    # Single-threaded op execution (presumably to avoid thread-scheduling
    # nondeterminism). The earlier bare ConfigProto() was overwritten
    # immediately and has been removed.
    session_conf = tf.compat.v1.ConfigProto(intra_op_parallelism_threads=1,
                                            inter_op_parallelism_threads=1)

    # Request deterministic kernels before the session is created.
    os.environ['TF_CUDNN_DETERMINISTIC'] = 'True'
    os.environ['TF_DETERMINISTIC_OPS'] = 'True'

    sess = tf.compat.v1.Session(graph=tf.compat.v1.get_default_graph(),
                                config=session_conf)
    tf.compat.v1.keras.backend.set_session(sess)
    return sess

In [None]:
# Seed all RNGs up front; the returned session is shown as the cell output.
init_seeds(seed=42)

<tensorflow.python.client.session.Session at 0x7f8e6294a9d0>

In [None]:
# Switch the working directory to the data folder on the mounted Drive.
%cd /content/drive/MyDrive/Yelp_Reviews/Data/

/content/drive/MyDrive/Yelp_Reviews/Data


In [None]:
# Read reviews with stars filtered to 1, 2 and 5
# (path is relative to the current working directory).
df = pd.read_parquet('YelpReviews_NLP_125stars.parquet')
print('Number of rows and columns:', df.shape)
# Last expression: rich display of the first rows.
df.head()

Number of rows and columns: (1541486, 2)


Unnamed: 0_level_0,stars_reviews,cleanReview
index,Unnamed: 1_level_1,Unnamed: 2_level_1
2,5.0,wonderful place get lunch staff friendly effic...
3,5.0,dedicated loving memory gary feldman greatest ...
5,5.0,love place everything menu delicious like tuna...
7,5.0,truely hidden gem place greatest buffalo chick...
9,5.0,seriously great fresh fantastic food spot pric...


In [None]:
# Recode to binary: 1- and 2-star reviews -> 0, 5-star reviews -> 1.
# The result is assigned back to the column instead of calling
# `.mask(..., inplace=True)` on `df['stars_reviews']`. Mutating a column
# selection in place is chained assignment, which does not update `df` when
# pandas Copy-on-Write is active.
# Both conditions are evaluated against the ORIGINAL star values, so the
# freshly written 1s (former 5s) can never be confused with 1-star reviews.
stars = df['stars_reviews']
df['stars_reviews'] = stars.mask(stars.isin([1, 2]), 0).mask(stars == 5, 1)

print('Number of reviews per group:')
df[['stars_reviews']].value_counts()

Number of reviews per group:


stars_reviews
0.0              770743
1.0              770743
dtype: int64

In [None]:
# Balance the classes: draw the same number of reviews from each label group.
# No random_state is passed to shuffle/sample, and the order of the random
# draws is unchanged (shuffle -> sample for label 0, then for label 1, then a
# final shuffle of the combined frame).
df1 = shuffle(df[df.stars_reviews == 0]).sample(n=414937)
df2 = shuffle(df[df.stars_reviews == 1]).sample(n=414937)

# Combine sampled groups
df = shuffle(pd.concat([df1, df2]))

# Release BOTH per-class frames. Previously only df2 was deleted, which kept a
# 414,937-row copy alive for the rest of the session.
del df1, df2

df.shape

(829874, 2)

In [None]:
# Cast both columns in one pass: review text to str, labels to float32.
df = df.astype({'cleanReview': 'str', 'stars_reviews': 'float32'})

In [None]:
# Set up features and label: `cleanReview` is the model input and
# `stars_reviews` is the target.
features = df['cleanReview']
labels = df['stars_reviews']

In [None]:
# Load pandas df to tf: build a tf.data.Dataset of (feature, label) pairs.
# NOTE: this rebinds `df` from the pandas DataFrame to a tf.data.Dataset; the
# DataFrame is no longer reachable under this name after the cell runs.
df = tf.data.Dataset.from_tensor_slices((features, labels))

In [None]:
# Define components for partitioning data
# Total number of elements in the dataset.
df_size = df.cardinality().numpy()
# 80% / 10% / 10% split; int() truncates, so a few elements may be left over
# beyond train_size + val_size + test_size.
train_size = int(0.8 * df_size)
val_size = int(0.10 * df_size)
test_size = int(0.10 * df_size)
# Batch size applied to every split when it is built.
BATCH_SIZE = 32

In [None]:
# Prepare train/validation/test sets.
# Shuffle once with a fixed order (reshuffle_each_iteration=False) so the
# take/skip partitions below select the same elements on every iteration.
# NOTE(review): the 800_000 buffer is smaller than the 829,874 rows reported
# for the balanced frame, so this is not a full uniform shuffle - confirm
# whether that is intended.
df = df.shuffle(800_000, seed=42, reshuffle_each_iteration=False)
train = df.take(train_size).batch(BATCH_SIZE)

# Everything after the training slice is held out. Test is the first
# `test_size` held-out elements; validation is whatever follows them.
# The skip uses `test_size` (what test actually consumes). The previous
# `skip(val_size)` was only correct because val_size == test_size, and would
# have made the two splits overlap or leave a gap otherwise.
holdout = df.skip(train_size)
test = holdout.take(test_size).batch(BATCH_SIZE)
val = holdout.skip(test_size).batch(BATCH_SIZE)

print('Train data split:', len(train))
print('Eval data split', len(val))
print('Test data split', len(test))

Train data split: 20747
Eval data split 2594
Test data split 2594


# Sentiment analysis




### Prepare the data for training

Next, the reviews are tokenized and vectorized using the `tf.keras.layers.TextVectorization` layer. Tokenization refers to splitting strings into single words, or tokens. Vectorization converts the tokens into numbers as input for the neural network. Unique integer indices are created for each token by using `output_mode='int'`. `max_features` caps the size of the vocabulary (`max_tokens`), and `sequence_length` is the fixed output length (`output_sequence_length`) that every review is padded or truncated to.

In [None]:
# Vocabulary cap and fixed output length for the vectorization layer.
max_features = 50000
sequence_length = 300

# Maps each review to a length-`sequence_length` vector of integer token ids.
vectorize_layer = layers.TextVectorization(
    max_tokens=max_features,
    output_mode='int',
    output_sequence_length=sequence_length)

The preprocessing layer is fit to the training data by calling `adapt`, which makes the layer build its vocabulary: an index that maps each token string to an integer.

In [None]:
# Make a review-only dataset and then call adapt.
# The lambda drops the label so the layer only sees text, and only the
# training split is used.
train_text = train.map(lambda x, y:x)
vectorize_layer.adapt(train_text)

Now, define a function to examine how the created layer preprocesses the data:



In [None]:
def vectorize_text(cleanReview, stars_reviews):
    """Vectorize review text with `vectorize_layer`, passing the label through.

    Args:
        cleanReview: String tensor holding the review text.
        stars_reviews: Label tensor; returned unchanged.

    Returns:
        Tuple of (output of `vectorize_layer`, `stars_reviews`).
    """
    # Append a trailing axis before handing the text to the layer.
    text_column = tf.expand_dims(cleanReview, axis=-1)
    token_ids = vectorize_layer(text_column)
    return token_ids, stars_reviews

In [None]:
# Sample a batch of reviews and labels, then show the first review, its label,
# and the result of passing it through vectorize_text.
text_batch, label_batch = next(iter(train))
first_review, first_label = text_batch[0], label_batch[0]
print('Review', first_review)
print('Label', first_label)
print('Vectorized review', vectorize_text(first_review, first_label))

Review tf.Tensor(b'food terribly salted waiter personality never filled husband drink never asked everything good till stacked plate end', shape=(), dtype=string)
Label tf.Tensor(0.0, shape=(), dtype=float32)
Vectorized review (<tf.Tensor: shape=(1, 300), dtype=int64, numpy=
array([[   2, 2137, 1472,  157, 2144,   26,  709,  209,   34,   26,   57,
          77,    4, 1475, 3873,  137,  257,    0,    0,    0,    0,    0,
           0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,
           0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,
           0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,
           0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,
           0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,
           0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,
           0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,
           0,    0,    0,    0,    0,    0,    0,    0,   

In [None]:
# Fetch the vocabulary once and reuse it, instead of calling get_vocabulary()
# separately for each lookup and again for the size.
vocab = vectorize_layer.get_vocabulary()
print('12870 ---> ', vocab[12870])
print(' 3130 ---> ', vocab[3130])
print('Vocabulary size: {}'.format(len(vocab)))

12870 --->  refers
 3130 --->  aged
Vocabulary size: 50000


Then, apply the `TextVectorization` layer to the train, validation, and test sets.

In [None]:
# Vectorize every split with the same function, in train/val/test order.
train_ds, val_ds, test_ds = (
    split.map(vectorize_text) for split in (train, val, test)
)

Configure the dataset for performance by using `.cache()` and `.prefetch()`.




In [None]:
AUTOTUNE = tf.data.AUTOTUNE

# Apply cache() followed by prefetch() to each split in turn.
train_ds, val_ds, test_ds = (
    split.cache().prefetch(buffer_size=AUTOTUNE)
    for split in (train_ds, val_ds, test_ds)
)

# Hyperparameter Tuning

In [None]:
# Set path for results: switch the working directory to the Models folder on
# the mounted Drive.
%cd /content/drive/MyDrive/Yelp_Reviews/DL/BoW/ReviewStars/Models/

/content/drive/MyDrive/Yelp_Reviews/DL/BoW/ReviewStars/Models


In [None]:
# Set up Weights & Biases: authenticate this runtime.
# The captured output shows an interactive prompt for the API key.
wandb.login()

<IPython.core.display.Javascript object>

[34m[1mwandb[0m: Logging into wandb.ai. (Learn how to deploy a W&B server locally: https://wandb.me/wandb-server)
[34m[1mwandb[0m: You can find your API key in your browser here: https://wandb.ai/authorize
wandb: Paste an API key from your profile and hit enter, or press ctrl+c to quit: 

··········


[34m[1mwandb[0m: Appending key for api.wandb.ai to your netrc file: /root/.netrc


True

In [None]:
# Configure the sweep
# NOTE(review): an exhaustive grid over the values below is
# 3 * 4 * 3 * 4 * 3 * 7 * 4 = 12,096 runs - confirm this is intended.
sweep_config = {
    'method': 'grid',
    'metric': {
        # Must name a key the runs actually log. The run summaries report
        # `binary_accuracy` / `val_binary_accuracy`; `BinaryAccuracy` matched
        # neither.
        'name': 'val_binary_accuracy',
        'goal': 'maximize'
    },
    'parameters': {
        'epochs': {
            'values': [3, 5, 7]
        },
        'batch_size': {
            'values': [8, 4, 2, 1]
        },
        'embedding_dim': {
            'values': [128, 64, 32]
        },
        'dropout': {
            'values': [0.2, 0.3, 0.4, 0.5]
        },
        'weight_decay': {
            'values': [0.0005, 0.005, 0.05]
        },
        'learning_rate': {
            'values': [0.00001, 0.00005, 0.0001, 0.0005, 0.001, 0.005, 0.01]
        },
        'optimizer': {
            'values': ['adam', 'nadam', 'sgd', 'rmsprop']
        },
    }
}

## 2. Initialize the Sweep

In [None]:
# Initialize a new sweep from `sweep_config` under the given entity/project;
# the returned id is what the agent is started with.
sweep_id = wandb.sweep(sweep_config, entity='aschultz',
                       project='tf_textclass_reviewstars_grid')

Create sweep with ID: 20z3bhbj
Sweep URL: https://wandb.ai/aschultz/tf_textclass_reviewstars_grid/sweeps/20z3bhbj


### Define Neural Network


In [None]:
# The sweep calls this function with each set of hyperparameters
def train():
    """Train and log one sweep run; passed to the W&B agent as its run function.

    Reads hyperparameters from ``wandb.config`` (falling back to
    ``config_defaults``), builds an Embedding -> Dropout ->
    GlobalAveragePooling1D -> Dropout -> Dense(1) model whose single output is
    a logit, and fits it on the notebook-level ``train_ds`` / ``val_ds``
    datasets with W&B logging.

    Raises:
        ValueError: If ``config.optimizer`` is not 'sgd', 'rmsprop', 'adam'
            or 'nadam'.

    NOTE(review): defining ``train`` rebinds the notebook-level name ``train``,
    which previously held the batched training dataset.
    NOTE(review): ``weight_decay`` is swept and has a default, but nothing in
    this function consumes it - decide whether to wire it in or drop it.
    """
    # Default values for hyperparameters
    config_defaults = {
        'epochs': 5,
        'batch_size': 8,
        'weight_decay': 0.0005,
        'learning_rate': 0.01,
        'optimizer': 'adam',
        'embedding_dim': 32,
        'dropout': 0.5,
        'momentum': 0.9,
        'seed': 42
    }

    # Initialize a new wandb run
    wandb.init(config=config_defaults)

    # Config hyperparameters and inputs
    config = wandb.config

    # Apply the configured seed (it was declared above but never used).
    tf.random.set_seed(config.seed)

    # `train_ds` is already batched, and `fit` does not apply `batch_size` to
    # tf.data inputs, so re-batch here to make the swept batch size effective.
    train_batches = (train_ds.unbatch()
                     .batch(config.batch_size)
                     .prefetch(tf.data.AUTOTUNE))

    # Define the model architecture
    model = tf.keras.Sequential()
    model.add(tf.keras.layers.Embedding(max_features + 1, config.embedding_dim))
    model.add(tf.keras.layers.Dropout(config.dropout))
    model.add(tf.keras.layers.GlobalAveragePooling1D())
    model.add(tf.keras.layers.Dropout(config.dropout))
    # No activation: the output is a logit (see from_logits / threshold below).
    model.add(tf.keras.layers.Dense(1))

    # Define the optimizer
    if config.optimizer == 'sgd':
        optimizer = SGD(learning_rate=config.learning_rate, decay=1e-5,
                        momentum=config.momentum, nesterov=True)
    elif config.optimizer == 'rmsprop':
        optimizer = RMSprop(learning_rate=config.learning_rate, decay=1e-5)
    elif config.optimizer == 'adam':
        optimizer = Adam(learning_rate=config.learning_rate, beta_1=0.9,
                         beta_2=0.999, clipnorm=1.0)
    elif config.optimizer == 'nadam':
        optimizer = Nadam(learning_rate=config.learning_rate, beta_1=0.9,
                          beta_2=0.999, clipnorm=1.0)
    else:
        # Fail with a clear message instead of an unbound `optimizer` below.
        raise ValueError('Unsupported optimizer: {!r}'.format(config.optimizer))

    # Define loss and metrics. The model emits logits, so the accuracy
    # threshold is 0.0 rather than 0.5.
    model.compile(loss=losses.BinaryCrossentropy(from_logits=True),
                  optimizer=optimizer,
                  metrics=[tf.metrics.BinaryAccuracy(threshold=0.0)])

    # Fit model
    # NOTE(review): patience=10 is larger than every swept epoch count
    # (3, 5, 7), so early stopping cannot trigger in this sweep.
    model.fit(train_batches,
              epochs=config.epochs,
              validation_data=val_ds,
              callbacks=[WandbCallback(data_type='text', validation_data=val_ds),
                         EarlyStopping(patience=10,
                                       restore_best_weights=True)])

## 3. Run the sweep agent

In [None]:
# Run sweep for HPO: start an agent for `sweep_id` that uses `train` as its
# run function. No `count` is passed here.
wandb.agent(sweep_id, train)

[34m[1mwandb[0m: Agent Starting Run: 6c6u8vd3 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005
[34m[1mwandb[0m: Currently logged in as: [33maschultz[0m. Use [1m`wandb login --relogin`[0m to force relogin




Instructions for updating:
Use `tf.compat.v1.graph_util.tensor_shape_from_node_def_name`
Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▅█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.50283
binary_accuracy,0.80234
epoch,2.0
loss,0.542
val_binary_accuracy,0.82843
val_loss,0.50283


[34m[1mwandb[0m: Agent Starting Run: i9xhe98k with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▅█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.50435
binary_accuracy,0.80076
epoch,2.0
loss,0.54344
val_binary_accuracy,0.82711
val_loss,0.50435


[34m[1mwandb[0m: Agent Starting Run: 3xfuqz68 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▅█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.50446
binary_accuracy,0.80127
epoch,2.0
loss,0.54335
val_binary_accuracy,0.82753
val_loss,0.50446


[34m[1mwandb[0m: Agent Starting Run: a6eqk3lq with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▅█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.54096
binary_accuracy,0.77137
epoch,2.0
loss,0.57233
val_binary_accuracy,0.79281
val_loss,0.54096


[34m[1mwandb[0m: Agent Starting Run: 6moge6ny with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▅█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.54064
binary_accuracy,0.77161
epoch,2.0
loss,0.57208
val_binary_accuracy,0.7927
val_loss,0.54064


[34m[1mwandb[0m: Agent Starting Run: a792qmp1 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▅█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.54081
binary_accuracy,0.77112
epoch,2.0
loss,0.5724
val_binary_accuracy,0.79266
val_loss,0.54081


[34m[1mwandb[0m: Agent Starting Run: d0n7f70r with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▅█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.69253
binary_accuracy,0.5062
epoch,2.0
loss,0.69259
val_binary_accuracy,0.50378
val_loss,0.69253


[34m[1mwandb[0m: Agent Starting Run: oys59qkz with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='0.001 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=3.03540…

0,1
binary_accuracy,▁▅█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▅█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.69199
binary_accuracy,0.51525
epoch,2.0
loss,0.69204
val_binary_accuracy,0.51176
val_loss,0.69199


[34m[1mwandb[0m: Agent Starting Run: d5h08nwu with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▄█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.69234
binary_accuracy,0.50985
epoch,2.0
loss,0.69237
val_binary_accuracy,0.50675
val_loss,0.69234


[34m[1mwandb[0m: Agent Starting Run: 0q7x8wgl with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▅█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.57297
binary_accuracy,0.76068
epoch,2.0
loss,0.59493
val_binary_accuracy,0.77555
val_loss,0.57297


[34m[1mwandb[0m: Agent Starting Run: rmwohpmd with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▅█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.57353
binary_accuracy,0.75881
epoch,2.0
loss,0.59557
val_binary_accuracy,0.77376
val_loss,0.57353


[34m[1mwandb[0m: Agent Starting Run: yyza159d with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▅█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.57176
binary_accuracy,0.76024
epoch,2.0
loss,0.59387
val_binary_accuracy,0.77521
val_loss,0.57176


[34m[1mwandb[0m: Agent Starting Run: bk58aaq1 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.15148
binary_accuracy,0.94847
epoch,2.0
loss,0.16624
val_binary_accuracy,0.95084
val_loss,0.15148


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 9qepk9ri with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.1522
binary_accuracy,0.94815
epoch,2.0
loss,0.16731
val_binary_accuracy,0.95069
val_loss,0.1522


[34m[1mwandb[0m: Agent Starting Run: 671fwmbv with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.15165
binary_accuracy,0.9484
epoch,2.0
loss,0.16648
val_binary_accuracy,0.95093
val_loss,0.15165


[34m[1mwandb[0m: Agent Starting Run: nypohtzg with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.18615
binary_accuracy,0.93396
epoch,2.0
loss,0.20426
val_binary_accuracy,0.93714
val_loss,0.18615


[34m[1mwandb[0m: Agent Starting Run: ul7v9im8 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.18599
binary_accuracy,0.93389
epoch,2.0
loss,0.20386
val_binary_accuracy,0.93729
val_loss,0.18599


[34m[1mwandb[0m: Agent Starting Run: 84rkwt9r with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.18668
binary_accuracy,0.9337
epoch,2.0
loss,0.20509
val_binary_accuracy,0.93709
val_loss,0.18668


[34m[1mwandb[0m: Agent Starting Run: qxozpuql with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▅█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.68976
binary_accuracy,0.54438
epoch,2.0
loss,0.69017
val_binary_accuracy,0.54692
val_loss,0.68976


[34m[1mwandb[0m: Agent Starting Run: o4k7ele7 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▆█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.68913
binary_accuracy,0.55106
epoch,2.0
loss,0.68951
val_binary_accuracy,0.5529
val_loss,0.68913


[34m[1mwandb[0m: Agent Starting Run: 0t5s07vr with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▅█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.68962
binary_accuracy,0.54613
epoch,2.0
loss,0.69002
val_binary_accuracy,0.54837
val_loss,0.68962


[34m[1mwandb[0m: Agent Starting Run: qs16csae with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.18692
binary_accuracy,0.93751
epoch,2.0
loss,0.20682
val_binary_accuracy,0.94109
val_loss,0.18692


[34m[1mwandb[0m: Agent Starting Run: n87bpxki with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.18801
binary_accuracy,0.93727
epoch,2.0
loss,0.20824
val_binary_accuracy,0.9408
val_loss,0.18801


[34m[1mwandb[0m: Agent Starting Run: b7gd096x with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.18812
binary_accuracy,0.93723
epoch,2.0
loss,0.20839
val_binary_accuracy,0.94083
val_loss,0.18812


[34m[1mwandb[0m: Agent Starting Run: jpu9yf2i with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.12332
binary_accuracy,0.95795
epoch,2.0
loss,0.12606
val_binary_accuracy,0.95899
val_loss,0.12332


[34m[1mwandb[0m: Agent Starting Run: l6tysz1e with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.1234
binary_accuracy,0.95791
epoch,2.0
loss,0.1262
val_binary_accuracy,0.95901
val_loss,0.1234


[34m[1mwandb[0m: Agent Starting Run: f071mlna with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.12321
binary_accuracy,0.95802
epoch,2.0
loss,0.12591
val_binary_accuracy,0.95914
val_loss,0.12321


[34m[1mwandb[0m: Agent Starting Run: ok5qiz3x with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.147
binary_accuracy,0.94724
epoch,2.0
loss,0.15325
val_binary_accuracy,0.9494
val_loss,0.147


[34m[1mwandb[0m: Agent Starting Run: wgrn4sye with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.14636
binary_accuracy,0.9476
epoch,2.0
loss,0.15246
val_binary_accuracy,0.94958
val_loss,0.14636


[34m[1mwandb[0m: Agent Starting Run: mx2ibxt9 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.14656
binary_accuracy,0.94754
epoch,2.0
loss,0.15265
val_binary_accuracy,0.94949
val_loss,0.14656


[34m[1mwandb[0m: Agent Starting Run: rp0lhp3j with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▆█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.68687
binary_accuracy,0.56313
epoch,2.0
loss,0.68756
val_binary_accuracy,0.5669
val_loss,0.68687


[34m[1mwandb[0m: Agent Starting Run: ssdcqtph with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▆█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.68671
binary_accuracy,0.56278
epoch,2.0
loss,0.68742
val_binary_accuracy,0.5667
val_loss,0.68671


[34m[1mwandb[0m: Agent Starting Run: rrqqutvg with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▆█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.68682
binary_accuracy,0.56258
epoch,2.0
loss,0.68755
val_binary_accuracy,0.56672
val_loss,0.68682


[34m[1mwandb[0m: Agent Starting Run: o78kanmb with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.14437
binary_accuracy,0.9495
epoch,2.0
loss,0.14918
val_binary_accuracy,0.95119
val_loss,0.14437


[34m[1mwandb[0m: Agent Starting Run: mpv2m2a9 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.14479
binary_accuracy,0.9493
epoch,2.0
loss,0.14971
val_binary_accuracy,0.95099
val_loss,0.14479


[34m[1mwandb[0m: Agent Starting Run: xyuqarq0 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.14448
binary_accuracy,0.94944
epoch,2.0
loss,0.14931
val_binary_accuracy,0.95114
val_loss,0.14448


[34m[1mwandb[0m: Agent Starting Run: z0t3wlo3 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▇█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.10786
binary_accuracy,0.96624
epoch,2.0
loss,0.10089
val_binary_accuracy,0.96457
val_loss,0.10786


[34m[1mwandb[0m: Agent Starting Run: ugcvgkc7 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▇█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.10783
binary_accuracy,0.96623
epoch,2.0
loss,0.10088
val_binary_accuracy,0.96459
val_loss,0.10783


[34m[1mwandb[0m: Agent Starting Run: cn0lqqcw with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▇█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.10777
binary_accuracy,0.96627
epoch,2.0
loss,0.1008
val_binary_accuracy,0.96456
val_loss,0.10777


[34m[1mwandb[0m: Agent Starting Run: zkwwn3uc with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.11468
binary_accuracy,0.96187
epoch,2.0
loss,0.11292
val_binary_accuracy,0.96243
val_loss,0.11468


[34m[1mwandb[0m: Agent Starting Run: 85c6o6cc with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.11462
binary_accuracy,0.96199
epoch,2.0
loss,0.11284
val_binary_accuracy,0.96249
val_loss,0.11462


[34m[1mwandb[0m: Agent Starting Run: vu86fx6q with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.11462
binary_accuracy,0.9619
epoch,2.0
loss,0.11286
val_binary_accuracy,0.96252
val_loss,0.11462


[34m[1mwandb[0m: Agent Starting Run: z8nyvihc with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='41.041 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.8400…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.67744
binary_accuracy,0.57759
epoch,2.0
loss,0.67878
val_binary_accuracy,0.58117
val_loss,0.67744


[34m[1mwandb[0m: Agent Starting Run: rkzasqt9 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='20.845 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.4266…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.6774
binary_accuracy,0.57851
epoch,2.0
loss,0.67869
val_binary_accuracy,0.58108
val_loss,0.6774


[34m[1mwandb[0m: Agent Starting Run: t20pdwli with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▅█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.67724
binary_accuracy,0.57837
epoch,2.0
loss,0.67858
val_binary_accuracy,0.58132
val_loss,0.67724


[34m[1mwandb[0m: Agent Starting Run: 5t11gqo8 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.12162
binary_accuracy,0.96005
epoch,2.0
loss,0.12074
val_binary_accuracy,0.95992
val_loss,0.12162


[34m[1mwandb[0m: Agent Starting Run: h53ihgit with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.12169
binary_accuracy,0.95998
epoch,2.0
loss,0.12079
val_binary_accuracy,0.95991
val_loss,0.12169


[34m[1mwandb[0m: Agent Starting Run: n1qaplm5 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.12165
binary_accuracy,0.96007
epoch,2.0
loss,0.12079
val_binary_accuracy,0.95986
val_loss,0.12165


[34m[1mwandb[0m: Agent Starting Run: bhf4f0kj with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▅█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.10669
binary_accuracy,0.96694
epoch,2.0
loss,0.09873
val_binary_accuracy,0.96548
val_loss,0.10669


[34m[1mwandb[0m: Agent Starting Run: jipfz2r9 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='46.955 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.6408…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▅█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.10667
binary_accuracy,0.96691
epoch,2.0
loss,0.09874
val_binary_accuracy,0.96549
val_loss,0.10667


[34m[1mwandb[0m: Agent Starting Run: dc8kskdz with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▅█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.10665
binary_accuracy,0.96692
epoch,2.0
loss,0.09869
val_binary_accuracy,0.96555
val_loss,0.10665


[34m[1mwandb[0m: Agent Starting Run: j969as6c with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▅█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.11049
binary_accuracy,0.96383
epoch,2.0
loss,0.10755
val_binary_accuracy,0.96372
val_loss,0.11049


[34m[1mwandb[0m: Agent Starting Run: idlhcgzv with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▅█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.11038
binary_accuracy,0.96383
epoch,2.0
loss,0.10745
val_binary_accuracy,0.96368
val_loss,0.11038


[34m[1mwandb[0m: Agent Starting Run: 4dewwgoi with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▅█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.11045
binary_accuracy,0.96385
epoch,2.0
loss,0.10756
val_binary_accuracy,0.96371
val_loss,0.11045


[34m[1mwandb[0m: Agent Starting Run: 61sire1q with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.67491
binary_accuracy,0.58151
epoch,2.0
loss,0.67632
val_binary_accuracy,0.58484
val_loss,0.67491


[34m[1mwandb[0m: Agent Starting Run: bmf2170c with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.67496
binary_accuracy,0.58158
epoch,2.0
loss,0.67632
val_binary_accuracy,0.58466
val_loss,0.67496


[34m[1mwandb[0m: Agent Starting Run: uuqi1fji with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='21.205 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.4340…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.67496
binary_accuracy,0.58165
epoch,2.0
loss,0.67629
val_binary_accuracy,0.58482
val_loss,0.67496


[34m[1mwandb[0m: Agent Starting Run: uzaxbs8m with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.11962
binary_accuracy,0.96086
epoch,2.0
loss,0.11845
val_binary_accuracy,0.96063
val_loss,0.11962


[34m[1mwandb[0m: Agent Starting Run: gdedzykj with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.11957
binary_accuracy,0.96085
epoch,2.0
loss,0.11842
val_binary_accuracy,0.96069
val_loss,0.11957


[34m[1mwandb[0m: Agent Starting Run: 6c0dpp2t with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.11961
binary_accuracy,0.96086
epoch,2.0
loss,0.11844
val_binary_accuracy,0.96064
val_loss,0.11961


[34m[1mwandb[0m: Agent Starting Run: ub61b9y9 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▂█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.10709
binary_accuracy,0.96628
epoch,2.0
loss,0.10003
val_binary_accuracy,0.96537
val_loss,0.10709


[34m[1mwandb[0m: Agent Starting Run: 5f05p9f5 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▂█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.10709
binary_accuracy,0.96634
epoch,2.0
loss,0.10002
val_binary_accuracy,0.96526
val_loss,0.10709


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: whd0u4hk with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▁█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.10707
binary_accuracy,0.96626
epoch,2.0
loss,0.10002
val_binary_accuracy,0.96536
val_loss,0.10707


[34m[1mwandb[0m: Agent Starting Run: wzq6krcw with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3