# Text classification using Tensorflow: Sentiment on Reviews
# Hyperparameter Tuning

This notebook trains a binary sentiment classifier that labels restaurant food reviews as *negative* or *positive* based on the review text. The target labels come from a sentiment score that was calculated previously.


In [None]:
# Mount Google Drive (Colab only) so the paths under /content/drive used by
# the later %cd cells are reachable.
from google.colab import drive 
drive.mount('/content/drive')

Mounted at /content/drive


In [None]:
!pip install --upgrade -q wandb
import wandb
from wandb.keras import WandbCallback
import os
import random
import numpy as np
import pandas as pd
import shutil
import time
import datetime
from datetime import datetime, timedelta
from timeit import default_timer as timer
import pickle
import joblib
from sklearn.utils import shuffle
import tensorflow as tf
from tensorflow.keras import layers
from tensorflow.keras import losses
from tensorboard.plugins.hparams import api as hp
from tensorflow.keras.callbacks import ReduceLROnPlateau, ModelCheckpoint, Callback, EarlyStopping
from tensorflow.keras.optimizers import Adam, RMSprop, SGD, Nadam
import matplotlib
import matplotlib.pyplot as plt
import tqdm
from tensorflow import keras
from keras.utils import np_utils

[K     |████████████████████████████████| 1.8 MB 8.1 MB/s 
[K     |████████████████████████████████| 181 kB 98.6 MB/s 
[K     |████████████████████████████████| 145 kB 47.3 MB/s 
[K     |████████████████████████████████| 63 kB 2.2 MB/s 
[?25h  Building wheel for pathtools (setup.py) ... [?25l[?25hdone


In [None]:
# Report the CUDA compiler version and the GPU attached to this runtime.
# These are shell commands; the nvcc path assumes CUDA lives under /usr/local/cuda.
print('CUDA and NVIDIA GPU Information')
!/usr/local/cuda/bin/nvcc --version
!nvidia-smi

# Report the TensorFlow/Keras versions, whether eager execution is on, and
# how many GPUs TensorFlow itself can see.
print('\n')
print('TensorFlow version: {}'.format(tf.__version__))
print('Eager execution is: {}'.format(tf.executing_eagerly()))
print('Keras version: {}'.format(tf.keras.__version__))
print('Num GPUs Available: ', len(tf.config.list_physical_devices('GPU')))

CUDA and NVIDIA GPU Information
nvcc: NVIDIA (R) Cuda compiler driver
Copyright (c) 2005-2020 NVIDIA Corporation
Built on Mon_Oct_12_20:09:46_PDT_2020
Cuda compilation tools, release 11.1, V11.1.105
Build cuda_11.1.TC455_06.29190527_0
Wed Jul  6 02:17:55 2022       
+-----------------------------------------------------------------------------+
| NVIDIA-SMI 460.32.03    Driver Version: 460.32.03    CUDA Version: 11.2     |
|-------------------------------+----------------------+----------------------+
| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |
| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |
|                               |                      |               MIG M. |
|   0  Tesla P100-PCIE...  Off  | 00000000:00:04.0 Off |                    0 |
| N/A   37C    P0    27W / 250W |      0MiB / 16280MiB |      0%      Default |
|                               |                      |                  N/A |
+------------

In [None]:
# Reproducibility in TF 
def init_seeds(seed=42):
    """Seed the Python, NumPy and TensorFlow RNGs and request deterministic ops.

    Args:
        seed: Integer seed applied to `random`, `numpy.random` and
            `tf.random`.

    Returns:
        The `tf.compat.v1.Session` created here, configured with one
        intra-op and one inter-op thread and registered as the Keras
        backend session.
    """
    # Request deterministic cuDNN / TensorFlow kernels via environment flags.
    os.environ['TF_CUDNN_DETERMINISTIC'] = 'true'
    os.environ['TF_DETERMINISTIC_OPS'] = 'true'

    random.seed(seed)
    np.random.seed(seed)
    tf.random.set_seed(seed)

    # Restrict op scheduling to a single thread for both intra- and inter-op
    # parallelism.
    # NOTE(review): this only configures the compat.v1 session built below;
    # confirm it has the intended effect when the model runs eagerly.
    session_conf = tf.compat.v1.ConfigProto(intra_op_parallelism_threads=1,
                                            inter_op_parallelism_threads=1)
    sess = tf.compat.v1.Session(graph=tf.compat.v1.get_default_graph(),
                                config=session_conf)
    tf.compat.v1.keras.backend.set_session(sess)
    return sess

In [None]:
# Seed every RNG once, before the data is shuffled or any model is built.
init_seeds(seed=42)

<tensorflow.python.client.session.Session at 0x7fe6538c8e50>

In [None]:
# Switch to the Drive folder that holds the input data; the parquet file read
# in the next cell is resolved relative to this directory.
%cd /content/drive/MyDrive/Yelp_Reviews/Data/

/content/drive/MyDrive/Yelp_Reviews/Data


In [None]:
# Read the tokenized reviews with their sentiment labels and star ratings.
# The file name is relative to the current working directory.
df = pd.read_parquet('YelpReviews_NLP_sentimentNegPos_tokenized.parquet')
print('Number of rows and columns:', df.shape)
df.head()

Number of rows and columns: (829874, 3)


Unnamed: 0_level_0,cleanReview,sentiment,stars_reviews
index,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
1,"[order, chicken, finger, sub, honey, mustard, ...",Negative,3.0
3,"[dedicated, loving, memory, gary, feldman, gre...",Negative,5.0
12,"[absolutely, horrible, thought, would, order, ...",Negative,1.0
15,"[found, better, chicken, finger, know, inside,...",Negative,4.0
20,"[amazing, everything, tried, disappoint, chick...",Negative,5.0


In [None]:
# Count every (star rating, sentiment label) combination to see how often the
# star rating and the sentiment polarity agree or disagree.
print(df[['stars_reviews', 'sentiment']].value_counts())

stars_reviews  sentiment
5.0            Positive     278011
1.0            Negative     231245
4.0            Positive     104585
2.0            Negative      90320
3.0            Negative      44097
4.0            Negative      26276
5.0            Negative      22999
3.0            Positive      22096
2.0            Positive       6690
1.0            Positive       3555
dtype: int64


In [None]:
# Join each review's token list into one space-separated string.
def _tokens_to_text(tokens):
    """Return the tokens of one review as a single space-separated string.

    A value that is already a string is passed through instead of being
    iterated character by character, so re-running this cell does not corrupt
    reviews that were joined on a previous run. Any comma left in the text is
    replaced by a space, as before.
    """
    text = tokens if isinstance(tokens, str) else ' '.join(map(str, tokens))
    return text.replace(',', ' ')


df = df.copy()
df['cleanReview'] = df['cleanReview'].apply(_tokens_to_text)
df.head()

Unnamed: 0_level_0,cleanReview,sentiment,stars_reviews
index,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
1,order chicken finger sub honey mustard sauce p...,Negative,3.0
3,dedicated loving memory gary feldman greatest ...,Negative,5.0
12,absolutely horrible thought would order place ...,Negative,1.0
15,found better chicken finger know inside crisp ...,Negative,4.0
20,amazing everything tried disappoint chicken ca...,Negative,5.0


In [None]:
# Recode the sentiment labels to binary: Negative -> 0, Positive -> 1.
SENTIMENT_CODES = {'Negative': 0, 'Positive': 1}

df = df.copy()
# Assign the recoded column back explicitly instead of using a chained
# `inplace=True` on a column selection, which does not update `df` when pandas
# copy-on-write is active. Values that are not a known label (including labels
# already recoded by an earlier run of this cell) are left unchanged.
df['sentiment'] = df['sentiment'].map(
    lambda label: SENTIMENT_CODES.get(label, label))

print('Number of reviews per group:')
df[['sentiment']].value_counts()

Number of reviews per group:


sentiment
0            414937
1            414937
dtype: int64

In [None]:
# Drop the star rating and shuffle the rows.
# errors='ignore' keeps the cell re-runnable once the column is already gone;
# random_state pins the permutation so it does not depend on how much of the
# global NumPy RNG stream earlier cells have consumed.
df = df.drop(columns=['stars_reviews'], errors='ignore')
df = shuffle(df, random_state=42)
df.shape

(829874, 2)

In [None]:
# Cast the review text to str and the label to float32 in one pass;
# `astype` returns a new frame, so the previous one is not modified.
df = df.astype({'cleanReview': 'str', 'sentiment': 'float32'})

In [None]:
# Split the frame into model input (review text) and target (binary label).
features, labels = df['cleanReview'], df['sentiment']

In [None]:
# Build a tf.data.Dataset of (review text, label) pairs from the pandas columns.
# NOTE: from here on `df` is rebound to the tf.data.Dataset and no longer
# refers to the pandas DataFrame.
df = tf.data.Dataset.from_tensor_slices((features, labels))

In [None]:
# Define components for partitioning data: 80% train, 10% validation, 10% test
BATCH_SIZE = 32
df_size = df.cardinality().numpy()
train_size, val_size, test_size = (
    int(fraction * df_size) for fraction in (0.8, 0.10, 0.10)
)

In [None]:
# Prepare train/validation/test sets.
# The shuffle uses a fixed seed and reshuffle_each_iteration=False so the
# element order stays the same on every pass; the take/skip slicing below
# relies on that.
df = df.shuffle(800_000, seed=42, reshuffle_each_iteration=False)

# Everything after the training slice is held out for evaluation.
holdout = df.skip(train_size)

train = df.take(train_size).batch(BATCH_SIZE)
# Validation is whatever remains of the holdout after its first `val_size`
# elements; test is the first `test_size` elements of the holdout.
val = holdout.skip(val_size).batch(BATCH_SIZE)
test = holdout.take(test_size).batch(BATCH_SIZE)

print('Train data split:', len(train))
print('Eval data split', len(val))
print('Test data split', len(test))

Train data split: 20747
Eval data split 2594
Test data split 2594


# Sentiment analysis




### Prepare the data for training

Next, the reviews are tokenized and vectorized using the `tf.keras.layers.TextVectorization` layer. Tokenization refers to splitting strings into single words, or tokens. Vectorization converts the tokens into numbers as input for the neural network. Unique integer indices are created for each token by using `output_mode` = `int`. `max_features` caps the size of the vocabulary, and `sequence_length` sets the fixed length to which every vectorized review is padded or truncated.

In [None]:
# Vocabulary cap (passed as max_tokens) and fixed output length in tokens
# (passed as output_sequence_length) for every vectorized review.
max_features = 50000
sequence_length = 300

# output_mode='int' makes the layer emit one integer index per token.
vectorize_layer = layers.TextVectorization(
    max_tokens=max_features,
    output_mode='int',
    output_sequence_length=sequence_length)

The preprocessing layer is fit by calling `adapt` on the training text only, which makes the layer build an index that maps strings to integers.

In [None]:
# Build a text-only view of the training set (labels dropped) and fit the
# vectorization layer's vocabulary on it.
train_text = train.map(lambda review, _label: review)
vectorize_layer.adapt(train_text)

Now, define a function to examine how the created layer preprocesses the data:



In [None]:
def vectorize_text(cleanReview, sentiment):
  """Vectorize review text with `vectorize_layer`, passing the label through.

  Args:
    cleanReview: String tensor holding the review text.
    sentiment: Label tensor, returned unchanged.

  Returns:
    A `(token_ids, sentiment)` tuple, where `token_ids` is the output of
    `vectorize_layer` for the text with a trailing axis added.
  """
  expanded = tf.expand_dims(cleanReview, axis=-1)
  token_ids = vectorize_layer(expanded)
  return token_ids, sentiment

In [None]:
# Pull one batch of reviews and labels and inspect its first example,
# both as raw text and after vectorization.
text_batch, label_batch = next(iter(train))
first_review = text_batch[0]
first_label = label_batch[0]
vectorized_example = vectorize_text(first_review, first_label)

print('Review', first_review)
print('Label', first_label)
print('Vectorized review', vectorized_example)

Review tf.Tensor(b'waste time still business yet competition dripping springs area ordered delivery dozen time food usually okay delivery service horrible tried order three different occasion delivery told delivery driver called sick tonight placed order people told hour hour fifteen minute called hour minute later informed delivery driver leave work call replacement two hour later still food called back two people working friendly gm always mia wait another chinese place come town put business delivery fee also outrageous type service', shape=(), dtype=string)
Label tf.Tensor(0.0, shape=(), dtype=float32)
Vectorized review (<tf.Tensor: shape=(1, 300), dtype=int64, numpy=
array([[ 444,    7,   85,  193,  365, 2678, 2372, 2330,  123,   16,  230,
        1280,    7,    2,  288,  406,  230,    6,  122,  101,   11,  260,
         231,  936,  230,   82,  230,  789,  177,  549,  462,  616,   11,
          42,   82,   63,   63, 3115,   29,  177,   63,   29,  270, 1135,
         230,  789,  30

In [None]:
# Look up two example token ids and report the vocabulary size.
# The vocabulary list is fetched once and reused instead of being rebuilt
# for every lookup.
vocabulary = vectorize_layer.get_vocabulary()
print('12870 ---> ', vocabulary[12870])
print(' 3130 ---> ', vocabulary[3130])
print('Vocabulary size: {}'.format(len(vocabulary)))

12870 --->  spongey
 3130 --->  unsanitary
Vocabulary size: 50000


Then, apply the `TextVectorization` layer to the train, validation, and test sets.

In [None]:
# Vectorize the text of every split with the same fitted layer.
train_ds, val_ds, test_ds = (
    split.map(vectorize_text) for split in (train, val, test)
)

Configure the dataset for performance by using `.cache()` and `.prefetch()`.




In [None]:
AUTOTUNE = tf.data.AUTOTUNE

# Cache each vectorized split and prefetch it with an auto-tuned buffer.
train_ds, val_ds, test_ds = (
    split.cache().prefetch(buffer_size=AUTOTUNE)
    for split in (train_ds, val_ds, test_ds)
)

# Hyperparameter Tuning

In [None]:
# Set path for results: switch the working directory to the Drive folder for
# this experiment's models, so relative output paths resolve there.
%cd /content/drive/MyDrive/Yelp_Reviews/DL/BoW/SentimentPolarity/Models/

/content/drive/MyDrive/Yelp_Reviews/DL/BoW/SentimentPolarity/Models


In [None]:
# Authenticate with Weights & Biases; this prompts for an API key when none
# is stored yet. Never paste the key into the notebook source.
wandb.login()

<IPython.core.display.Javascript object>

[34m[1mwandb[0m: Logging into wandb.ai. (Learn how to deploy a W&B server locally: https://wandb.me/wandb-server)
[34m[1mwandb[0m: You can find your API key in your browser here: https://wandb.ai/authorize
wandb: Paste an API key from your profile and hit enter, or press ctrl+c to quit: 

··········


[34m[1mwandb[0m: Appending key for api.wandb.ai to your netrc file: /root/.netrc


True

In [None]:
# Configure the sweep.
# 'grid' tries every combination of the values below:
# 3 * 4 * 3 * 4 * 3 * 7 * 4 = 12,096 runs.
sweep_config = {
    'method': 'grid',
    'metric': {
        # The name must match a key the runs actually log. With the Keras
        # callback the logged keys are `binary_accuracy` and
        # `val_binary_accuracy`; `BinaryAccuracy` is never logged.
        'name': 'val_binary_accuracy',
        'goal': 'maximize'
    },
    'parameters': {
        'epochs': {
            'values': [3, 5, 7]
        },
        'batch_size': {
            'values': [8, 4, 2, 1]
        },
        'embedding_dim': {
            'values': [128, 64, 32]
        },
        'dropout': {
            'values': [0.2, 0.3, 0.4, 0.5]
        },
        # NOTE(review): `train()` never reads `weight_decay`, so these three
        # values only triple the number of runs without changing the model.
        # Either wire it into the model/optimizer or drop it from the grid.
        'weight_decay': {
            'values': [0.0005, 0.005, 0.05]
        },
        'learning_rate': {
            'values': [0.00001, 0.00005, 0.0001, 0.0005, 0.001, 0.005, 0.01]
        },
        'optimizer': {
            'values': ['adam', 'nadam', 'sgd', 'rmsprop']
        },
    }
}

## 2. Initialize the Sweep

In [None]:
# Initialize a new sweep: register `sweep_config` under the given W&B entity
# and project. The returned id is what `wandb.agent` is started with later.
sweep_id = wandb.sweep(sweep_config, entity='aschultz', 
                       project='tf_textclass_sentpol_grid')

Create sweep with ID: 2ld2attl
Sweep URL: https://wandb.ai/aschultz/tf_textclass_sentpol_grid/sweeps/2ld2attl


### Define Neural Network


In [None]:
# The sweep calls this function with each set of hyperparameters
def _build_optimizer(config):
    """Create the Keras optimizer selected by `config.optimizer`.

    Args:
        config: Run configuration providing `optimizer`, `learning_rate` and,
            for SGD, `momentum`.

    Returns:
        A configured `SGD`, `RMSprop`, `Adam` or `Nadam` instance.

    Raises:
        ValueError: If `config.optimizer` is not one of 'sgd', 'rmsprop',
            'adam' or 'nadam'.
    """
    name = config.optimizer
    if name == 'sgd':
        return SGD(learning_rate=config.learning_rate, decay=1e-5,
                   momentum=config.momentum, nesterov=True)
    if name == 'rmsprop':
        return RMSprop(learning_rate=config.learning_rate, decay=1e-5)
    if name == 'adam':
        return Adam(learning_rate=config.learning_rate, beta_1=0.9,
                    beta_2=0.999, clipnorm=1.0)
    if name == 'nadam':
        return Nadam(learning_rate=config.learning_rate, beta_1=0.9,
                     beta_2=0.999, clipnorm=1.0)
    # Fail with a clear message instead of an unbound `optimizer` variable.
    raise ValueError('Unsupported optimizer: {!r}'.format(name))


def train():
    """Train and log one model for the hyperparameters of the current run.

    Passed to `wandb.agent`, which calls it without arguments once per sweep
    configuration. Reads the module-level `max_features`, `train_ds` and
    `val_ds`.

    NOTE(review): this definition rebinds the module-level name `train`,
    which earlier cells use for the batched training dataset. Re-running
    those cells after this one requires re-creating that dataset first.
    """
    # Default values for hyperparameters; the sweep overrides the ones it sets.
    # NOTE(review): `weight_decay` is accepted here but not applied anywhere
    # below; wire it in or remove it from the sweep.
    config_defaults = {
        'epochs': 5,
        'batch_size': 8,
        'weight_decay': 0.0005,
        'learning_rate': 0.01,
        'optimizer': 'adam',
        'embedding_dim': 32,
        'dropout': 0.5,
        'momentum': 0.9,
        'seed': 42
    }

    # Initialize a new wandb run
    wandb.init(config=config_defaults)

    # Config hyperparameters and inputs
    config = wandb.config

    # Apply the configured seed so every run starts from the same TensorFlow
    # random state (weight initialization, dropout masks).
    tf.random.set_seed(config.seed)

    # `train_ds` is already batched, and Keras ignores `fit(batch_size=...)`
    # for tf.data inputs, so the swept batch size would otherwise never take
    # effect. Re-batch the cached dataset to the size this run asks for.
    train_batches = (train_ds
                     .unbatch()
                     .batch(config.batch_size)
                     .prefetch(tf.data.AUTOTUNE))

    # Define the model architecture: embedding -> mean pooling -> one logit
    model = tf.keras.Sequential([
        tf.keras.layers.Embedding(max_features + 1, config.embedding_dim),
        tf.keras.layers.Dropout(config.dropout),
        tf.keras.layers.GlobalAveragePooling1D(),
        tf.keras.layers.Dropout(config.dropout),
        tf.keras.layers.Dense(1),
    ])

    # Define loss and metrics. The model outputs logits, hence
    # from_logits=True and an accuracy threshold of 0.0.
    model.compile(loss=losses.BinaryCrossentropy(from_logits=True),
                  optimizer=_build_optimizer(config),
                  metrics=[tf.metrics.BinaryAccuracy(threshold=0.0)])

    # Fit model.
    # NOTE(review): with the epoch counts used in this notebook (at most 7),
    # EarlyStopping(patience=10) can never trigger; lower the patience if
    # early stopping is actually wanted.
    model.fit(train_batches,
              epochs=config.epochs,
              validation_data=val_ds,
              callbacks=[WandbCallback(data_type="text",
                                       validation_data=val_ds),
                         EarlyStopping(patience=10,
                                       restore_best_weights=True)])

## 3. Run the sweep agent

In [None]:
# Run sweep for HPO: the agent calls `train` once for every configuration it
# receives from the sweep. No `count` is passed, so the number of runs is not
# capped here.
wandb.agent(sweep_id, train)

[34m[1mwandb[0m: Agent Starting Run: ro8tqjx3 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005
[34m[1mwandb[0m: Currently logged in as: [33maschultz[0m. Use [1m`wandb login --relogin`[0m to force relogin




Instructions for updating:
Use `tf.compat.v1.graph_util.tensor_shape_from_node_def_name`
Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▅█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.45283
binary_accuracy,0.83832
epoch,2.0
loss,0.50132
val_binary_accuracy,0.86209
val_loss,0.45283


[34m[1mwandb[0m: Agent Starting Run: iks0gbm4 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▅█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.45493
binary_accuracy,0.83697
epoch,2.0
loss,0.50339
val_binary_accuracy,0.86099
val_loss,0.45493


[34m[1mwandb[0m: Agent Starting Run: v5fl7s3l with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▅█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.45502
binary_accuracy,0.83734
epoch,2.0
loss,0.5033
val_binary_accuracy,0.86128
val_loss,0.45502


[34m[1mwandb[0m: Agent Starting Run: zqcyw4io with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▆█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.49319
binary_accuracy,0.8203
epoch,2.0
loss,0.53566
val_binary_accuracy,0.84229
val_loss,0.49319


[34m[1mwandb[0m: Agent Starting Run: g2bq7ixa with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▆█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.49238
binary_accuracy,0.82052
epoch,2.0
loss,0.53489
val_binary_accuracy,0.84271
val_loss,0.49238


[34m[1mwandb[0m: Agent Starting Run: hwtboou9 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▆█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.49273
binary_accuracy,0.82025
epoch,2.0
loss,0.53555
val_binary_accuracy,0.84237
val_loss,0.49273


[34m[1mwandb[0m: Agent Starting Run: gvobexct with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▄█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.69202
binary_accuracy,0.50597
epoch,2.0
loss,0.69227
val_binary_accuracy,0.50658
val_loss,0.69202


[34m[1mwandb[0m: Agent Starting Run: kzh48oqr with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▄█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▄█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.69136
binary_accuracy,0.51428
epoch,2.0
loss,0.69163
val_binary_accuracy,0.51399
val_loss,0.69136


[34m[1mwandb[0m: Agent Starting Run: ldulejg2 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▄█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.69177
binary_accuracy,0.50879
epoch,2.0
loss,0.69204
val_binary_accuracy,0.50878
val_loss,0.69177


[34m[1mwandb[0m: Agent Starting Run: i73kf4cw with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▆█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.53664
binary_accuracy,0.80659
epoch,2.0
loss,0.56644
val_binary_accuracy,0.82231
val_loss,0.53664


[34m[1mwandb[0m: Agent Starting Run: 5inqa954 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▆█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.53703
binary_accuracy,0.80541
epoch,2.0
loss,0.56704
val_binary_accuracy,0.82114
val_loss,0.53703


[34m[1mwandb[0m: Agent Starting Run: mfyqclnx with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▆█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.53495
binary_accuracy,0.80689
epoch,2.0
loss,0.56492
val_binary_accuracy,0.82229
val_loss,0.53495


[34m[1mwandb[0m: Agent Starting Run: d4dn0buy with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.04923
binary_accuracy,0.98485
epoch,2.0
loss,0.07023
val_binary_accuracy,0.98861
val_loss,0.04923


[34m[1mwandb[0m: Agent Starting Run: s47do7k1 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.04981
binary_accuracy,0.98468
epoch,2.0
loss,0.07123
val_binary_accuracy,0.98852
val_loss,0.04981


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 6dhb7vm6 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.04934
binary_accuracy,0.98489
epoch,2.0
loss,0.07042
val_binary_accuracy,0.98861
val_loss,0.04934


[34m[1mwandb[0m: Agent Starting Run: wzvdptuk with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.06641
binary_accuracy,0.9794
epoch,2.0
loss,0.09117
val_binary_accuracy,0.98341
val_loss,0.06641


[34m[1mwandb[0m: Agent Starting Run: 86no33m3 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.06623
binary_accuracy,0.97951
epoch,2.0
loss,0.09092
val_binary_accuracy,0.98348
val_loss,0.06623


[34m[1mwandb[0m: Agent Starting Run: yvrqplph with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.06697
binary_accuracy,0.97931
epoch,2.0
loss,0.09191
val_binary_accuracy,0.98333
val_loss,0.06697


[34m[1mwandb[0m: Agent Starting Run: h8h1xsx1 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▅█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.68779
binary_accuracy,0.56194
epoch,2.0
loss,0.68861
val_binary_accuracy,0.56565
val_loss,0.68779


[34m[1mwandb[0m: Agent Starting Run: bxmdf14g with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▅█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.68711
binary_accuracy,0.57056
epoch,2.0
loss,0.68792
val_binary_accuracy,0.5737
val_loss,0.68711


[34m[1mwandb[0m: Agent Starting Run: h8tr99kg with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▅█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.68749
binary_accuracy,0.56521
epoch,2.0
loss,0.68834
val_binary_accuracy,0.56884
val_loss,0.68749


[34m[1mwandb[0m: Agent Starting Run: 2lxm21o4 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.08486
binary_accuracy,0.97522
epoch,2.0
loss,0.11141
val_binary_accuracy,0.97995
val_loss,0.08486


[34m[1mwandb[0m: Agent Starting Run: lv951x9y with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.08618
binary_accuracy,0.9749
epoch,2.0
loss,0.11326
val_binary_accuracy,0.9797
val_loss,0.08618


[34m[1mwandb[0m: Agent Starting Run: uz23ml9i with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.08609
binary_accuracy,0.97496
epoch,2.0
loss,0.11309
val_binary_accuracy,0.97967
val_loss,0.08609


[34m[1mwandb[0m: Agent Starting Run: no5edpsd with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.01805
binary_accuracy,0.99348
epoch,2.0
loss,0.02409
val_binary_accuracy,0.99476
val_loss,0.01805


[34m[1mwandb[0m: Agent Starting Run: 7yzzivh4 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.0182
binary_accuracy,0.99341
epoch,2.0
loss,0.02433
val_binary_accuracy,0.99471
val_loss,0.0182


[34m[1mwandb[0m: Agent Starting Run: 2qqpieqb with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.01801
binary_accuracy,0.99349
epoch,2.0
loss,0.02405
val_binary_accuracy,0.99476
val_loss,0.01801


[34m[1mwandb[0m: Agent Starting Run: 5cn78jcw with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.02898
binary_accuracy,0.98902
epoch,2.0
loss,0.03656
val_binary_accuracy,0.99119
val_loss,0.02898


[34m[1mwandb[0m: Agent Starting Run: 0zd1axn3 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.02866
binary_accuracy,0.98916
epoch,2.0
loss,0.03609
val_binary_accuracy,0.9913
val_loss,0.02866


[34m[1mwandb[0m: Agent Starting Run: 2s3843mn with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.02879
binary_accuracy,0.98912
epoch,2.0
loss,0.03629
val_binary_accuracy,0.99126
val_loss,0.02879


[34m[1mwandb[0m: Agent Starting Run: enu1kuwy with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▆█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.68307
binary_accuracy,0.59381
epoch,2.0
loss,0.68446
val_binary_accuracy,0.59883
val_loss,0.68307


[34m[1mwandb[0m: Agent Starting Run: qch5hz75 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▆█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.68279
binary_accuracy,0.5927
epoch,2.0
loss,0.68426
val_binary_accuracy,0.59941
val_loss,0.68279


[34m[1mwandb[0m: Agent Starting Run: ypn5lqtb with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▆█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.68291
binary_accuracy,0.59322
epoch,2.0
loss,0.68436
val_binary_accuracy,0.59894
val_loss,0.68291


[34m[1mwandb[0m: Agent Starting Run: h74j9hw5 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.03701
binary_accuracy,0.98608
epoch,2.0
loss,0.04495
val_binary_accuracy,0.98815
val_loss,0.03701


[34m[1mwandb[0m: Agent Starting Run: nr4n1tmb with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.03729
binary_accuracy,0.986
epoch,2.0
loss,0.04532
val_binary_accuracy,0.98812
val_loss,0.03729


[34m[1mwandb[0m: Agent Starting Run: aovqzxwr with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.03717
binary_accuracy,0.98611
epoch,2.0
loss,0.04516
val_binary_accuracy,0.98814
val_loss,0.03717


[34m[1mwandb[0m: Agent Starting Run: 4i1a1k08 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▇█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.00547
binary_accuracy,0.99859
epoch,2.0
loss,0.00493
val_binary_accuracy,0.99836
val_loss,0.00547


[34m[1mwandb[0m: Agent Starting Run: dmug11f0 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▇█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.00542
binary_accuracy,0.9986
epoch,2.0
loss,0.00493
val_binary_accuracy,0.99837
val_loss,0.00542


[34m[1mwandb[0m: Agent Starting Run: v5cgq5k5 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▇█
val_loss,█▂▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.00542
binary_accuracy,0.99861
epoch,2.0
loss,0.0049
val_binary_accuracy,0.99837
val_loss,0.00542


[34m[1mwandb[0m: Agent Starting Run: e6gd4efb with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.00892
binary_accuracy,0.99688
epoch,2.0
loss,0.00982
val_binary_accuracy,0.9971
val_loss,0.00892


[34m[1mwandb[0m: Agent Starting Run: 71ddtpx1 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.00881
binary_accuracy,0.9969
epoch,2.0
loss,0.00978
val_binary_accuracy,0.99714
val_loss,0.00881


[34m[1mwandb[0m: Agent Starting Run: 5oafy4qh with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.0088
binary_accuracy,0.99689
epoch,2.0
loss,0.00981
val_binary_accuracy,0.99716
val_loss,0.0088


[34m[1mwandb[0m: Agent Starting Run: so8mtu6b with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▆█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.658
binary_accuracy,0.61621
epoch,2.0
loss,0.66263
val_binary_accuracy,0.63468
val_loss,0.658


[34m[1mwandb[0m: Agent Starting Run: gi1kh2zn with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▆█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.65807
binary_accuracy,0.61573
epoch,2.0
loss,0.6626
val_binary_accuracy,0.6342
val_loss,0.65807


[34m[1mwandb[0m: Agent Starting Run: w9wubn9l with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▆█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.65768
binary_accuracy,0.61662
epoch,2.0
loss,0.66222
val_binary_accuracy,0.63462
val_loss,0.65768


[34m[1mwandb[0m: Agent Starting Run: okmvm35g with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.01283
binary_accuracy,0.99498
epoch,2.0
loss,0.01497
val_binary_accuracy,0.99553
val_loss,0.01283


[34m[1mwandb[0m: Agent Starting Run: iqj1jmop with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.01287
binary_accuracy,0.99497
epoch,2.0
loss,0.01502
val_binary_accuracy,0.99551
val_loss,0.01287


[34m[1mwandb[0m: Agent Starting Run: cc2lu6z4 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.01282
binary_accuracy,0.99497
epoch,2.0
loss,0.01498
val_binary_accuracy,0.99552
val_loss,0.01282


[34m[1mwandb[0m: Agent Starting Run: mr4h1gv2 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▃█▁
val_loss,█▁▆

0,1
GFLOPS,0.0
best_epoch,1.0
best_val_loss,0.00437
binary_accuracy,0.99886
epoch,2.0
loss,0.00387
val_binary_accuracy,0.99812
val_loss,0.00574


[34m[1mwandb[0m: Agent Starting Run: 5xjlf1e6 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁█▁
val_loss,█▁▆

0,1
GFLOPS,0.0
best_epoch,1.0
best_val_loss,0.00439
binary_accuracy,0.99886
epoch,2.0
loss,0.00388
val_binary_accuracy,0.99818
val_loss,0.00565


[34m[1mwandb[0m: Agent Starting Run: w3y341rl with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▃█▁
val_loss,█▁▆

0,1
GFLOPS,0.0
best_epoch,1.0
best_val_loss,0.0044
binary_accuracy,0.99886
epoch,2.0
loss,0.00387
val_binary_accuracy,0.99808
val_loss,0.00582


[34m[1mwandb[0m: Agent Starting Run: xbmu4wcx with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▅█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.00596
binary_accuracy,0.99768
epoch,2.0
loss,0.00727
val_binary_accuracy,0.99805
val_loss,0.00596


[34m[1mwandb[0m: Agent Starting Run: tk0doy93 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▆█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.00593
binary_accuracy,0.99767
epoch,2.0
loss,0.00724
val_binary_accuracy,0.99805
val_loss,0.00593


[34m[1mwandb[0m: Agent Starting Run: xpzr4vhs with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▆█
val_loss,█▄▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.006
binary_accuracy,0.99769
epoch,2.0
loss,0.00725
val_binary_accuracy,0.99807
val_loss,0.006


[34m[1mwandb[0m: Agent Starting Run: h2e40e4h with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▇█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.64542
binary_accuracy,0.62039
epoch,2.0
loss,0.65161
val_binary_accuracy,0.63933
val_loss,0.64542


[34m[1mwandb[0m: Agent Starting Run: y34j9dx3 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.64486
binary_accuracy,0.62097
epoch,2.0
loss,0.65101
val_binary_accuracy,0.63989
val_loss,0.64486


[34m[1mwandb[0m: Agent Starting Run: y8u3hatz with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.64485
binary_accuracy,0.62113
epoch,2.0
loss,0.65087
val_binary_accuracy,0.63997
val_loss,0.64485


[34m[1mwandb[0m: Agent Starting Run: 0ba3pcy0 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.00973
binary_accuracy,0.99621
epoch,2.0
loss,0.01168
val_binary_accuracy,0.99677
val_loss,0.00973


[34m[1mwandb[0m: Agent Starting Run: if6fm9ld with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.0097
binary_accuracy,0.99624
epoch,2.0
loss,0.01165
val_binary_accuracy,0.99679
val_loss,0.0097


[34m[1mwandb[0m: Agent Starting Run: q0svhxu9 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.00969
binary_accuracy,0.99621
epoch,2.0
loss,0.01165
val_binary_accuracy,0.99678
val_loss,0.00969


[34m[1mwandb[0m: Agent Starting Run: 6w9v7938 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▂█▁
val_loss,▆▁█

0,1
GFLOPS,0.0
best_epoch,1.0
best_val_loss,0.00402
binary_accuracy,0.99843
epoch,2.0
loss,0.00491
val_binary_accuracy,0.98446
val_loss,0.04396


[34m[1mwandb[0m: Agent Starting Run: l1p7q2wz with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▅█▁
val_loss,▄▁█

0,1
GFLOPS,0.0
best_epoch,1.0
best_val_loss,0.00788
binary_accuracy,0.99845
epoch,2.0
loss,0.00486
val_binary_accuracy,0.97976
val_loss,0.06145


[34m[1mwandb[0m: Agent Starting Run: 8rdrohws with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▃█▁
val_loss,▆▁█

0,1
GFLOPS,0.0
best_epoch,1.0
best_val_loss,0.00515
binary_accuracy,0.99844
epoch,2.0
loss,0.00488
val_binary_accuracy,0.98502
val_loss,0.04182


[34m[1mwandb[0m: Agent Starting Run: jfz25ris with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,█▁▇
val_loss,▁█▂

0,1
GFLOPS,0.0
best_epoch,0.0
best_val_loss,0.01097
binary_accuracy,0.99762
epoch,2.0
loss,0.00706
val_binary_accuracy,0.99461
val_loss,0.01484


[34m[1mwandb[0m: Agent Starting Run: f0bwktd4 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,█▁▇
val_loss,▁█▂

0,1
GFLOPS,0.0
best_epoch,0.0
best_val_loss,0.0119
binary_accuracy,0.99761
epoch,2.0
loss,0.00708
val_binary_accuracy,0.99378
val_loss,0.01729


[34m[1mwandb[0m: Agent Starting Run: xsqh2x46 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='72.267 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=0.9862…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,█▁█
val_loss,▁█▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.01053
binary_accuracy,0.99764
epoch,2.0
loss,0.00704
val_binary_accuracy,0.99618
val_loss,0.01053


[34m[1mwandb[0m: Agent Starting Run: 9kfd3n9e with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▄█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▃█
val_loss,█▆▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.56388
binary_accuracy,0.68317
epoch,2.0
loss,0.59988
val_binary_accuracy,0.72283
val_loss,0.56388


[34m[1mwandb[0m: Agent Starting Run: 1g1hykza with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▃█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▃█
val_loss,█▆▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.5602
binary_accuracy,0.68662
epoch,2.0
loss,0.59738
val_binary_accuracy,0.72636
val_loss,0.5602


[34m[1mwandb[0m: Agent Starting Run: wgu4j3v7 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▄█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▃█
val_loss,█▆▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.56176
binary_accuracy,0.68517
epoch,2.0
loss,0.59848
val_binary_accuracy,0.72517
val_loss,0.56176


[34m[1mwandb[0m: Agent Starting Run: abgbzzi9 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▅█
val_loss,█▅▁

0,1
GFLOPS,0.0
best_epoch,2.0
best_val_loss,0.00708
binary_accuracy,0.99712
epoch,2.0
loss,0.00965
val_binary_accuracy,0.99777
val_loss,0.00708


[34m[1mwandb[0m: Agent Starting Run: m2dtjbga with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3