# Text classification using TensorFlow: Sentiment on Reviews

This notebook trains a binary sentiment classifier that labels restaurant food reviews as *negative* or *positive* from the text of the review. The target labels come from a sentiment score that was previously calculated for each review.


In [None]:
from google.colab import drive 
# Mount Google Drive at /content/drive; the data and model folders used below live under it
drive.mount('/content/drive')

Drive already mounted at /content/drive; to attempt to forcibly remount, call drive.mount("/content/drive", force_remount=True).


In [None]:
!pip install --upgrade -q wandb
import wandb
from wandb.keras import WandbCallback
import os
import random
import numpy as np
import pandas as pd
import shutil
import time
import datetime
from datetime import datetime, timedelta
from timeit import default_timer as timer
import pickle
import joblib
from sklearn.utils import shuffle
import tensorflow as tf
from tensorflow.keras import layers
from tensorflow.keras import losses
from tensorboard.plugins.hparams import api as hp
from tensorflow.keras.callbacks import ReduceLROnPlateau, ModelCheckpoint, Callback, EarlyStopping
from tensorflow.keras.optimizers import Adam, RMSprop, SGD, Nadam
import matplotlib
import matplotlib.pyplot as plt
import tqdm
from tensorflow import keras
from keras.utils import np_utils

In [None]:
# Report the CUDA compiler version and the GPU attached to this runtime
print('CUDA and NVIDIA GPU Information')
!/usr/local/cuda/bin/nvcc --version
!nvidia-smi

# Report the TensorFlow/Keras versions and how many GPUs TensorFlow can see
print('\n')
print('TensorFlow version: {}'.format(tf.__version__))
print('Eager execution is: {}'.format(tf.executing_eagerly()))
print('Keras version: {}'.format(tf.keras.__version__))
print('Num GPUs Available: ', len(tf.config.list_physical_devices('GPU')))

CUDA and NVIDIA GPU Information
nvcc: NVIDIA (R) Cuda compiler driver
Copyright (c) 2005-2020 NVIDIA Corporation
Built on Mon_Oct_12_20:09:46_PDT_2020
Cuda compilation tools, release 11.1, V11.1.105
Build cuda_11.1.TC455_06.29190527_0
Tue Jul  5 04:43:13 2022       
+-----------------------------------------------------------------------------+
| NVIDIA-SMI 460.32.03    Driver Version: 460.32.03    CUDA Version: 11.2     |
|-------------------------------+----------------------+----------------------+
| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |
| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |
|                               |                      |               MIG M. |
|   0  Tesla P100-PCIE...  Off  | 00000000:00:04.0 Off |                    0 |
| N/A   37C    P0    28W / 250W |      0MiB / 16280MiB |      0%      Default |
|                               |                      |                  N/A |
+------------

In [None]:
# Reproducibility in TF 
def init_seeds(seed=42):
    """Seed NumPy, Python and TensorFlow and register a single-threaded TF1 session.

    Sets the ``TF_CUDNN_DETERMINISTIC`` and ``TF_DETERMINISTIC_OPS``
    environment variables, seeds ``numpy.random``, ``random`` and
    ``tf.random`` with the same value, and installs a
    ``tf.compat.v1.Session`` limited to one intra-op and one inter-op thread
    as the Keras backend session.

    Args:
        seed: Integer seed applied to all three random number generators.

    Returns:
        The ``tf.compat.v1.Session`` that was registered with Keras.
    """
    # Request deterministic kernels before any op is created
    os.environ['TF_CUDNN_DETERMINISTIC'] = 'true'
    os.environ['TF_DETERMINISTIC_OPS'] = 'true'

    np.random.seed(seed)
    random.seed(seed)
    tf.random.set_seed(seed)

    # Restrict TensorFlow to one thread within an op and one thread across ops
    session_conf = tf.compat.v1.ConfigProto(intra_op_parallelism_threads=1,
                                            inter_op_parallelism_threads=1)
    sess = tf.compat.v1.Session(graph=tf.compat.v1.get_default_graph(),
                                config=session_conf)
    tf.compat.v1.keras.backend.set_session(sess)
    return sess

In [None]:
# Seed every RNG before any data is shuffled or any model is built
init_seeds(seed=42)

<tensorflow.python.client.session.Session at 0x7f2b6072bd90>

In [None]:
# Work from the Drive folder that holds the review data
%cd /content/drive/MyDrive/Yelp_Reviews/Data/

/content/drive/MyDrive/Yelp_Reviews/Data


In [None]:
# Load the pre-tokenized reviews together with their sentiment labels
df = pd.read_parquet('YelpReviews_NLP_sentimentNegPos_tokenized.parquet')
frame_shape = df.shape
print('Number of rows and columns:', frame_shape)
df.head()

Number of rows and columns: (829874, 3)


Unnamed: 0_level_0,cleanReview,sentiment,stars_reviews
index,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
1,"[order, chicken, finger, sub, honey, mustard, ...",Negative,3.0
3,"[dedicated, loving, memory, gary, feldman, gre...",Negative,5.0
12,"[absolutely, horrible, thought, would, order, ...",Negative,1.0
15,"[found, better, chicken, finger, know, inside,...",Negative,4.0
20,"[amazing, everything, tried, disappoint, chick...",Negative,5.0


In [None]:
# Count each (star rating, sentiment label) pair to see how well the two agree
star_sentiment_counts = df[['stars_reviews', 'sentiment']].value_counts()
print(star_sentiment_counts)

stars_reviews  sentiment
5.0            Positive     278011
1.0            Negative     231245
4.0            Positive     104585
2.0            Negative      90320
3.0            Negative      44097
4.0            Negative      26276
5.0            Negative      22999
3.0            Positive      22096
2.0            Positive       6690
1.0            Positive       3555
dtype: int64


In [None]:
# Collapse each token list into a single space-separated string
def _tokens_to_text(tokens):
    """Join tokens with spaces; any comma inside a token is also turned into a space."""
    return ' '.join(str(token) for token in tokens).replace(',', ' ')


df = df.assign(cleanReview=df['cleanReview'].map(_tokens_to_text))
df.head()

Unnamed: 0_level_0,cleanReview,sentiment,stars_reviews
index,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
1,order chicken finger sub honey mustard sauce p...,Negative,3.0
3,dedicated loving memory gary feldman greatest ...,Negative,5.0
12,absolutely horrible thought would order place ...,Negative,1.0
15,found better chicken finger know inside crisp ...,Negative,4.0
20,amazing everything tried disappoint chicken ca...,Negative,5.0


In [None]:
# Recode to binary
# Build the recoded column and assign it back, rather than calling an in-place
# method on `df['sentiment']`: that is chained assignment, which pandas warns
# about and which leaves `df` unchanged when Copy-on-Write is enabled.
sentiment = df['sentiment']
sentiment = sentiment.mask(sentiment == 'Negative', 0)
sentiment = sentiment.mask(sentiment == 'Positive', 1)
df = df.assign(sentiment=sentiment)

print('Number of reviews per group:')
df[['sentiment']].value_counts()

Number of reviews per group:


sentiment
0            414937
1            414937
dtype: int64

In [None]:
# Drop the star rating (only the text and the label are used below), then shuffle the rows
df = shuffle(df.drop(columns=['stars_reviews']))
df.shape

(829874, 2)

In [None]:
# Cast the review text to str and the label to float32
df = df.assign(
    cleanReview=df['cleanReview'].astype('str'),
    sentiment=df['sentiment'].astype('float32'),
)

In [None]:
# Separate the model input (review text) from the target (binary sentiment label)
features = df['cleanReview']
labels = df['sentiment']

In [None]:
# Load pandas df to tf
# NOTE: from this cell on, `df` is a tf.data.Dataset of (review, label) pairs, not a DataFrame
df = tf.data.Dataset.from_tensor_slices((features, labels))

In [None]:
# Define components for partitioning data: 80% train, 10% validation, 10% test
BATCH_SIZE = 32
df_size = df.cardinality().numpy()
train_size, val_size, test_size = (int(fraction * df_size)
                                   for fraction in (0.8, 0.10, 0.10))

In [None]:
# Prepare train/validation/test sets
# A fixed seed without per-iteration reshuffling keeps the three splits stable
df = df.shuffle(800_000, seed=42, reshuffle_each_iteration=False)

# The first `train_size` examples are the training split; the rest is held out
train = df.take(train_size).batch(BATCH_SIZE)
holdout = df.skip(train_size)

# Test is the first `test_size` held-out examples; validation is whatever
# remains of the hold-out after skipping `val_size` examples
test = holdout.take(test_size).batch(BATCH_SIZE)
val = holdout.skip(val_size).batch(BATCH_SIZE)

# Lengths below are numbers of batches, not numbers of examples
for split_label, split_ds in (('Train data split:', train),
                              ('Eval data split', val),
                              ('Test data split', test)):
    print(split_label, len(split_ds))

Train data split: 20747
Eval data split 2594
Test data split 2594


# Sentiment analysis




### Prepare the data for training

Next, the reviews are tokenized and vectorized using the `tf.keras.layers.TextVectorization` layer. Tokenization refers to splitting strings into single words, or tokens. Vectorization converts the tokens into numbers as input for the neural network. Unique integer indices are created for each token by using `output_mode` = `int`. `max_features` caps the size of the vocabulary, and `sequence_length` is the fixed number of token indices each review is padded or truncated to.

In [None]:
# Vocabulary cap and fixed per-review length used by the vectorization layer
max_features = 50000
sequence_length = 300

# output_mode='int' maps each token to an integer index; output_sequence_length
# fixes the number of indices produced per review
vectorize_layer = layers.TextVectorization(
    max_tokens=max_features,
    output_mode='int',
    output_sequence_length=sequence_length)

The preprocessing layer is fit by calling `adapt` on the training text only, which builds the layer's vocabulary: an index that maps each string token to an integer.

In [None]:
# Strip the labels so that the layer is adapted on the training review text only
train_text = train.map(lambda review, _label: review)
vectorize_layer.adapt(train_text)

Now, define a function to examine how the created layer preprocesses the data:



In [None]:
def vectorize_text(cleanReview, sentiment):
  """Turn review text into integer token ids, passing the label through unchanged.

  Args:
    cleanReview: String tensor of review text; this notebook passes both a
      single review and a whole batch.
    sentiment: Label tensor that accompanies the review(s).

  Returns:
    A ``(token_ids, sentiment)`` tuple, where ``token_ids`` is the output of
    ``vectorize_layer``.
  """
  # Add a trailing axis so each review becomes its own row for the layer
  review_column = tf.expand_dims(cleanReview, axis=-1)
  token_ids = vectorize_layer(review_column)
  return token_ids, sentiment

In [None]:
# Pull one batch from the training split and inspect its first example
text_batch, label_batch = next(iter(train))
first_review = text_batch[0]
first_label = label_batch[0]
vectorized_example = vectorize_text(first_review, first_label)
print('Review', first_review)
print('Label', first_label)
print('Vectorized review', vectorized_example)

Review tf.Tensor(b'waste time still business yet competition dripping springs area ordered delivery dozen time food usually okay delivery service horrible tried order three different occasion delivery told delivery driver called sick tonight placed order people told hour hour fifteen minute called hour minute later informed delivery driver leave work call replacement two hour later still food called back two people working friendly gm always mia wait another chinese place come town put business delivery fee also outrageous type service', shape=(), dtype=string)
Label tf.Tensor(0.0, shape=(), dtype=float32)
Vectorized review (<tf.Tensor: shape=(1, 300), dtype=int64, numpy=
array([[ 444,    7,   85,  193,  365, 2678, 2372, 2330,  123,   16,  230,
        1280,    7,    2,  288,  406,  230,    6,  122,  101,   11,  260,
         231,  936,  230,   82,  230,  789,  177,  549,  462,  616,   11,
          42,   82,   63,   63, 3115,   29,  177,   63,   29,  270, 1135,
         230,  789,  30

In [None]:
# Fetch the vocabulary once and reuse it; every get_vocabulary() call builds the full token list again
vocabulary = vectorize_layer.get_vocabulary()
print('12870 ---> ', vocabulary[12870])
print(' 3130 ---> ', vocabulary[3130])
print('Vocabulary size: {}'.format(len(vocabulary)))

12870 --->  spongey
 3130 --->  unsanitary
Vocabulary size: 50000


Then, apply the `TextVectorization` layer to the train, validation, and test sets.

In [None]:
# Vectorize every split with the layer that was adapted on the training text
train_ds, val_ds, test_ds = (
    split.map(vectorize_text) for split in (train, val, test)
)

Configure the dataset for performance by using `.cache()` and `.prefetch()`.




In [None]:
AUTOTUNE = tf.data.AUTOTUNE

# Cache each vectorized split and let tf.data pick the prefetch buffer size
train_ds, val_ds, test_ds = (
    split_ds.cache().prefetch(buffer_size=AUTOTUNE)
    for split_ds in (train_ds, val_ds, test_ds)
)

# Hyperparameter Tuning

In [None]:
# Set path for results
%cd /content/drive/MyDrive/Yelp_Reviews/DL/BoW/SentimentPolarity/Models/

/content/drive/MyDrive/Yelp_Reviews/DL/BoW/SentimentPolarity/Models


In [None]:
# Configure the sweep
# The metric name has to be a key that the training runs actually log. The
# Keras callback logs `binary_accuracy` and `val_binary_accuracy`, so rank
# runs by validation accuracy.
sweep_config = {
    'method': 'random',
    'metric': {
        'name': 'val_binary_accuracy',
        'goal': 'maximize'
    },
    'parameters': {
        'epochs': {
            'values': [3, 5, 7]
        },
        'batch_size': {
            'values': [8, 4, 2, 1]
        },
        'embedding_dim': {
            'values': [128, 64, 32]
        },
        'dropout': {
            'values': [0.2, 0.3, 0.4, 0.5]
        },
        'weight_decay': {
            'values': [0.0005, 0.005, 0.05]
        },
        'learning_rate': {
            'values': [0.00001, 0.00005, 0.0001, 0.0005, 0.001, 0.005, 0.01]
        },
        'optimizer': {
            'values': ['adam', 'nadam', 'sgd', 'rmsprop']
        },
    }
}

## 2. Initialize the Sweep

In [None]:
# Initialize a new sweep
# Registers the sweep configuration under the given entity/project and keeps the returned sweep ID for the agent
sweep_id = wandb.sweep(sweep_config, entity='aschultz', 
                       project='tf_textclass_sentpol_r2')

Create sweep with ID: o70jyzyg
Sweep URL: https://wandb.ai/aschultz/tf_textclass_sentpol_r2/sweeps/o70jyzyg


### Define Neural Network


In [None]:
# The sweep calls this function with each set of hyperparameters
def train():
    """Train and log one sweep trial.

    Starts a wandb run, reads the hyperparameters from ``wandb.config``
    (sweep values override the defaults below), builds an
    Embedding -> Dropout -> GlobalAveragePooling1D -> Dropout -> Dense(1)
    model that outputs a single logit, and fits it on ``train_ds`` with
    ``val_ds`` as validation data.

    Raises:
        ValueError: If ``config.optimizer`` is not one of 'sgd', 'rmsprop',
            'adam' or 'nadam'.

    NOTE(review): defining this function rebinds the notebook-level name
    ``train``, which earlier cells use for the batched training dataset;
    re-running those cells after this one will fail.
    NOTE(review): ``weight_decay`` and ``seed`` are part of the config but
    are not applied anywhere in this function.
    """
    # Default values for hyperparameters
    config_defaults = {
        'epochs': 5,
        'batch_size': 8,
        'weight_decay': 0.0005,
        'learning_rate': 0.01,
        'optimizer': 'adam',
        'embedding_dim': 32,
        'dropout': 0.5,
        'momentum': 0.9,
        'seed': 42
    }

    # Initialize a new wandb run
    wandb.init(config=config_defaults)

    # Config hyperparameters and inputs
    config = wandb.config

    # `fit(batch_size=...)` must not be used with tf.data inputs because the
    # dataset itself defines the batches, and `train_ds` is already batched.
    # Re-batch it here so the configured batch size actually takes effect.
    train_batches = (train_ds
                     .unbatch()
                     .batch(config.batch_size)
                     .prefetch(tf.data.AUTOTUNE))

    # Define the model architecture: averaged token embeddings feeding one logit
    model = tf.keras.Sequential()
    model.add(tf.keras.layers.Embedding(max_features + 1, config.embedding_dim))
    model.add(tf.keras.layers.Dropout(config.dropout))
    model.add(tf.keras.layers.GlobalAveragePooling1D())
    model.add(tf.keras.layers.Dropout(config.dropout))
    model.add(tf.keras.layers.Dense(1))

    # Define the optimizer
    if config.optimizer == 'sgd':
        optimizer = SGD(learning_rate=config.learning_rate, decay=1e-5,
                        momentum=config.momentum, nesterov=True)
    elif config.optimizer == 'rmsprop':
        optimizer = RMSprop(learning_rate=config.learning_rate, decay=1e-5)
    elif config.optimizer == 'adam':
        optimizer = Adam(learning_rate=config.learning_rate, beta_1=0.9,
                         beta_2=0.999, clipnorm=1.0)
    elif config.optimizer == 'nadam':
        optimizer = Nadam(learning_rate=config.learning_rate, beta_1=0.9,
                          beta_2=0.999, clipnorm=1.0)
    else:
        # Fail with a clear message instead of an unbound `optimizer` below
        raise ValueError(
            'Unsupported optimizer: {!r}'.format(config.optimizer))

    # Define loss and metrics; the model emits logits, so accuracy thresholds at 0.0
    model.compile(loss=losses.BinaryCrossentropy(from_logits=True),
                  optimizer=optimizer,
                  metrics=[tf.metrics.BinaryAccuracy(threshold=0.0)])

    # Fit model
    # NOTE(review): patience=10 is larger than the epoch counts used in this
    # notebook (at most 7), so early stopping cannot trigger — confirm the
    # intended patience.
    model.fit(train_batches,
              epochs=config.epochs,
              validation_data=val_ds,
              callbacks=[WandbCallback(data_type='text', validation_data=val_ds),
                         EarlyStopping(patience=10,
                                       restore_best_weights=True)])

## 3. Run the sweep agent

In [None]:
# Run sweep for HPO
# NOTE(review): no `count` is passed, so the agent presumably keeps requesting runs from the random sweep until it is stopped manually — confirm this is intended
wandb.agent(sweep_id, train)

[34m[1mwandb[0m: Agent Starting Run: xzcb1ebo with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005




Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▅█
val_loss,█▃▁

0,1
best_epoch,2.0
best_val_loss,0.64671
binary_accuracy,0.61253
epoch,2.0
loss,0.65419
val_binary_accuracy,0.64073
val_loss,0.64671


[34m[1mwandb[0m: Agent Starting Run: 9ytlstul with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆▇▇█
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_binary_accuracy,▁▅███
val_loss,█▅▃▂▁

0,1
best_epoch,4.0
best_val_loss,0.655
binary_accuracy,0.59867
epoch,4.0
loss,0.66204
val_binary_accuracy,0.63843
val_loss,0.655


[34m[1mwandb[0m: Agent Starting Run: 2qpd15nb with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆▇████
epoch,▁▂▃▅▆▇█
loss,█▃▂▁▁▁▁
val_binary_accuracy,▁▂▆▇▆██
val_loss,█▇▃▂▃▂▁

0,1
best_epoch,6.0
best_val_loss,0.00817
binary_accuracy,0.99674
epoch,6.0
loss,0.01143
val_binary_accuracy,0.99749
val_loss,0.00817


[34m[1mwandb[0m: Agent Starting Run: s2aan9fi with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▃▄▆▇▇█
epoch,▁▂▃▅▆▇█
loss,█▇▅▄▃▂▁
val_binary_accuracy,▁▂▄▅▆▇█
val_loss,█▆▅▄▃▂▁

0,1
best_epoch,6.0
best_val_loss,0.69058
binary_accuracy,0.53431
epoch,6.0
loss,0.69092
val_binary_accuracy,0.53033
val_loss,0.69058


[34m[1mwandb[0m: Agent Starting Run: 3xx86o4t with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁█▆
val_loss,█▁▂

0,1
best_epoch,1.0
best_val_loss,0.0097
binary_accuracy,0.99673
epoch,2.0
loss,0.00949
val_binary_accuracy,0.99594
val_loss,0.01119


[34m[1mwandb[0m: Agent Starting Run: pt3rsali with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='36.649 MB of 36.649 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▇█
val_loss,█▂▁

0,1
best_epoch,2.0
best_val_loss,0.00768
binary_accuracy,0.99763
epoch,2.0
loss,0.00849
val_binary_accuracy,0.99766
val_loss,0.00768


[34m[1mwandb[0m: Agent Starting Run: vq0tn9bz with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█████
epoch,▁▂▃▅▆▇█
loss,█▂▁▁▁▁▁
val_binary_accuracy,▁▅▇▇▇██
val_loss,█▄▂▂▂▁▁

0,1
best_epoch,6.0
best_val_loss,0.0048
binary_accuracy,0.99841
epoch,6.0
loss,0.00504
val_binary_accuracy,0.99841
val_loss,0.0048


[34m[1mwandb[0m: Agent Starting Run: sxt6pguh with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅▆▇█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_binary_accuracy,▁▅▆▇█
val_loss,█▆▅▃▁

0,1
best_epoch,4.0
best_val_loss,0.54178
binary_accuracy,0.81405
epoch,4.0
loss,0.55816
val_binary_accuracy,0.8215
val_loss,0.54178


[34m[1mwandb[0m: Agent Starting Run: p3egdku5 with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='18.339 MB of 18.339 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▆█
val_loss,█▅▁

0,1
best_epoch,2.0
best_val_loss,0.61351
binary_accuracy,0.75208
epoch,2.0
loss,0.63296
val_binary_accuracy,0.77046
val_loss,0.61351


[34m[1mwandb[0m: Agent Starting Run: kpckx0tl with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▄▆▇▇██
epoch,▁▂▃▅▆▇█
loss,█▇▆▅▃▂▁
val_binary_accuracy,▁▄▆▆▇██
val_loss,█▇▆▄▃▂▁

0,1
best_epoch,6.0
best_val_loss,0.49285
binary_accuracy,0.83901
epoch,6.0
loss,0.50685
val_binary_accuracy,0.84544
val_loss,0.49285


[34m[1mwandb[0m: Agent Starting Run: mmcgu9kf with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▂▃▆█
epoch,▁▃▅▆█
loss,██▆▄▁
val_binary_accuracy,▁▁▄▇█
val_loss,█▇▆▃▁

0,1
best_epoch,4.0
best_val_loss,0.39298
binary_accuracy,0.8569
epoch,4.0
loss,0.44645
val_binary_accuracy,0.9352
val_loss,0.39298


[34m[1mwandb[0m: Agent Starting Run: 68gvkf83 with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅▆▇█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_binary_accuracy,▁▄▆▇█
val_loss,█▇▅▃▁

0,1
best_epoch,4.0
best_val_loss,0.40626
binary_accuracy,0.86859
epoch,4.0
loss,0.44221
val_binary_accuracy,0.88632
val_loss,0.40626


[34m[1mwandb[0m: Agent Starting Run: 83cico03 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▄▆▇███
epoch,▁▂▃▅▆▇█
loss,█▆▅▃▂▂▁
val_binary_accuracy,▁▃▅▆▇██
val_loss,█▆▅▄▃▂▁

0,1
best_epoch,6.0
best_val_loss,0.68456
binary_accuracy,0.57001
epoch,6.0
loss,0.68564
val_binary_accuracy,0.59903
val_loss,0.68456


[34m[1mwandb[0m: Agent Starting Run: gkovpnv8 with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='18.339 MB of 18.339 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█████
epoch,▁▂▃▅▆▇█
loss,█▄▂▁▁▁▁
val_binary_accuracy,▁▆▇▇███
val_loss,█▄▂▂▁▁▁

0,1
best_epoch,6.0
best_val_loss,0.03322
binary_accuracy,0.9873
epoch,6.0
loss,0.04287
val_binary_accuracy,0.99044
val_loss,0.03322


[34m[1mwandb[0m: Agent Starting Run: 82zrm3je with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▃▅▇█
epoch,▁▃▅▆█
loss,█▅▄▂▁
val_binary_accuracy,▁▂▄▆█
val_loss,█▆▄▂▁

0,1
best_epoch,4.0
best_val_loss,0.69154
binary_accuracy,0.51846
epoch,4.0
loss,0.69187
val_binary_accuracy,0.51377
val_loss,0.69154


[34m[1mwandb[0m: Agent Starting Run: bf41ex83 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▃█
epoch,▁▅█
loss,█▆▁
val_binary_accuracy,▁▂█
val_loss,█▆▁

0,1
best_epoch,2.0
best_val_loss,0.58507
binary_accuracy,0.65227
epoch,2.0
loss,0.62678
val_binary_accuracy,0.75884
val_loss,0.58507


[34m[1mwandb[0m: Agent Starting Run: siva47vo with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='18.339 MB of 18.339 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
best_epoch,2.0
best_val_loss,0.01131
binary_accuracy,0.99433
epoch,2.0
loss,0.01748
val_binary_accuracy,0.99639
val_loss,0.01131


[34m[1mwandb[0m: Agent Starting Run: xvhy6mou with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='18.338 MB of 18.338 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▆█
val_loss,█▄▁

0,1
best_epoch,2.0
best_val_loss,0.18855
binary_accuracy,0.94745
epoch,2.0
loss,0.25397
val_binary_accuracy,0.96568
val_loss,0.18855


[34m[1mwandb[0m: Agent Starting Run: ghuzvqar with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
best_epoch,2.0
best_val_loss,0.00949
binary_accuracy,0.99577
epoch,2.0
loss,0.01385
val_binary_accuracy,0.99693
val_loss,0.00949


[34m[1mwandb[0m: Agent Starting Run: k92su58x with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁█▄
val_loss,█▁▅

0,1
best_epoch,1.0
best_val_loss,0.00939
binary_accuracy,0.99587
epoch,2.0
loss,0.01166
val_binary_accuracy,0.99526
val_loss,0.01314


[34m[1mwandb[0m: Agent Starting Run: dh12hovr with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▅█
val_loss,█▃▁

0,1
best_epoch,2.0
best_val_loss,0.65036
binary_accuracy,0.59891
epoch,2.0
loss,0.66022
val_binary_accuracy,0.64176
val_loss,0.65036


[34m[1mwandb[0m: Agent Starting Run: tdsiib0k with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅▇██
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_binary_accuracy,▁▅▇██
val_loss,█▅▃▂▁

0,1
best_epoch,4.0
best_val_loss,0.12275
binary_accuracy,0.97064
epoch,4.0
loss,0.14269
val_binary_accuracy,0.97482
val_loss,0.12275


[34m[1mwandb[0m: Agent Starting Run: j3qywzh3 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='18.339 MB of 18.339 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆▇██
epoch,▁▃▅▆█
loss,█▂▂▁▁
val_binary_accuracy,▂▃▇█▁
val_loss,▇▆▂▁█

0,1
best_epoch,3.0
best_val_loss,0.006
binary_accuracy,0.99563
epoch,4.0
loss,0.01252
val_binary_accuracy,0.99538
val_loss,0.01296


[34m[1mwandb[0m: Agent Starting Run: 2x6oi5oy with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▇█
val_loss,█▂▁

0,1
best_epoch,2.0
best_val_loss,0.06203
binary_accuracy,0.9788
epoch,2.0
loss,0.07869
val_binary_accuracy,0.98219
val_loss,0.06203


[34m[1mwandb[0m: Agent Starting Run: 7aqllbm6 with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆▇▇█
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_binary_accuracy,▁▅▇▇█
val_loss,█▅▃▂▁

0,1
best_epoch,4.0
best_val_loss,0.6561
binary_accuracy,0.59472
epoch,4.0
loss,0.6637
val_binary_accuracy,0.63931
val_loss,0.6561


[34m[1mwandb[0m: Agent Starting Run: k4lezu6f with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆▇▇███
epoch,▁▂▃▅▆▇█
loss,█▃▂▁▁▁▁
val_binary_accuracy,▁▃▆▇▇▇█
val_loss,█▆▃▂▁▁▁

0,1
best_epoch,6.0
best_val_loss,0.00606
binary_accuracy,0.99804
epoch,6.0
loss,0.00729
val_binary_accuracy,0.99831
val_loss,0.00606


[34m[1mwandb[0m: Agent Starting Run: zu3i6h4y with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▃▄▅▆▇█
epoch,▁▂▃▅▆▇█
loss,█▆▅▄▃▂▁
val_binary_accuracy,▁▂▃▅▆▇█
val_loss,█▆▅▄▃▂▁

0,1
best_epoch,6.0
best_val_loss,0.69086
binary_accuracy,0.53222
epoch,6.0
loss,0.69113
val_binary_accuracy,0.52692
val_loss,0.69086


[34m[1mwandb[0m: Agent Starting Run: s2b57avr with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='36.649 MB of 36.649 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▄▅▆▇▇█
epoch,▁▂▃▅▆▇█
loss,█▇▆▅▃▂▁
val_binary_accuracy,▁▄▅▆▇▇█
val_loss,█▇▆▄▃▂▁

0,1
best_epoch,6.0
best_val_loss,0.27893
binary_accuracy,0.92626
epoch,6.0
loss,0.30602
val_binary_accuracy,0.93798
val_loss,0.27893


[34m[1mwandb[0m: Agent Starting Run: ago2u58a with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
best_epoch,2.0
best_val_loss,0.01998
binary_accuracy,0.99277
epoch,2.0
loss,0.0267
val_binary_accuracy,0.99432
val_loss,0.01998


[34m[1mwandb[0m: Agent Starting Run: zzi4pkq0 with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='18.338 MB of 18.338 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▄▆▇█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_binary_accuracy,▁▄▆▇█
val_loss,█▇▅▃▁

0,1
best_epoch,4.0
best_val_loss,0.49827
binary_accuracy,0.82892
epoch,4.0
loss,0.5242
val_binary_accuracy,0.84118
val_loss,0.49827


[34m[1mwandb[0m: Agent Starting Run: p4p2c9u9 with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='18.338 MB of 18.338 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅▇██
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_binary_accuracy,▁▅▇██
val_loss,█▅▃▂▁

0,1
best_epoch,4.0
best_val_loss,0.08326
binary_accuracy,0.97813
epoch,4.0
loss,0.10791
val_binary_accuracy,0.98344
val_loss,0.08326


[34m[1mwandb[0m: Agent Starting Run: z8wiffme with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▅█
val_loss,█▄▁

0,1
best_epoch,2.0
best_val_loss,0.68754
binary_accuracy,0.565
epoch,2.0
loss,0.68841
val_binary_accuracy,0.5699
val_loss,0.68754


[34m[1mwandb[0m: Agent Starting Run: j7cwnnu2 with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇███
epoch,▁▃▅▆█
loss,█▃▂▁▁
val_binary_accuracy,▁▇▇██
val_loss,█▃▂▁▁

0,1
best_epoch,4.0
best_val_loss,0.04599
binary_accuracy,0.9844
epoch,4.0
loss,0.05266
val_binary_accuracy,0.98587
val_loss,0.04599


[34m[1mwandb[0m: Agent Starting Run: 8p20cbzp with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▄▆▇▇██
epoch,▁▂▃▅▆▇█
loss,█▇▆▅▃▂▁
val_binary_accuracy,▁▄▆▇▇██
val_loss,█▇▆▄▃▂▁

0,1
best_epoch,6.0
best_val_loss,0.53002
binary_accuracy,0.81906
epoch,6.0
loss,0.5411
val_binary_accuracy,0.82413
val_loss,0.53002


[34m[1mwandb[0m: Agent Starting Run: 9gno45dc with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='18.339 MB of 18.339 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆▇▇███
epoch,▁▂▃▅▆▇█
loss,█▂▂▂▁▁▁
val_binary_accuracy,▄▇▆▄▁██
val_loss,▄▂▃▅█▁▁

0,1
best_epoch,5.0
best_val_loss,0.00441
binary_accuracy,0.99837
epoch,6.0
loss,0.00517
val_binary_accuracy,0.99845
val_loss,0.00521


[34m[1mwandb[0m: Agent Starting Run: bs3rqmti with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='18.339 MB of 18.339 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅▇████
epoch,▁▂▃▅▆▇█
loss,█▅▃▂▂▁▁
val_binary_accuracy,▁▅▇████
val_loss,█▅▃▂▁▁▁

0,1
best_epoch,6.0
best_val_loss,0.05364
binary_accuracy,0.98341
epoch,6.0
loss,0.06239
val_binary_accuracy,0.98548
val_loss,0.05364


[34m[1mwandb[0m: Agent Starting Run: tppss6cu with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆▇▇███
epoch,▁▂▃▅▆▇█
loss,█▆▅▃▃▂▁
val_binary_accuracy,▁▅▆▇▇██
val_loss,█▆▅▄▃▂▁

0,1
best_epoch,6.0
best_val_loss,0.67747
binary_accuracy,0.58733
epoch,6.0
loss,0.67917
val_binary_accuracy,0.61717
val_loss,0.67747


[34m[1mwandb[0m: Agent Starting Run: 3sl95tso with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='18.338 MB of 18.338 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▆█
val_loss,█▅▁

0,1
best_epoch,2.0
best_val_loss,0.59354
binary_accuracy,0.76628
epoch,2.0
loss,0.61769
val_binary_accuracy,0.78558
val_loss,0.59354


[34m[1mwandb[0m: Agent Starting Run: g9owdpqv with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='36.649 MB of 36.649 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆███
epoch,▁▃▅▆█
loss,█▄▂▁▁
val_binary_accuracy,▁▆▇██
val_loss,█▄▂▁▁

0,1
best_epoch,4.0
best_val_loss,0.05399
binary_accuracy,0.98321
epoch,4.0
loss,0.06429
val_binary_accuracy,0.9853
val_loss,0.05399


[34m[1mwandb[0m: Agent Starting Run: cjnjp3bb with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▆█
val_loss,█▅▁

0,1
best_epoch,2.0
best_val_loss,0.58689
binary_accuracy,0.78162
epoch,2.0
loss,0.60958
val_binary_accuracy,0.79663
val_loss,0.58689


[34m[1mwandb[0m: Agent Starting Run: 4andpext with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▆█
val_loss,█▅▁

0,1
best_epoch,2.0
best_val_loss,0.53129
binary_accuracy,0.80881
epoch,2.0
loss,0.56166
val_binary_accuracy,0.82483
val_loss,0.53129


[34m[1mwandb[0m: Agent Starting Run: ed3a5n5i with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='36.649 MB of 36.649 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▅▁█
val_loss,▅█▁

0,1
best_epoch,2.0
best_val_loss,0.00976
binary_accuracy,0.9954
epoch,2.0
loss,0.01303
val_binary_accuracy,0.99649
val_loss,0.00976


[34m[1mwandb[0m: Agent Starting Run: izlu5jsb with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
best_epoch,2.0
best_val_loss,0.01455
binary_accuracy,0.99393
epoch,2.0
loss,0.01804
val_binary_accuracy,0.99495
val_loss,0.01455


[34m[1mwandb[0m: Agent Starting Run: dlwkn85k with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▄▆▇▇██
epoch,▁▂▃▅▆▇█
loss,█▇▆▅▃▂▁
val_binary_accuracy,▁▄▆▇▇██
val_loss,█▇▆▄▃▂▁

0,1
best_epoch,6.0
best_val_loss,0.53208
binary_accuracy,0.81855
epoch,6.0
loss,0.54315
val_binary_accuracy,0.82313
val_loss,0.53208


[34m[1mwandb[0m: Agent Starting Run: h72mxiho with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='18.338 MB of 18.338 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▆█
val_loss,█▅▁

0,1
best_epoch,2.0
best_val_loss,0.593
binary_accuracy,0.77254
epoch,2.0
loss,0.61651
val_binary_accuracy,0.78955
val_loss,0.593


[34m[1mwandb[0m: Agent Starting Run: 7umipknm with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▄█
val_loss,█▅▁

0,1
best_epoch,2.0
best_val_loss,0.01115
binary_accuracy,0.9946
epoch,2.0
loss,0.01731
val_binary_accuracy,0.99649
val_loss,0.01115


[34m[1mwandb[0m: Agent Starting Run: ivq2e0jy with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='18.338 MB of 18.338 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇███
epoch,▁▃▅▆█
loss,█▃▂▁▁
val_binary_accuracy,▁▆▇██
val_loss,█▃▂▁▁

0,1
best_epoch,4.0
best_val_loss,0.02297
binary_accuracy,0.99251
epoch,4.0
loss,0.02858
val_binary_accuracy,0.99363
val_loss,0.02297


[34m[1mwandb[0m: Agent Starting Run: furz82vd with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='36.649 MB of 36.649 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▇█
val_loss,█▂▁

0,1
best_epoch,2.0
best_val_loss,0.02676
binary_accuracy,0.9906
epoch,2.0
loss,0.03702
val_binary_accuracy,0.99283
val_loss,0.02676


[34m[1mwandb[0m: Agent Starting Run: oi4yfd92 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='18.339 MB of 18.339 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,█▄▁
val_loss,▁▆█

0,1
best_epoch,0.0
best_val_loss,0.00821
binary_accuracy,0.99618
epoch,2.0
loss,0.01102
val_binary_accuracy,0.99589
val_loss,0.01143


[34m[1mwandb[0m: Agent Starting Run: r3ipdsed with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅▇▇█
epoch,▁▃▅▆█
loss,█▄▂▂▁
val_binary_accuracy,▁▅▆▇█
val_loss,█▅▃▂▁

0,1
best_epoch,4.0
best_val_loss,0.64141
binary_accuracy,0.61492
epoch,4.0
loss,0.64973
val_binary_accuracy,0.64394
val_loss,0.64141


[34m[1mwandb[0m: Agent Starting Run: kxtkvn6k with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='36.649 MB of 36.649 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▄▆▇█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_binary_accuracy,▁▄▆▇█
val_loss,█▇▅▃▁

0,1
best_epoch,4.0
best_val_loss,0.46361
binary_accuracy,0.8442
epoch,4.0
loss,0.49338
val_binary_accuracy,0.85927
val_loss,0.46361


[34m[1mwandb[0m: Agent Starting Run: 81evke16 with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇███
epoch,▁▃▅▆█
loss,█▂▁▁▁
val_binary_accuracy,▁▅▆▇█
val_loss,█▄▃▁▁

0,1
best_epoch,4.0
best_val_loss,0.01443
binary_accuracy,0.99452
epoch,4.0
loss,0.01715
val_binary_accuracy,0.99534
val_loss,0.01443


[34m[1mwandb[0m: Agent Starting Run: gfcw3a0j with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='18.338 MB of 18.338 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
best_epoch,2.0
best_val_loss,0.01021
binary_accuracy,0.99531
epoch,2.0
loss,0.01639
val_binary_accuracy,0.99723
val_loss,0.01021


[34m[1mwandb[0m: Agent Starting Run: qrwlieh9 with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▃▅▆█
epoch,▁▃▅▆█
loss,█▆▄▂▁
val_binary_accuracy,▁▃▄▆█
val_loss,█▆▄▂▁

0,1
best_epoch,4.0
best_val_loss,0.69103
binary_accuracy,0.52395
epoch,4.0
loss,0.69129
val_binary_accuracy,0.51881
val_loss,0.69103


[34m[1mwandb[0m: Agent Starting Run: b8mghh8n with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██████
epoch,▁▂▃▅▆▇█
loss,█▂▁▁▁▁▁
val_binary_accuracy,▁▅▆▇▇██
val_loss,█▄▂▂▂▁▁

0,1
best_epoch,6.0
best_val_loss,0.00348
binary_accuracy,0.99903
epoch,6.0
loss,0.00344
val_binary_accuracy,0.99901
val_loss,0.00348


[34m[1mwandb[0m: Agent Starting Run: bhruby58 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
best_epoch,2.0
best_val_loss,0.03697
binary_accuracy,0.98612
epoch,2.0
loss,0.04489
val_binary_accuracy,0.98818
val_loss,0.03697


[34m[1mwandb[0m: Agent Starting Run: 6vbp12k1 with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▅█
val_loss,█▅▁

0,1
best_epoch,2.0
best_val_loss,0.45521
binary_accuracy,0.83745
epoch,2.0
loss,0.50317
val_binary_accuracy,0.86112
val_loss,0.45521


[34m[1mwandb[0m: Agent Starting Run: wxxhj1w6 with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▂▃▆█
epoch,▁▃▅▆█
loss,██▆▄▁
val_binary_accuracy,▁▁▄▇█
val_loss,█▇▆▃▁

0,1
best_epoch,4.0
best_val_loss,0.39132
binary_accuracy,0.85859
epoch,4.0
loss,0.44412
val_binary_accuracy,0.93587
val_loss,0.39132


[34m[1mwandb[0m: Agent Starting Run: oxr90gv3 with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▃▆██
epoch,▁▃▅▆█
loss,█▇▄▂▁
val_binary_accuracy,▁▄███
val_loss,█▆▃▂▁

0,1
best_epoch,4.0
best_val_loss,0.17017
binary_accuracy,0.92364
epoch,4.0
loss,0.21911
val_binary_accuracy,0.96014
val_loss,0.17017


[34m[1mwandb[0m: Agent Starting Run: cd0nmda1 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='18.338 MB of 18.338 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▆█
val_loss,█▅▁

0,1
best_epoch,2.0
best_val_loss,0.5871
binary_accuracy,0.77233
epoch,2.0
loss,0.612
val_binary_accuracy,0.79121
val_loss,0.5871


[34m[1mwandb[0m: Agent Starting Run: wqs4et9l with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='18.338 MB of 18.338 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█████
epoch,▁▂▃▅▆▇█
loss,█▂▁▁▁▁▁
val_binary_accuracy,▁▆▇▇███
val_loss,█▃▂▂▁▁▁

0,1
best_epoch,6.0
best_val_loss,0.00431
binary_accuracy,0.99842
epoch,6.0
loss,0.0056
val_binary_accuracy,0.99871
val_loss,0.00431


[34m[1mwandb[0m: Agent Starting Run: nw84sr59 with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇███
epoch,▁▃▅▆█
loss,█▂▁▁▁
val_binary_accuracy,▁▆█▇█
val_loss,█▃▂▁▁

0,1
best_epoch,4.0
best_val_loss,0.01016
binary_accuracy,0.99663
epoch,4.0
loss,0.01048
val_binary_accuracy,0.9964
val_loss,0.01016


[34m[1mwandb[0m: Agent Starting Run: 9njey50y with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆▇██
epoch,▁▃▅▆█
loss,█▅▂▁▁
val_binary_accuracy,▁▆▇██
val_loss,█▄▂▁▁

0,1
best_epoch,4.0
best_val_loss,0.08101
binary_accuracy,0.97723
epoch,4.0
loss,0.09391
val_binary_accuracy,0.97962
val_loss,0.08101


[34m[1mwandb[0m: Agent Starting Run: 8k3wgzlt with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='18.339 MB of 18.339 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇▇██
epoch,▁▃▅▆█
loss,█▂▁▁▁
val_binary_accuracy,▅▁██▅
val_loss,▄█▁▁▄

0,1
best_epoch,3.0
best_val_loss,0.00536
binary_accuracy,0.99588
epoch,4.0
loss,0.01195
val_binary_accuracy,0.99545
val_loss,0.01289


[34m[1mwandb[0m: Agent Starting Run: vjnbncvx with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅▇▇███
epoch,▁▂▃▅▆▇█
loss,█▆▅▄▃▂▁
val_binary_accuracy,▁▄▆▇▇██
val_loss,█▆▅▄▃▂▁

0,1
best_epoch,6.0
best_val_loss,0.67622
binary_accuracy,0.59965
epoch,6.0
loss,0.67755
val_binary_accuracy,0.61825
val_loss,0.67622


[34m[1mwandb[0m: Agent Starting Run: 2zosvjvo with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7