# Text classification using Tensorflow: Sentiment on Reviews
# Hyperparameter Tuning

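This notebook trains a binary sentiment classifier that labels restaurant reviews as *negative* or *positive* from the review text alone. The reviews were tokenized in a previous step, and the sentiment label is derived from each review's star rating (1–2 stars = negative, 5 stars = positive). The model's hyperparameters are then tuned with a Weights & Biases sweep.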


In [None]:
# Mount Google Drive at /content/drive so the data and model folders used below are reachable.
from google.colab import drive 
drive.mount('/content/drive')

Mounted at /content/drive


In [None]:
!pip install --upgrade -q wandb
import wandb
from wandb.keras import WandbCallback
import os
import random
import numpy as np
import warnings
import pandas as pd
import shutil
from sklearn.utils import shuffle
import tensorflow as tf
from tensorflow.keras import layers, losses
from tensorboard.plugins.hparams import api as hp
from tensorflow.keras.callbacks import EarlyStopping, ModelCheckpoint
from tensorflow.keras.optimizers import RMSprop, SGD, Adam, Nadam
import matplotlib.pyplot as plt
import tqdm
warnings.filterwarnings('ignore')

[K     |████████████████████████████████| 1.8 MB 4.1 MB/s 
[K     |████████████████████████████████| 145 kB 56.8 MB/s 
[K     |████████████████████████████████| 181 kB 79.7 MB/s 
[K     |████████████████████████████████| 63 kB 1.8 MB/s 
[?25h  Building wheel for pathtools (setup.py) ... [?25l[?25hdone


In [None]:
# Report the CUDA compiler version, the GPU reported by nvidia-smi, and the
# TensorFlow/Keras versions, so results can be traced back to this environment.
print('CUDA and NVIDIA GPU Information')
!/usr/local/cuda/bin/nvcc --version
!nvidia-smi
print('\n')
print('TensorFlow version: {}'.format(tf.__version__))
print('Eager execution is: {}'.format(tf.executing_eagerly()))
print('Keras version: {}'.format(tf.keras.__version__))
print('Num GPUs Available: ', len(tf.config.list_physical_devices('GPU')))

CUDA and NVIDIA GPU Information
nvcc: NVIDIA (R) Cuda compiler driver
Copyright (c) 2005-2020 NVIDIA Corporation
Built on Mon_Oct_12_20:09:46_PDT_2020
Cuda compilation tools, release 11.1, V11.1.105
Build cuda_11.1.TC455_06.29190527_0
Tue Jul  5 04:48:26 2022       
+-----------------------------------------------------------------------------+
| NVIDIA-SMI 460.32.03    Driver Version: 460.32.03    CUDA Version: 11.2     |
|-------------------------------+----------------------+----------------------+
| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |
| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |
|                               |                      |               MIG M. |
|   0  Tesla P100-PCIE...  Off  | 00000000:00:04.0 Off |                    0 |
| N/A   33C    P0    28W / 250W |      0MiB / 16280MiB |      0%      Default |
|                               |                      |                  N/A |
+------------

In [None]:
# Reproducibility in TF 
def init_seeds(seed=42):
    """Seed the RNGs used in this notebook and request deterministic TF ops.

    Seeds NumPy, Python's ``random`` module and TensorFlow with ``seed``, sets
    the ``TF_CUDNN_DETERMINISTIC`` and ``TF_DETERMINISTIC_OPS`` environment
    flags, and registers a TF1-compat session limited to one intra-op and one
    inter-op thread as the Keras backend session.

    Args:
        seed: Integer seed applied to all three RNGs.

    Returns:
        The ``tf.compat.v1.Session`` registered with the Keras backend.
    """
    np.random.seed(seed)
    random.seed(seed)
    # Restrict TF to a single thread per pool; the former default-constructed
    # ConfigProto that was immediately overwritten has been removed.
    session_conf = tf.compat.v1.ConfigProto(intra_op_parallelism_threads=1,
                                            inter_op_parallelism_threads=1)
    os.environ['TF_CUDNN_DETERMINISTIC'] = 'True'
    os.environ['TF_DETERMINISTIC_OPS'] = 'True'
    tf.random.set_seed(seed)
    sess = tf.compat.v1.Session(graph=tf.compat.v1.get_default_graph(),
                                config=session_conf)
    tf.compat.v1.keras.backend.set_session(sess)
    return sess

In [None]:
# Seed NumPy, random and TensorFlow once, before any data is sampled or shuffled.
init_seeds(seed=42)

<tensorflow.python.client.session.Session at 0x7fa155b8e790>

In [None]:
%cd /content/drive/MyDrive/Yelp_Reviews/Data/

/content/drive/MyDrive/Yelp_Reviews/Data


In [None]:
# Read tokenized reviews with stars filtered to 1, 2 and 5.
# The frame has two columns: `stars_reviews` (rating) and `cleanReview` (list of tokens).
df = pd.read_parquet('YelpReviews_NLP_125stars_tokenized.parquet')
print('Number of rows and columns:', df.shape)
df.head()

Number of rows and columns: (1541486, 2)


Unnamed: 0_level_0,stars_reviews,cleanReview
index,Unnamed: 1_level_1,Unnamed: 2_level_1
2,5.0,"[wonderful, place, get, lunch, staff, friendly..."
3,5.0,"[dedicated, loving, memory, gary, feldman, gre..."
5,5.0,"[love, place, everything, menu, delicious, lik..."
7,5.0,"[truely, hidden, gem, place, greatest, buffalo..."
9,5.0,"[seriously, great, fresh, fantastic, food, spo..."


In [None]:
# Collapse each token list into one space-separated string.
# This is done in a single pass: the previous version joined on ',' and then ran a
# regex replace of ',' with ' ' over the whole column. The trailing
# `.replace(',', ' ')` keeps the result identical even if a token itself
# contains a comma.
df['cleanReview'] = df['cleanReview'].apply(
    lambda tokens: ' '.join(map(str, tokens)).replace(',', ' '))
df.head()

Unnamed: 0_level_0,stars_reviews,cleanReview
index,Unnamed: 1_level_1,Unnamed: 2_level_1
2,5.0,wonderful place get lunch staff friendly effic...
3,5.0,dedicated loving memory gary feldman greatest ...
5,5.0,love place everything menu delicious like tuna...
7,5.0,truely hidden gem place greatest buffalo chick...
9,5.0,seriously great fresh fantastic food spot pric...


In [None]:
# Recode to binary: 1- and 2-star reviews -> 0 (negative), 5-star -> 1 (positive).
# The result is assigned back to the column. The former
# `df['stars_reviews'].mask(..., inplace=True)` mutated a column selection in
# place (chained assignment), which pandas' Copy-on-Write mode does not
# propagate to `df`. Any other rating value is left unchanged, as before.
stars = df['stars_reviews']
df['stars_reviews'] = stars.mask(stars.isin([1, 2]), 0).mask(stars == 5, 1)

print('Number of reviews per group:')
df[['stars_reviews']].value_counts()

Number of reviews per group:


stars_reviews
0.0              770743
1.0              770743
dtype: int64

In [None]:
# Draw a fixed-size random sample of the negative reviews (label 0).
# `DataFrame.sample` already returns the selected rows in random order, so the
# separate `shuffle` pass over the whole class was redundant. The explicit
# `random_state` makes the draw identical each time this cell is re-run.
df1 = df[df.stars_reviews == 0].sample(n=414937, random_state=42)

In [None]:
# Draw the same number of positive reviews (label 1) so both classes are equal in size.
# `DataFrame.sample` already randomizes row order, so no prior `shuffle` is
# needed; `random_state` makes the draw repeatable.
df2 = df[df.stars_reviews == 1].sample(n=414937, random_state=42)

# Combine sampled groups and interleave the two classes in a repeatable order
df = pd.concat([df1, df2])
df = shuffle(df, random_state=42)

del df2

df.shape

(829874, 2)

In [None]:
# Cast both columns in one call: review text -> str, label -> float32
df = df.astype({'cleanReview': 'str', 'stars_reviews': 'float32'})

In [None]:
# Set up features and label: the review text is the model input and the
# binary star-derived value is the target
features = df['cleanReview']
labels = df['stars_reviews']

In [None]:
# Load pandas df to tf: build a dataset of (text, label) pairs.
# NOTE: this rebinds `df` from a pandas DataFrame to a tf.data.Dataset.
df = tf.data.Dataset.from_tensor_slices((features, labels))

In [None]:
# Define components for partitioning data: 80% train, 10% validation, 10% test
BATCH_SIZE = 32
df_size = df.cardinality().numpy()
train_size, val_size, test_size = (
    int(fraction * df_size) for fraction in (0.8, 0.10, 0.10))

In [None]:
# Prepare train/validation/test sets.
# `reshuffle_each_iteration=False` keeps the shuffled order fixed, so the
# take/skip windows below select the same rows on every pass over the data.
# NOTE(review): the shuffle buffer (800,000) is smaller than the dataset, so
# this is not a full uniform shuffle; the DataFrame was already shuffled upstream.
df = df.shuffle(800_000, seed=42, reshuffle_each_iteration=False)
train = df.take(train_size).batch(BATCH_SIZE)

# Everything after the training window is held out for evaluation.
holdout = df.skip(train_size)
test = holdout.take(test_size).batch(BATCH_SIZE)
# Validation starts where the test window ends. The previous code skipped
# `val_size` here, which is only disjoint from `take(test_size)` while the two
# sizes happen to be equal.
val = holdout.skip(test_size).batch(BATCH_SIZE)

print('Train data split:', len(train))
print('Eval data split', len(val))
print('Test data split', len(test))

Train data split: 20747
Eval data split 2594
Test data split 2594


# Sentiment analysis




### Prepare the data for training

Next, the reviews are tokenized and vectorized using the `tf.keras.layers.TextVectorization` layer. Tokenization splits each string into individual words, or tokens. Vectorization converts the tokens into numbers that can be fed to the neural network. Setting `output_mode='int'` assigns a unique integer index to each token. `max_features` caps the size of the vocabulary, and `sequence_length` is the fixed length to which every review is padded or truncated.

In [None]:
# Vocabulary cap and fixed output length for the vectorization layer
max_features = 50000
sequence_length = 300

# Maps each review string to a sequence of `sequence_length` integer token ids
vectorize_layer = layers.TextVectorization(
    max_tokens=max_features,
    output_mode='int',
    output_sequence_length=sequence_length)

The preprocessing layer is fit to the training data by calling `adapt`, which makes the layer build an index that maps each token string to an integer.

In [None]:
# Make a review-only dataset (drop the labels) and then call adapt.
# Only the training split is used, so the vocabulary is built without
# looking at validation or test text.
train_text = train.map(lambda x, y:x)
vectorize_layer.adapt(train_text)

Now, define a function to examine how the created layer preprocesses the data:



In [None]:
def vectorize_text(cleanReview, stars_reviews):
    """Convert review text to integer token ids and pass the label through.

    Args:
        cleanReview: String tensor holding review text.
        stars_reviews: Label tensor; returned unchanged.

    Returns:
        Tuple ``(token_ids, stars_reviews)``, where ``token_ids`` is the output
        of ``vectorize_layer`` applied to the text with a trailing axis added.
    """
    text_column = tf.expand_dims(cleanReview, -1)
    token_ids = vectorize_layer(text_column)
    return token_ids, stars_reviews

In [None]:
# Take one batch of reviews and labels, then show the first review, its label,
# and the integer sequence the vectorization layer produces for it
text_batch, label_batch = next(iter(train))
first_review, first_label = text_batch[0], label_batch[0]
print('Review', first_review)
print('Label', first_label)
print('Vectorized review', vectorize_text(first_review, first_label))

Review tf.Tensor(b'food terribly salted waiter personality never filled husband drink never asked everything good till stacked plate end', shape=(), dtype=string)
Label tf.Tensor(0.0, shape=(), dtype=float32)
Vectorized review (<tf.Tensor: shape=(1, 300), dtype=int64, numpy=
array([[   2, 2137, 1472,  157, 2144,   26,  709,  209,   34,   26,   57,
          77,    4, 1475, 3873,  137,  257,    0,    0,    0,    0,    0,
           0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,
           0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,
           0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,
           0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,
           0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,
           0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,
           0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,
           0,    0,    0,    0,    0,    0,    0,    0,   

In [None]:
# Look up two example token ids and report the vocabulary size.
# The vocabulary list is fetched once and reused instead of being rebuilt by
# a separate `get_vocabulary()` call for every line.
vocabulary = vectorize_layer.get_vocabulary()
print('12870 ---> ', vocabulary[12870])
print(' 3130 ---> ', vocabulary[3130])
print('Vocabulary size: {}'.format(len(vocabulary)))

12870 --->  refers
 3130 --->  aged
Vocabulary size: 50000


Then, apply the `TextVectorization` layer to the train, validation, and test sets.

In [None]:
# Vectorize the text of every batch in each split; labels pass through unchanged
train_ds = train.map(vectorize_text)
val_ds = val.map(vectorize_text)
test_ds = test.map(vectorize_text)

Configure the dataset for performance by using `.cache()` and `.prefetch()`.




In [None]:
# Let tf.data choose the prefetch buffer size at runtime
AUTOTUNE = tf.data.AUTOTUNE

# Cache the vectorized batches and prefetch upcoming ones for each split
train_ds = train_ds.cache().prefetch(buffer_size=AUTOTUNE)
val_ds = val_ds.cache().prefetch(buffer_size=AUTOTUNE)
test_ds = test_ds.cache().prefetch(buffer_size=AUTOTUNE)

# Hyperparameter Tuning

In [None]:
# Set path for results
%cd /content/drive/MyDrive/Yelp_Reviews/Models/DL/BoW/ReviewStars/Models/

In [None]:
# Log into wandb (prompts for an API key when none is stored yet)
wandb.login()

<IPython.core.display.Javascript object>

[34m[1mwandb[0m: Logging into wandb.ai. (Learn how to deploy a W&B server locally: https://wandb.me/wandb-server)
[34m[1mwandb[0m: You can find your API key in your browser here: https://wandb.ai/authorize


wandb: Paste an API key from your profile and hit enter, or press ctrl+c to quit: ··········


[34m[1mwandb[0m: Appending key for api.wandb.ai to your netrc file: /root/.netrc


True

In [None]:
# Configure the sweep: random search over the hyperparameters read by `train()`
sweep_config = {
    'method': 'random',
    # The metric name must be a key that the runs actually log. The Keras
    # callback logs `binary_accuracy` / `val_binary_accuracy`, so the former
    # name 'BinaryAccuracy' never matched anything. Validation accuracy is the
    # quantity to optimize when comparing hyperparameters.
    'metric': {
        'name': 'val_binary_accuracy',
        'goal': 'maximize'},
    'parameters': {
        'epochs': {
            'values': [3, 5, 7]},
        # NOTE(review): the training data is already batched at BATCH_SIZE
        # upstream; confirm this value changes the effective batch size
        # before drawing conclusions from it.
        'batch_size': {
            'values': [8, 4, 2, 1]},
        'embedding_dim': {
            'values': [128, 64, 32]},
        'dropout': {
            'values': [0.2, 0.3, 0.4, 0.5]},
        # NOTE(review): no optimizer in `train()` references this value;
        # confirm it is applied before interpreting its effect.
        'weight_decay': {
            'values': [0.0005, 0.005, 0.05]},
        'learning_rate': {
            'values': [0.00001, 0.00005, 0.0001, 0.0005, 0.001, 0.005, 0.01]},
        'optimizer': {
            'values': ['adam', 'nadam', 'sgd', 'rmsprop']},
    },
}

## 2. Initialize the Sweep

In [None]:
# Initialize a new sweep from `sweep_config` under the given W&B entity and
# project; the returned id is what the agent uses to request runs
sweep_id = wandb.sweep(sweep_config, entity='aschultz', 
                       project='tf_textclass_reviewstars')

Create sweep with ID: ywp4qai8
Sweep URL: https://wandb.ai/aschultz/tf_textclass_reviewstars/sweeps/ywp4qai8


### Define Neural Network


In [None]:
# The sweep calls this function with each set of hyperparameters
def train():
    """Train and log one model for a single W&B sweep run.

    Reads hyperparameters from ``wandb.config`` (falling back to
    ``config_defaults``), builds an embedding -> dropout -> global average
    pooling -> dropout -> single-logit classifier, and fits it on ``train_ds``
    with ``val_ds`` as validation data. Metrics are reported to W&B through
    ``WandbCallback``.

    Raises:
        ValueError: If ``config.optimizer`` is not one of ``'sgd'``,
            ``'rmsprop'``, ``'adam'`` or ``'nadam'``.

    NOTE(review): ``config.batch_size`` and ``config.weight_decay`` are not
    used by the training code below, so sweeping them does not change the model.
    NOTE(review): defining this function rebinds the module-level name
    ``train``, which earlier cells use for the batched training dataset;
    re-running those cells after this one will fail.
    """
    # Default values for hyperparameters (used for any key the sweep omits)
    config_defaults = {
        'epochs': 5,
        'batch_size': 8,
        'weight_decay': 0.0005,
        'learning_rate': 0.01,
        'optimizer': 'adam',
        'embedding_dim': 32,
        'dropout': 0.5,
        'momentum': 0.9,
        'seed': 42}

    # Initialize a new wandb run
    wandb.init(config=config_defaults)

    # Config hyperparameters and inputs
    config = wandb.config

    # Apply the configured seed (previously declared but never used) so each
    # run starts from the same TensorFlow RNG state rather than from wherever
    # the previous run left the global generator.
    tf.random.set_seed(config.seed)

    # Define the model architecture; the final Dense layer emits one logit
    model = tf.keras.Sequential([
        tf.keras.layers.Embedding(max_features + 1, config.embedding_dim),
        tf.keras.layers.Dropout(config.dropout),
        tf.keras.layers.GlobalAveragePooling1D(),
        tf.keras.layers.Dropout(config.dropout),
        tf.keras.layers.Dense(1),
    ])

    # Define the optimizer
    learning_rate = config.learning_rate
    if config.optimizer == 'sgd':
        optimizer = SGD(learning_rate=learning_rate, decay=1e-5,
                        momentum=config.momentum, nesterov=True)
    elif config.optimizer == 'rmsprop':
        optimizer = RMSprop(learning_rate=learning_rate, decay=1e-5)
    elif config.optimizer == 'adam':
        optimizer = Adam(learning_rate=learning_rate, beta_1=0.9,
                         beta_2=0.999, clipnorm=1.0)
    elif config.optimizer == 'nadam':
        optimizer = Nadam(learning_rate=learning_rate, beta_1=0.9,
                          beta_2=0.999, clipnorm=1.0)
    else:
        # Fail with a clear message instead of an unbound `optimizer` below
        raise ValueError(
            'Unsupported optimizer: {!r}'.format(config.optimizer))

    # Define loss and metrics. The model outputs logits, so the loss uses
    # from_logits=True and accuracy thresholds the logit at 0.0.
    model.compile(loss=losses.BinaryCrossentropy(from_logits=True),
                  optimizer=optimizer,
                  metrics=[tf.metrics.BinaryAccuracy(threshold=0.0)])

    # Fit model. `batch_size` is deliberately not passed: `train_ds` is a
    # tf.data.Dataset that already yields batches, and Keras documents that
    # `batch_size` must not be specified for dataset inputs.
    # NOTE(review): patience=10 exceeds the largest swept epoch count (7), so
    # EarlyStopping cannot stop a run early as configured.
    callbacks = [
        WandbCallback(data_type='text', validation_data=(val_ds)),
        EarlyStopping(patience=10, restore_best_weights=True),
    ]
    model.fit(train_ds,
              epochs=config.epochs,
              validation_data=(val_ds),
              callbacks=callbacks)

## 3. Run the sweep agent

In [None]:
# Run sweep for HPO: the agent repeatedly requests a configuration from the
# sweep and calls `train` with it.
# NOTE(review): no `count` is passed, so the number of runs is not bounded
# here; confirm how the sweep is expected to stop.
wandb.agent(sweep_id, train)

[34m[1mwandb[0m: Agent Starting Run: jfj72ec9 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005
[34m[1mwandb[0m: Currently logged in as: [33maschultz[0m. Use [1m`wandb login --relogin`[0m to force relogin




Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇▇████
epoch,▁▂▃▅▆▇█
loss,█▂▂▁▁▁▁
val_binary_accuracy,▁▆▇█▇▇█
val_loss,█▃▂▁▁▂▁

0,1
best_epoch,3.0
best_val_loss,0.10704
binary_accuracy,0.96891
epoch,6.0
loss,0.09356
val_binary_accuracy,0.96507
val_loss,0.10722


[34m[1mwandb[0m: Agent Starting Run: 2fk35uoq with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆▇▇███
epoch,▁▂▃▅▆▇█
loss,█▆▄▃▂▁▁
val_binary_accuracy,▁▅▆▇███
val_loss,█▆▅▃▂▂▁

0,1
best_epoch,6.0
best_val_loss,0.68361
binary_accuracy,0.5649
epoch,6.0
loss,0.68442
val_binary_accuracy,0.57537
val_loss,0.68361


[34m[1mwandb[0m: Agent Starting Run: n3gt5c3a with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▅█
val_loss,█▄▁

0,1
best_epoch,2.0
best_val_loss,0.69219
binary_accuracy,0.51279
epoch,2.0
loss,0.69222
val_binary_accuracy,0.50918
val_loss,0.69219


[34m[1mwandb[0m: Agent Starting Run: 8lt1xuo6 with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇▇██
epoch,▁▃▅▆█
loss,█▂▂▁▁
val_binary_accuracy,▁▆▇█▆
val_loss,█▂▁▁▂

0,1
best_epoch,3.0
best_val_loss,0.10629
binary_accuracy,0.9681
epoch,4.0
loss,0.09539
val_binary_accuracy,0.96534
val_loss,0.10691


[34m[1mwandb[0m: Agent Starting Run: 24cu1tsv with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▄▅▆▇▇█
epoch,▁▂▃▅▆▇█
loss,█▇▆▄▃▂▁
val_binary_accuracy,▁▄▅▆▇▇█
val_loss,█▇▆▄▃▂▁

0,1
best_epoch,6.0
best_val_loss,0.50427
binary_accuracy,0.8117
epoch,6.0
loss,0.51621
val_binary_accuracy,0.81841
val_loss,0.50427


[34m[1mwandb[0m: Agent Starting Run: scyqssu3 with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆▇████
epoch,▁▂▃▅▆▇█
loss,█▅▃▂▁▁▁
val_binary_accuracy,▁▆▇████
val_loss,█▅▃▂▁▁▁

0,1
best_epoch,6.0
best_val_loss,0.17561
binary_accuracy,0.94019
epoch,6.0
loss,0.18022
val_binary_accuracy,0.94135
val_loss,0.17561


[34m[1mwandb[0m: Agent Starting Run: benph5zg with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='18.339 MB of 18.339 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇███
epoch,▁▃▅▆█
loss,█▃▂▁▁
val_binary_accuracy,▁▆▇██
val_loss,█▃▂▁▁

0,1
best_epoch,4.0
best_val_loss,0.16056
binary_accuracy,0.9421
epoch,4.0
loss,0.16989
val_binary_accuracy,0.9451
val_loss,0.16056


[34m[1mwandb[0m: Agent Starting Run: adnpws8i with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇▇██
epoch,▁▃▅▆█
loss,█▂▂▁▁
val_binary_accuracy,▁▅▇██
val_loss,█▄▂▁▁

0,1
best_epoch,4.0
best_val_loss,0.11105
binary_accuracy,0.96456
epoch,4.0
loss,0.10568
val_binary_accuracy,0.9633
val_loss,0.11105


[34m[1mwandb[0m: Agent Starting Run: z0ojgb0w with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▄█
epoch,▁▅█
loss,█▆▁
val_binary_accuracy,▁▃█
val_loss,█▆▁

0,1
best_epoch,2.0
best_val_loss,0.64474
binary_accuracy,0.61144
epoch,2.0
loss,0.6604
val_binary_accuracy,0.67556
val_loss,0.64474


[34m[1mwandb[0m: Agent Starting Run: o0bczptt with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇███
epoch,▁▃▅▆█
loss,█▂▁▁▁
val_binary_accuracy,▆█▅▁▄
val_loss,█▄▂▄▁

0,1
best_epoch,4.0
best_val_loss,0.12035
binary_accuracy,0.96012
epoch,4.0
loss,0.12132
val_binary_accuracy,0.96025
val_loss,0.12035


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: vnqp1ixh with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▄▆▇█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_binary_accuracy,▁▃▅▇█
val_loss,█▇▅▃▁

0,1
best_epoch,4.0
best_val_loss,0.43581
binary_accuracy,0.85224
epoch,4.0
loss,0.46726
val_binary_accuracy,0.87014
val_loss,0.43581


[34m[1mwandb[0m: Agent Starting Run: rt64v60x with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▇█
val_loss,█▂▁

0,1
best_epoch,2.0
best_val_loss,0.17085
binary_accuracy,0.93946
epoch,2.0
loss,0.18375
val_binary_accuracy,0.94232
val_loss,0.17085


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: f9szqojc with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='18.339 MB of 18.339 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
best_epoch,2.0
best_val_loss,0.12751
binary_accuracy,0.95295
epoch,2.0
loss,0.13975
val_binary_accuracy,0.95721
val_loss,0.12751


[34m[1mwandb[0m: Agent Starting Run: ux2qukhm with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆▇██
epoch,▁▃▅▆█
loss,█▅▄▂▁
val_binary_accuracy,▁▅▇▇█
val_loss,█▆▄▂▁

0,1
best_epoch,4.0
best_val_loss,0.68527
binary_accuracy,0.565
epoch,4.0
loss,0.68588
val_binary_accuracy,0.57277
val_loss,0.68527


[34m[1mwandb[0m: Agent Starting Run: s90pglcb with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▂▅▇█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_binary_accuracy,▁▇▆▆█
val_loss,█▆▄▂▁

0,1
best_epoch,4.0
best_val_loss,0.39639
binary_accuracy,0.84409
epoch,4.0
loss,0.37311
val_binary_accuracy,0.79769
val_loss,0.39639


[34m[1mwandb[0m: Agent Starting Run: nfomm1ri with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅▇████
epoch,▁▂▃▅▆▇█
loss,█▅▃▂▂▁▁
val_binary_accuracy,▁▆▇████
val_loss,█▅▃▂▁▁▁

0,1
best_epoch,6.0
best_val_loss,0.18979
binary_accuracy,0.93519
epoch,6.0
loss,0.19683
val_binary_accuracy,0.93703
val_loss,0.18979


[34m[1mwandb[0m: Agent Starting Run: urvmmq7u with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='18.338 MB of 18.338 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▄▁
val_binary_accuracy,▁▇█
val_loss,█▄▁

0,1
best_epoch,2.0
best_val_loss,0.23899
binary_accuracy,0.92929
epoch,2.0
loss,0.28539
val_binary_accuracy,0.93738
val_loss,0.23899


[34m[1mwandb[0m: Agent Starting Run: 3q447nff with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▄▆▇█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_binary_accuracy,▁▄▆▇█
val_loss,█▆▅▃▁

0,1
best_epoch,4.0
best_val_loss,0.63216
binary_accuracy,0.7208
epoch,4.0
loss,0.63907
val_binary_accuracy,0.72544
val_loss,0.63216


[34m[1mwandb[0m: Agent Starting Run: lbndjbu5 with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▅▁█
val_loss,█▅▁

0,1
best_epoch,2.0
best_val_loss,0.11
binary_accuracy,0.96107
epoch,2.0
loss,0.11286
val_binary_accuracy,0.96406
val_loss,0.11


[34m[1mwandb[0m: Agent Starting Run: lhd2a568 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='36.649 MB of 36.649 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇███
epoch,▁▃▅▆█
loss,█▂▂▁▁
val_binary_accuracy,▁▅▇██
val_loss,█▄▂▁▁

0,1
best_epoch,4.0
best_val_loss,0.11434
binary_accuracy,0.96256
epoch,4.0
loss,0.11114
val_binary_accuracy,0.96219
val_loss,0.11434


[34m[1mwandb[0m: Agent Starting Run: 8aaphgat with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇███
epoch,▁▃▅▆█
loss,█▂▁▁▁
val_binary_accuracy,▁▆▇██
val_loss,█▃▂▁▁

0,1
best_epoch,4.0
best_val_loss,0.12832
binary_accuracy,0.95735
epoch,4.0
loss,0.12895
val_binary_accuracy,0.95744
val_loss,0.12832


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 9shny2oy with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▅█
val_loss,█▃▁

0,1
best_epoch,2.0
best_val_loss,0.67966
binary_accuracy,0.55743
epoch,2.0
loss,0.68284
val_binary_accuracy,0.5812
val_loss,0.67966


[34m[1mwandb[0m: Agent Starting Run: rubmjzx4 with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇▇██
epoch,▁▃▅▆█
loss,█▂▂▁▁
val_binary_accuracy,▁▅▇██
val_loss,█▄▂▁▁

0,1
best_epoch,4.0
best_val_loss,0.11206
binary_accuracy,0.96372
epoch,4.0
loss,0.10781
val_binary_accuracy,0.96301
val_loss,0.11206


[34m[1mwandb[0m: Agent Starting Run: vtwlxmye with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
best_epoch,2.0
best_val_loss,0.12799
binary_accuracy,0.95732
epoch,2.0
loss,0.12883
val_binary_accuracy,0.95783
val_loss,0.12799


[34m[1mwandb[0m: Agent Starting Run: 1ynbgvcx with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇███
epoch,▁▃▅▆█
loss,█▂▁▁▁
val_binary_accuracy,▁▅▇▇█
val_loss,█▃▂▁▁

0,1
best_epoch,4.0
best_val_loss,0.15194
binary_accuracy,0.94705
epoch,4.0
loss,0.15511
val_binary_accuracy,0.94779
val_loss,0.15194


[34m[1mwandb[0m: Agent Starting Run: rfwqkdn0 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▃▄▅▆▇█
epoch,▁▂▃▅▆▇█
loss,█▆▅▄▃▂▁
val_binary_accuracy,▁▃▄▅▆▇█
val_loss,█▆▅▄▃▂▁

0,1
best_epoch,6.0
best_val_loss,0.69154
binary_accuracy,0.52646
epoch,6.0
loss,0.69157
val_binary_accuracy,0.52157
val_loss,0.69154


[34m[1mwandb[0m: Agent Starting Run: jdaxj513 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▂▅▇█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_binary_accuracy,▁▇▄▆█
val_loss,█▇▄▃▁

0,1
best_epoch,4.0
best_val_loss,0.36858
binary_accuracy,0.8425
epoch,4.0
loss,0.37698
val_binary_accuracy,0.83178
val_loss,0.36858


[34m[1mwandb[0m: Agent Starting Run: 3q3g9yph with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▁▂▄▆▇█
epoch,▁▂▃▅▆▇█
loss,██▇▆▅▃▁
val_binary_accuracy,▁▂▃▆▇██
val_loss,██▇▆▄▂▁

0,1
best_epoch,6.0
best_val_loss,0.43147
binary_accuracy,0.84248
epoch,6.0
loss,0.45556
val_binary_accuracy,0.87749
val_loss,0.43147


[34m[1mwandb[0m: Agent Starting Run: vf2m0gt0 with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█████
epoch,▁▂▃▅▆▇█
loss,█▂▁▁▁▁▁
val_binary_accuracy,▁▅▇▇███
val_loss,█▄▂▂▁▁▁

0,1
best_epoch,6.0
best_val_loss,0.12833
binary_accuracy,0.95712
epoch,6.0
loss,0.13059
val_binary_accuracy,0.95762
val_loss,0.12833


[34m[1mwandb[0m: Agent Starting Run: qnstox77 with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='18.339 MB of 18.339 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇▇████
epoch,▁▂▃▅▆▇█
loss,█▂▂▁▁▁▁
val_binary_accuracy,▁▅▇▇███
val_loss,█▄▃▂▂▁▁

0,1
best_epoch,6.0
best_val_loss,0.10953
binary_accuracy,0.96477
epoch,6.0
loss,0.10612
val_binary_accuracy,0.9639
val_loss,0.10953


[34m[1mwandb[0m: Agent Starting Run: k93fi8h3 with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 5e-05
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='18.339 MB of 18.339 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅▇████
epoch,▁▂▃▅▆▇█
loss,█▆▃▂▂▁▁
val_binary_accuracy,▁▆▇▇███
val_loss,█▅▃▂▂▁▁

0,1
best_epoch,6.0
best_val_loss,0.18224
binary_accuracy,0.93571
epoch,6.0
loss,0.19178
val_binary_accuracy,0.9381
val_loss,0.18224


[34m[1mwandb[0m: Agent Starting Run: 7nkxd49w with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅▆▇█
epoch,▁▃▅▆█
loss,█▄▂▁▁
val_binary_accuracy,▁▄▇██
val_loss,█▄▃▂▁

0,1
best_epoch,4.0
best_val_loss,0.67769
binary_accuracy,0.56317
epoch,4.0
loss,0.6809
val_binary_accuracy,0.5833
val_loss,0.67769


[34m[1mwandb[0m: Agent Starting Run: cjhge1on with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇▇██
epoch,▁▃▅▆█
loss,█▂▁▁▁
val_binary_accuracy,▁▆▇██
val_loss,█▃▂▁▁

0,1
best_epoch,3.0
best_val_loss,0.10712
binary_accuracy,0.96847
epoch,4.0
loss,0.09491
val_binary_accuracy,0.96491
val_loss,0.10759


[34m[1mwandb[0m: Agent Starting Run: 0a9wz737 with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇███
epoch,▁▃▅▆█
loss,█▂▁▁▁
val_binary_accuracy,▁▆▇██
val_loss,█▃▂▁▁

0,1
best_epoch,4.0
best_val_loss,0.12607
binary_accuracy,0.95862
epoch,4.0
loss,0.12537
val_binary_accuracy,0.9586
val_loss,0.12607


[34m[1mwandb[0m: Agent Starting Run: hwgnpu9x with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▂▅▇▇██
epoch,▁▂▃▅▆▇█
loss,█▇▆▃▂▁▁
val_binary_accuracy,▁▆▆▅▇██
val_loss,█▇▄▃▂▁▁

0,1
best_epoch,6.0
best_val_loss,0.35196
binary_accuracy,0.87514
epoch,6.0
loss,0.30841
val_binary_accuracy,0.82785
val_loss,0.35196


[34m[1mwandb[0m: Agent Starting Run: qedodz8o with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
best_epoch,2.0
best_val_loss,0.15641
binary_accuracy,0.94435
epoch,2.0
loss,0.16348
val_binary_accuracy,0.94634
val_loss,0.15641


[34m[1mwandb[0m: Agent Starting Run: 8kzt639t with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='36.649 MB of 36.649 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆▇▇▇██
epoch,▁▂▃▅▆▇█
loss,█▃▂▂▂▁▁
val_binary_accuracy,▁▄▇▇██▇
val_loss,█▄▂▁▁▁▁

0,1
best_epoch,5.0
best_val_loss,0.10535
binary_accuracy,0.96602
epoch,6.0
loss,0.10195
val_binary_accuracy,0.96613
val_loss,0.1054


[34m[1mwandb[0m: Agent Starting Run: qwysj016 with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇███
epoch,▁▃▅▆█
loss,█▂▁▁▁
val_binary_accuracy,▁▆▇██
val_loss,█▃▂▁▁

0,1
best_epoch,4.0
best_val_loss,0.12833
binary_accuracy,0.95736
epoch,4.0
loss,0.12895
val_binary_accuracy,0.95746
val_loss,0.12833


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: u0cr2irs with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇▇██
epoch,▁▃▅▆█
loss,█▂▂▁▁
val_binary_accuracy,▁▄▆▇█
val_loss,█▄▂▁▁

0,1
best_epoch,4.0
best_val_loss,0.10824
binary_accuracy,0.96577
epoch,4.0
loss,0.10201
val_binary_accuracy,0.96489
val_loss,0.10824


[34m[1mwandb[0m: Agent Starting Run: uvnpgzlk with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
best_epoch,2.0
best_val_loss,0.1561
binary_accuracy,0.94518
epoch,2.0
loss,0.16474
val_binary_accuracy,0.94725
val_loss,0.1561


[34m[1mwandb[0m: Agent Starting Run: 15sopxs2 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='36.649 MB of 36.649 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇▇▇███
epoch,▁▂▃▅▆▇█
loss,█▂▂▁▁▁▁
val_binary_accuracy,▁▆▅█▆▇█
val_loss,█▂▂▁▂▂▂

0,1
best_epoch,3.0
best_val_loss,0.10664
binary_accuracy,0.96967
epoch,6.0
loss,0.09154
val_binary_accuracy,0.9656
val_loss,0.10703


[34m[1mwandb[0m: Agent Starting Run: o3vbp6tt with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆█
epoch,▁▅█
loss,█▅▁
val_binary_accuracy,▁▆█
val_loss,█▅▁

0,1
best_epoch,2.0
best_val_loss,0.59661
binary_accuracy,0.74392
epoch,2.0
loss,0.61518
val_binary_accuracy,0.75647
val_loss,0.59661


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 7hnhy6gb with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▅▆▇▇██
epoch,▁▂▃▅▆▇█
loss,█▄▃▂▂▁▁
val_binary_accuracy,▁▁▆▇█▅▇
val_loss,█▄▁▁▁▂▂

0,1
best_epoch,3.0
best_val_loss,0.10694
binary_accuracy,0.96958
epoch,6.0
loss,0.09122
val_binary_accuracy,0.96548
val_loss,0.10722


[34m[1mwandb[0m: Agent Starting Run: ox62d3ne with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▆█▁
val_loss,█▃▁

0,1
best_epoch,2.0
best_val_loss,0.11842
binary_accuracy,0.96084
epoch,2.0
loss,0.1188
val_binary_accuracy,0.96107
val_loss,0.11842


[34m[1mwandb[0m: Agent Starting Run: lpvkp6bp with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▂▁

0,1
best_epoch,2.0
best_val_loss,0.16072
binary_accuracy,0.94145
epoch,2.0
loss,0.17107
val_binary_accuracy,0.94461
val_loss,0.16072


[34m[1mwandb[0m: Agent Starting Run: xyi9znjm with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='18.339 MB of 18.339 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
best_epoch,2.0
best_val_loss,0.11598
binary_accuracy,0.95915
epoch,2.0
loss,0.12106
val_binary_accuracy,0.96192
val_loss,0.11598


[34m[1mwandb[0m: Agent Starting Run: w31nwxpo with config:
[34m[1mwandb[0m: 	batch_size: 1
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='18.339 MB of 18.339 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
best_epoch,2.0
best_val_loss,0.17787
binary_accuracy,0.93616
epoch,2.0
loss,0.194
val_binary_accuracy,0.93945
val_loss,0.17787


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: fet8o7l4 with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='36.649 MB of 36.649 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆▇▇█
epoch,▁▃▅▆█
loss,█▃▂▂▁
val_binary_accuracy,▃▁▄█▆
val_loss,█▆▄▂▁

0,1
best_epoch,4.0
best_val_loss,0.10793
binary_accuracy,0.96422
epoch,4.0
loss,0.1052
val_binary_accuracy,0.96467
val_loss,0.10793


[34m[1mwandb[0m: Agent Starting Run: qoi2uknp with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='18.338 MB of 18.338 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇███
epoch,▁▃▅▆█
loss,█▂▁▁▁
val_binary_accuracy,▁▇███
val_loss,█▂▁▁▁

0,1
best_epoch,4.0
best_val_loss,0.10683
binary_accuracy,0.96722
epoch,4.0
loss,0.09858
val_binary_accuracy,0.96549
val_loss,0.10683


[34m[1mwandb[0m: Agent Starting Run: jjvzpm7k with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▃█
val_loss,█▄▁

0,1
best_epoch,2.0
best_val_loss,0.10671
binary_accuracy,0.96561
epoch,2.0
loss,0.10178
val_binary_accuracy,0.96531
val_loss,0.10671


[34m[1mwandb[0m: Agent Starting Run: 86wdkznp with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='48.856 MB of 48.856 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁██
epoch,▁▅█
loss,█▃▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
best_epoch,2.0
best_val_loss,0.67789
binary_accuracy,0.57071
epoch,2.0
loss,0.68006
val_binary_accuracy,0.58179
val_loss,0.67789


[34m[1mwandb[0m: Agent Starting Run: o78cjkd0 with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='18.339 MB of 18.339 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆▇▇███
epoch,▁▂▃▅▆▇█
loss,█▃▂▂▁▁▁
val_binary_accuracy,▁▅▆▅▇█▆
val_loss,█▄▂▃▁▁▂

0,1
best_epoch,5.0
best_val_loss,0.10704
binary_accuracy,0.96619
epoch,6.0
loss,0.09997
val_binary_accuracy,0.96492
val_loss,0.10761


[34m[1mwandb[0m: Agent Starting Run: sl6tq7pu with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='18.338 MB of 18.338 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆▇██
epoch,▁▃▅▆█
loss,█▃▂▁▁
val_binary_accuracy,▁▆▅▅█
val_loss,█▂▁▂▁

0,1
best_epoch,4.0
best_val_loss,0.10679
binary_accuracy,0.968
epoch,4.0
loss,0.09588
val_binary_accuracy,0.96557
val_loss,0.10679


[34m[1mwandb[0m: Agent Starting Run: yheqsnqr with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 1e-05
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▄▅▇█
epoch,▁▃▅▆█
loss,█▆▄▂▁
val_binary_accuracy,▁▃▅▇█
val_loss,█▆▄▂▁

0,1
best_epoch,4.0
best_val_loss,0.69174
binary_accuracy,0.52128
epoch,4.0
loss,0.69193
val_binary_accuracy,0.51841
val_loss,0.69174


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 8wp3g1rn with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▆▇████
epoch,▁▂▃▅▆▇█
loss,█▅▄▃▂▁▁
val_binary_accuracy,▁▅▇▇███
val_loss,█▆▄▃▂▂▁

0,1
best_epoch,6.0
best_val_loss,0.68527
binary_accuracy,0.54669
epoch,6.0
loss,0.68683
val_binary_accuracy,0.57652
val_loss,0.68527


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 6enyg7fa with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='12.234 MB of 12.234 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▃▅▇▇██
epoch,▁▂▃▅▆▇█
loss,█▇▅▃▂▁▁
val_binary_accuracy,▁▇▅▆▇██
val_loss,█▆▄▃▂▁▁

0,1
best_epoch,6.0
best_val_loss,0.35054
binary_accuracy,0.88316
epoch,6.0
loss,0.29668
val_binary_accuracy,0.82776
val_loss,0.35054


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: i9v13sag with config:
[34m[1mwandb[0m: 	batch_size: 8
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▃▆▇█
epoch,▁▃▅▆█
loss,█▇▅▂▁
val_binary_accuracy,▁█▄▆█
val_loss,█▆▄▃▁

0,1
best_epoch,4.0
best_val_loss,0.36935
binary_accuracy,0.86657
epoch,4.0
loss,0.34452
val_binary_accuracy,0.82111
val_loss,0.36935


[34m[1mwandb[0m: Agent Starting Run: 64iz2c8d with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.5
[34m[1mwandb[0m: 	embedding_dim: 64
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: rmsprop
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='24.441 MB of 24.441 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▁▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
best_epoch,2.0
best_val_loss,0.1274
binary_accuracy,0.95609
epoch,2.0
loss,0.13197
val_binary_accuracy,0.95781
val_loss,0.1274


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: tlq33p7c with config:
[34m[1mwandb[0m: 	batch_size: 4
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	weight_decay: 0.05


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


VBox(children=(Label(value='73.271 MB of 73.271 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇▇████
epoch,▁▂▃▅▆▇█
loss,█▂▂▁▁▁▁
val_binary_accuracy,▁▅▆▇███
val_loss,█▃▂▂▁▁▁

0,1
best_epoch,6.0
best_val_loss,0.11108
binary_accuracy,0.96494
epoch,6.0
loss,0.10532
val_binary_accuracy,0.96344
val_loss,0.11108


[34m[1mwandb[0m: Agent Starting Run: au83gr0w with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 32
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/3
Epoch 2/3
Epoch 3/3


VBox(children=(Label(value='18.339 MB of 18.339 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
binary_accuracy,▁▇█
epoch,▁▅█
loss,█▂▁
val_binary_accuracy,▁▆█
val_loss,█▃▁

0,1
best_epoch,2.0
best_val_loss,0.12478
binary_accuracy,0.95536
epoch,2.0
loss,0.13204
val_binary_accuracy,0.95798
val_loss,0.12478


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: bqlsm0i1 with config:
[34m[1mwandb[0m: 	batch_size: 2
[34m[1mwandb[0m: 	dropout: 0.4
[34m[1mwandb[0m: 	embedding_dim: 128
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 0.005
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_decay: 0.0005


Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7