**Import libraries**

In [None]:
!pip install wandb

Collecting wandb
  Downloading wandb-0.12.15-py2.py3-none-any.whl (1.8 MB)
[K     |████████████████████████████████| 1.8 MB 4.3 MB/s 
Collecting setproctitle
  Downloading setproctitle-1.2.3-cp37-cp37m-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl (29 kB)
Collecting GitPython>=1.0.0
  Downloading GitPython-3.1.27-py3-none-any.whl (181 kB)
[K     |████████████████████████████████| 181 kB 58.5 MB/s 
[?25hCollecting pathtools
  Downloading pathtools-0.1.2.tar.gz (11 kB)
Collecting sentry-sdk>=1.0.0
  Downloading sentry_sdk-1.5.10-py2.py3-none-any.whl (144 kB)
[K     |████████████████████████████████| 144 kB 61.9 MB/s 
Collecting docker-pycreds>=0.4.0
  Downloading docker_pycreds-0.4.0-py2.py3-none-any.whl (9.0 kB)
Collecting shortuuid>=0.5.0
  Downloading shortuuid-1.0.8-py3-none-any.whl (9.5 kB)
Collecting gitdb<5,>=4.0.1
  Downloading gitdb-4.0.9-py3-none-any.whl (63 kB)
[K     |████████████████████████████████| 63 kB 1.4 MB/s 
Collecting smm

In [None]:
import shutil
import math
import numpy as np
import pandas as pd
import wandb
from wandb.keras import WandbCallback

import keras
from keras.models import Model
from keras.layers import Input, Embedding, SimpleRNN, LSTM, GRU, Dense  
from tensorflow.keras.optimizers import Adam

**Downloading the dataset**

In [None]:
# Download the Dakshina v1.0 archive from Google Cloud Storage. `-L` follows
# redirects and `-o` saves the file as "dakshina_dataset_v1.0.tar" in the current
# working directory.
!curl --header "Host: storage.googleapis.com" --header "User-Agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/89.0.4389.128 Safari/537.36 Edg/89.0.774.77" --header "Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.9" --header "Accept-Language: en-US,en;q=0.9" --header "Referer: https://github.com/google-research-datasets/dakshina" "https://storage.googleapis.com/gresearch/dakshina/dakshina_dataset_v1.0.tar" -L -o "dakshina_dataset_v1.0.tar"
# Extract the archive into /content/.
# NOTE(review): curl writes to the working directory while this reads from
# /content/ — assumes the notebook runs with /content as its cwd; confirm.
shutil.unpack_archive("/content/dakshina_dataset_v1.0.tar",'/content/')

  % Total    % Received % Xferd  Average Speed   Time    Time     Time  Current
                                 Dload  Upload   Total   Spent    Left  Speed
100 1915M  100 1915M    0     0  67.8M      0  0:00:28  0:00:28 --:--:-- 90.7M


**Preparing the dataset**

In [None]:
# Locations of the train / dev / test transliteration lexicon TSV files under the
# "hi" directory of the extracted archive; each is read by load_data() below.
TRAIN_PATH = "/content/dakshina_dataset_v1.0/hi/lexicons/hi.translit.sampled.train.tsv"
VAL_PATH = "/content/dakshina_dataset_v1.0/hi/lexicons/hi.translit.sampled.dev.tsv"
TEST_PATH = "/content/dakshina_dataset_v1.0/hi/lexicons/hi.translit.sampled.test.tsv"

# Function used to load data from a given path
def load_data(path):
  """Read a tab-separated lexicon file and return its source/target word lists.

  The file must have exactly three header-less columns, interpreted as
  Devanagari word, Romanized word and attestation count.

  Args:
    path: Path of the TSV file to read.

  Returns:
    A tuple ``(input_texts, target_texts)`` of equal-length lists, where
    ``input_texts`` holds the Romanized words and ``target_texts`` holds the
    Devanagari words wrapped as ``'S' + word + 'E'`` (start / end tokens).
  """
  # Every field is read as text and ONLY an empty field counts as missing.
  # With pandas' default NA parsing, literal words such as "nan", "null" or "NA"
  # become NaN and the dropna() below would silently discard real entries.
  df = pd.read_csv(path, sep='\t', header=None, dtype=str,
                   keep_default_na=False, na_values=[''])
  df.columns = ['Devanagari', 'Romanized', 'Attestations']
  # Rows with a genuinely empty field are unusable as training pairs.
  df = df.dropna()
  input_texts = df['Romanized'].tolist()
  target_texts = ['S' + word + 'E' for word in df['Devanagari']]
  return input_texts, target_texts

#loading training , testing and validation data
train_texts, train_target_texts = load_data(TRAIN_PATH)
val_texts, val_target_texts = load_data(VAL_PATH)
test_texts, test_target_texts = load_data(TEST_PATH)
print("Number of training samples: ", len(train_texts))
print("Number of validation samples: ", len(val_texts))
print("Number of testing samples: ", len(test_texts))


train_indices = np.arange(len(train_texts))
val_indices = np.arange(len(val_texts))
test_indices = np.arange(len(test_texts))

# Only the training and validation orders are shuffled; the test split keeps file order.
np.random.shuffle(train_indices)
np.random.shuffle(val_indices)

# Used to store vocabulary of source and target language
input_characters = set()
target_characters = set()

# Target texts carrying the start token "S" and the end token "E".
# load_data() has already wrapped every target as "S" + word + "E", so the texts
# are used as they are; wrapping them again here would give every word two start
# and two end tokens.
train_target_texts_processed = list(train_target_texts)
val_target_texts_processed = list(val_target_texts)
test_target_texts_processed = list(test_target_texts)

# Collect the character vocabulary over all three splits
for split_inputs, split_targets in (
    (train_texts, train_target_texts_processed),
    (val_texts, val_target_texts_processed),
    (test_texts, test_target_texts_processed),
):
    for text in split_inputs:
        input_characters.update(text)
    for text in split_targets:
        target_characters.update(text)

# Re-order every split according to its index array
input_texts = [train_texts[idx] for idx in train_indices]
target_texts = [train_target_texts_processed[idx] for idx in train_indices]

val_input_texts = [val_texts[idx] for idx in val_indices]
val_target_texts = [val_target_texts_processed[idx] for idx in val_indices]

test_input_texts = [test_texts[idx] for idx in test_indices]
test_target_texts = [test_target_texts_processed[idx] for idx in test_indices]

# Creating sorted vocabulary of source and target language
input_characters = sorted(input_characters)
target_characters = sorted(target_characters)

# Add pad tokens (" " is the pad token and always gets index 0)
input_characters.insert(0, " ")
target_characters.insert(0, " ")

# Creating essential parameters
num_encoder_tokens = len(input_characters)
num_decoder_tokens = len(target_characters)
max_encoder_seq_length = max(len(text) for text in input_texts)
max_decoder_seq_length = max(len(text) for text in target_texts)
val_max_encoder_seq_length = max(len(text) for text in val_input_texts)
val_max_decoder_seq_length = max(len(text) for text in val_target_texts)

test_max_encoder_seq_length = max(len(text) for text in test_input_texts)
test_max_decoder_seq_length = max(len(text) for text in test_target_texts)

# Mapping each character of vocabulary to index
input_token_index = {char: idx for idx, char in enumerate(input_characters)}
target_token_index = {char: idx for idx, char in enumerate(target_characters)}


def _encode_split(split_inputs, split_targets, encoder_len, decoder_len):
    """Turn one split into padded index arrays.

    Reads the globals input_token_index, target_token_index and num_decoder_tokens.

    Returns a tuple (encoder_input, decoder_input, decoder_target):
      encoder_input  -- (n, encoder_len) source character indices, pad-filled
      decoder_input  -- (n, decoder_len) target character indices, pad-filled
      decoder_target -- (n, decoder_len, num_decoder_tokens) one-hot targets: the
                        decoder input shifted one step to the left, with the pad
                        token as target for every remaining position
    where n is the number of samples in THIS split.
    """
    n_samples = len(split_inputs)
    pad_in = input_token_index[" "]
    pad_out = target_token_index[" "]
    encoder_input = np.full((n_samples, encoder_len), pad_in, dtype="float32")
    decoder_input = np.full((n_samples, decoder_len), pad_out, dtype="float32")
    decoder_target = np.zeros((n_samples, decoder_len, num_decoder_tokens), dtype="float32")

    for row, (source, target) in enumerate(zip(split_inputs, split_targets)):
        for step, char in enumerate(source):
            encoder_input[row, step] = input_token_index[char]
        for step, char in enumerate(target):
            decoder_input[row, step] = target_token_index[char]
            if step > 0:
                # the target is one step ahead of the decoder input
                decoder_target[row, step - 1, target_token_index[char]] = 1.0
        # everything after the last real target character is padding
        decoder_target[row, max(len(target) - 1, 0):, pad_out] = 1.0
    return encoder_input, decoder_input, decoder_target


# Training data
encoder_input_data, decoder_input_data, decoder_target_data = _encode_split(
    input_texts, target_texts, max_encoder_seq_length, max_decoder_seq_length)

# Validation data -- sized by the validation split itself, so the arrays contain
# no extra all-zero rows that would distort the validation loss and accuracy
val_encoder_input_data, val_decoder_input_data, val_decoder_target_data = _encode_split(
    val_input_texts, val_target_texts, val_max_encoder_seq_length, val_max_decoder_seq_length)

# Testing data -- sized by the test split itself
test_encoder_input_data, test_decoder_input_data, test_decoder_target_data = _encode_split(
    test_input_texts, test_target_texts, test_max_encoder_seq_length, test_max_decoder_seq_length)

# creating inverse map which maps integer to character
inverse_input_token_index = {idx: char for char, idx in input_token_index.items()}
inverse_target_token_index = {idx: char for char, idx in target_token_index.items()}

Number of training samples:  44202
Number of validation samples:  4358
Number of testing samples:  4502


In [None]:
# Labelled summary figures of the prepared dataset
for label, value in (
    ("Number of samples:", len(input_texts)),
    ("Number of unique input tokens:", num_encoder_tokens),
    ("Number of unique output tokens:", num_decoder_tokens),
    ("Max sequence length for train inputs:", max_encoder_seq_length),
    ("Max sequence length for train outputs:", max_decoder_seq_length),
    ("Max sequence length for val inputs:", val_max_encoder_seq_length),
    ("Max sequence length for val outputs:", val_max_decoder_seq_length),
):
    print(label, value)

# Vocabularies, their index maps, and the encoded form of training sample 10
for item in (
    input_characters,
    target_characters,
    input_token_index,
    target_token_index,
    encoder_input_data[10],
    decoder_input_data[10],
    decoder_target_data[10],
):
    print(item)

Number of samples: 44202
Number of unique input tokens: 27
Number of unique output tokens: 66
Max sequence length for train inputs: 20
Max sequence length for train outputs: 23
Max sequence length for val inputs: 18
Max sequence length for val outputs: 18
[' ', 'a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j', 'k', 'l', 'm', 'n', 'o', 'p', 'q', 'r', 's', 't', 'u', 'v', 'w', 'x', 'y', 'z']
[' ', 'E', 'S', 'ँ', 'ं', 'ः', 'अ', 'आ', 'इ', 'ई', 'उ', 'ऊ', 'ऋ', 'ए', 'ऐ', 'ऑ', 'ओ', 'औ', 'क', 'ख', 'ग', 'घ', 'ङ', 'च', 'छ', 'ज', 'झ', 'ञ', 'ट', 'ठ', 'ड', 'ढ', 'ण', 'त', 'थ', 'द', 'ध', 'न', 'प', 'फ', 'ब', 'भ', 'म', 'य', 'र', 'ल', 'व', 'श', 'ष', 'स', 'ह', '़', 'ा', 'ि', 'ी', 'ु', 'ू', 'ृ', 'ॅ', 'े', 'ै', 'ॉ', 'ो', 'ौ', '्', 'ॐ']
{' ': 0, 'a': 1, 'b': 2, 'c': 3, 'd': 4, 'e': 5, 'f': 6, 'g': 7, 'h': 8, 'i': 9, 'j': 10, 'k': 11, 'l': 12, 'm': 13, 'n': 14, 'o': 15, 'p': 16, 'q': 17, 'r': 18, 's': 19, 't': 20, 'u': 21, 'v': 22, 'w': 23, 'x': 24, 'y': 25, 'z': 26}
{' ': 0, 'E': 1, 'S': 2, 'ँ': 3, 'ं': 4, 'ः

**Defining Transliteration Model**

In [None]:
class TransliterationModel(object):
  """Character-level encoder-decoder transliteration model driven by a config object.

  The config is read for: cell_type ('RNN', 'LSTM' or 'GRU'), input_embedding_size,
  num_encoder_layers, num_decoder_layers, dropout, learning_rate, batch_size,
  epochs and decoding_strategy, plus the hidden size (``hidden_units`` or
  ``hidden_size``) and the beam width (``beam_width`` or ``beam_sizes``).

  The methods also read these notebook-level globals: num_encoder_tokens,
  num_decoder_tokens, val_decoder_input_data, val_decoder_target_data,
  target_token_index, inverse_target_token_index and max_decoder_seq_length.
  """

  def __init__(self, config):
    self.config = config

  def _config_value(self, *names):
    """Return the first of the config entries ``names`` that exists.

    The sweep definition in this notebook uses ``hidden_size`` / ``beam_sizes``
    while this class historically read ``hidden_units`` / ``beam_width``; accepting
    both spellings keeps either kind of config working.

    Raises:
      AttributeError: if the config defines none of the names.
    """
    for name in names:
      try:
        return getattr(self.config, name)
      except (AttributeError, KeyError):
        # a missing key may surface as either exception depending on the config type
        continue
    raise AttributeError("config defines none of: " + ", ".join(names))

  def _cell_spec(self):
    """Return ``(recurrent layer class, number of state tensors)`` for config.cell_type.

    Raises:
      ValueError: if cell_type is not 'RNN', 'LSTM' or 'GRU'.
    """
    # resolved lazily so the class can be defined before the Keras names are used
    specs = {'RNN': (SimpleRNN, 1), 'LSTM': (LSTM, 2), 'GRU': (GRU, 1)}
    cell_type = self.config.cell_type
    if cell_type not in specs:
      raise ValueError(f"Unsupported cell_type: {cell_type!r}")
    return specs[cell_type]

  @staticmethod
  def _strip_tokens(text):
    """Remove the pad (' '), start ('S') and end ('E') tokens from ``text``."""
    return text.replace(' ', '').replace('S', '').replace('E', '')

  def train_and_evaluate(self, encoder_input_data, decoder_input_data, decoder_target_data,
                         val_encoder_input_data, val_target_texts):
    """Build and train the seq2seq model, then log word-level validation accuracy.

    Args:
      encoder_input_data: training inputs of the encoder.
      decoder_input_data: training inputs of the decoder.
      decoder_target_data: training targets of the decoder.
      val_encoder_input_data: validation encoder inputs; row ``i`` is decoded and
        compared with ``val_target_texts[i]``.
      val_target_texts: validation target strings (start/end tokens are stripped
        before the comparison).

    Side effects: fits the model with a WandbCallback, saves it to
    "transliteration_model", prints sample predictions, and logs
    'validation_word_accuracy' (running value, every 100 words) and
    'word_val_accuracy' (final value) to wandb.
    """
    cell_class, _ = self._cell_spec()
    hidden_units = self._config_value('hidden_units', 'hidden_size')

    # Encoder
    encoder_inputs = Input(shape=(None, ), name='Encoder_inputs')

    # Embedding layer: (num_encoder_tokens, input_embedding_size)
    encoder_outputs = Embedding(num_encoder_tokens, self.config.input_embedding_size,
                                mask_zero=True, name='Encoder_embeddings')(encoder_inputs)

    # Stacked encoder layers; each layer after the first starts from the final
    # state(s) of the layer below it.
    encoder_states = None
    for layer_idx in range(self.config.num_encoder_layers):
      encoder_layer = cell_class(hidden_units,
                                 dropout=self.config.dropout,
                                 return_sequences=True,
                                 return_state=True,
                                 name=f"Encoder_{layer_idx}")
      encoder_outputs, *encoder_states = encoder_layer(encoder_outputs, initial_state=encoder_states)

    # Decoder
    decoder_inputs = Input(shape=(None,), name='Decoder_inputs')

    # Embedding layer: (num_decoder_tokens, hidden_units)
    decoder_outputs = Embedding(num_decoder_tokens, hidden_units,
                                mask_zero=True, name='Decoder_embeddings')(decoder_inputs)

    # Every decoder layer is initialised with the final encoder state(s)
    for layer_idx in range(self.config.num_decoder_layers):
      decoder_layer = cell_class(hidden_units,
                                 dropout=self.config.dropout,
                                 return_sequences=True,
                                 return_state=True,
                                 name=f"Decoder_{layer_idx}")
      decoder_outputs, *_ = decoder_layer(decoder_outputs, initial_state=encoder_states)
    decoder_outputs = Dense(num_decoder_tokens, activation='softmax', name='dense')(decoder_outputs)

    # Defining our Seq2seq model
    model = Model([encoder_inputs, decoder_inputs], decoder_outputs)
    optimizer = Adam(learning_rate=self.config.learning_rate, beta_1=0.9, beta_2=0.999)
    model.compile(loss="categorical_crossentropy", optimizer=optimizer,
                  metrics=['accuracy'])
    model.fit(
        [encoder_input_data, decoder_input_data],
        decoder_target_data,
        batch_size=self.config.batch_size,
        epochs=self.config.epochs,
        # the decoder-side validation arrays are notebook globals (not parameters)
        validation_data=([val_encoder_input_data, val_decoder_input_data], val_decoder_target_data),
        callbacks = [WandbCallback()]
    )

    model.save("transliteration_model")

    encoder, decoder = self._build_inference_models(model)

    # finding validation accuracy and logging it into wandb
    total, correct = 0, 0
    output_list, target_list = [], []
    for i in range(len(val_target_texts)):
      output = self._strip_tokens(self.decode_to_text(val_encoder_input_data[i:i+1], encoder, decoder))
      target = self._strip_tokens(val_target_texts[i])
      output_list.append(output)
      target_list.append(target)
      if output == target:
        correct += 1
      total += 1
      if i % 100 == 0:
        # show the most recent (up to 100) prediction -> target pairs
        print(dict(zip(output_list[-100:], target_list[-100:])))
        wandb.log({'validation_word_accuracy' : correct / total})
    word_val_accuracy = correct / total if total else 0.0
    wandb.log({'word_val_accuracy' : word_val_accuracy})

  def _build_inference_models(self, model):
    """Split the trained model into step-wise ``(encoder, decoder)`` inference models.

    encoder: encoder input -> final state(s) of the last encoder layer.
    decoder: [decoder input, states of every decoder layer...] ->
             [token probabilities, updated states of every decoder layer...].
    The state order is layer by layer (for LSTM: hidden then context per layer).
    """
    _, states_per_layer = self._cell_spec()
    hidden_units = self._config_value('hidden_units', 'hidden_size')

    last_encoder = model.get_layer(f'Encoder_{self.config.num_encoder_layers-1}')
    # the layer output is [sequence output, state(s)...]; only the states are needed
    encoder_states = list(last_encoder.output[1:])
    encoder = Model(model.input[0], encoder_states)

    decoder_inputs = model.input[1]
    decoder_outputs = model.get_layer('Decoder_embeddings')(decoder_inputs)
    decoder_states_inputs, decoder_states = [], []
    for i in range(self.config.num_decoder_layers):
      states = [keras.Input(shape=(hidden_units,)) for _ in range(states_per_layer)]
      decoder_outputs, *new_states = model.get_layer(f'Decoder_{i}')(decoder_outputs, initial_state=states)
      decoder_states += new_states
      decoder_states_inputs += states
    decoder_outputs = model.get_layer('dense')(decoder_outputs)
    decoder = Model([decoder_inputs] + decoder_states_inputs, [decoder_outputs] + decoder_states)
    return encoder, decoder

  def decode_to_text(self, inputs, encoder, decoder):
    """Decode one encoded input sequence to text.

    Uses a beam of width 1 when config.decoding_strategy is 'greedy', otherwise the
    configured beam width. The returned string may end with the end token "E".
    """
    if self.config.decoding_strategy == 'greedy':
      beam_width = 1
    else:
      beam_width = self._config_value('beam_width', 'beam_sizes')
    return self.beam_search_decoder(inputs, encoder, decoder, beam_width)

  def beam_search_decoder(self, inputs, encoder, decoder, beam_width):
    """Beam-search decode ``inputs`` and return the best hypothesis as a string.

    Args:
      inputs: encoder input for a single sample.
      encoder: object whose ``predict(inputs)`` returns the encoder state(s).
      decoder: object whose ``predict([token] + states)`` returns
        ``[token probabilities, new states...]``.
      beam_width: number of hypotheses kept per step (values below 1 are treated as 1).

    Returns:
      The characters of the lowest-cost hypothesis (cost = summed negative log
      probability). A hypothesis is finished once it ends with "E" or is longer
      than max_decoder_seq_length characters.
    """
    beam_width = max(1, int(beam_width))
    vocab_size = len(inverse_target_token_index)

    # Encode once. predict() yields a single array for one-state cells and a list
    # of arrays otherwise; every decoder layer starts from the same encoder state(s),
    # laid out flat in the order the decoder model expects.
    encoded = encoder.predict(inputs, verbose=0)
    if not isinstance(encoded, (list, tuple)):
      encoded = [encoded]
    initial_states = list(encoded) * self.config.num_decoder_layers

    # Decoder input begins with Start Token "S"
    start_token = np.array([[target_token_index["S"]]])

    # each entry: [score, finished flag, next decoder input, states, token ids, chars]
    sequences = [[0.0, 0, start_token, initial_states, [], []]]
    done = False
    while not done:
      candidates = []
      for score, finished, last_token, states, tokens, chars in sequences:
        if finished:
          # a finished hypothesis stays in the beam and keeps competing with the
          # extensions of the unfinished ones
          candidates.append([score, finished, last_token, states, tokens, chars])
          continue
        output = decoder.predict([last_token] + list(states), verbose=0)
        prob = np.asarray(output[0])[0, -1, :vocab_size]
        next_states = list(output[1:])
        # clip so that a zero probability gives a large finite cost instead of inf
        neg_log = -np.log(np.clip(prob, 1e-12, 1.0))
        # only the beam_width cheapest extensions of a hypothesis can survive the
        # global top-beam_width cut below
        for j in np.argsort(neg_log, kind='stable')[:beam_width]:
          j = int(j)
          candidates.append([score + float(neg_log[j]), 0, np.array([[j]]), next_states,
                             tokens + [j], chars + [inverse_target_token_index[j]]])

      sequences = sorted(candidates, key=lambda candidate: candidate[0])[:beam_width]
      for sequence in sequences:
        if (len(sequence[5]) > max_decoder_seq_length) or (sequence[5][-1] == "E"):
          sequence[1] = 1
      # stop when every hypothesis is finished or the best one has reached "E"
      done = all(sequence[1] for sequence in sequences) or sequences[0][5][-1] == "E"
    return ''.join(sequences[0][5])

**Defining the Sweep Hyperparameter dictionary**

In [None]:
wandb.login()

# Bayesian sweep that maximises the final word-level validation accuracy.
# Every hyperparameter is a discrete choice; the comprehension expands each
# (name, choices) pair into the {'values': [...]} form of the sweep config.
sweep_config = {
    'method': 'bayes',
    'metric': {'name': 'word_val_accuracy', 'goal': 'maximize'},
    'parameters': {
        name: {'values': choices}
        for name, choices in (
            ('dropout', [0, 0.2, 0.3]),
            ('learning_rate', [0.001, 0.0001, 0.0003, 0.0005]),
            ('batch_size', [64, 128, 256]),
            ('input_embedding_size', [32, 64, 128, 256, 512]),
            ('num_encoder_layers', [1, 2, 3, 4]),
            ('num_decoder_layers', [1, 2, 3, 4]),
            ('hidden_size', [32, 64, 128, 256, 512]),
            ('cell_type', ['RNN', 'LSTM', 'GRU']),
            ('decoding_strategy', ['beam_search', 'greedy']),
            ('beam_sizes', [3, 5, 7]),
            ('epochs', [5, 10, 15, 20]),
        )
    },
}

# Register the sweep and show the ID that agents need to join it
sweep_id = wandb.sweep(sweep_config, project="Assigment3_Q2", entity="cs21s006_cs21s043")
print('sweep_id: ', sweep_id)

Create sweep with ID: alseo6jh
Sweep URL: https://wandb.ai/cs21s006_cs21s043/Assigment3_Q2/sweeps/alseo6jh
sweep_id:  alseo6jh


In [None]:
def spawn_fn():
      """Run one sweep trial: open a wandb run, name it after its hyperparameters,
      then train and evaluate a TransliterationModel on the notebook's global arrays."""
      with wandb.init(project="Assignment3_Q2", entity="cs21s006_cs21s043"):
        config = wandb.config

        # (label, value) pairs, concatenated in this order to form the run name
        name_parts = (
            ('ep-', config.epochs),
            ('-dr-', config.dropout),
            ('-lr-', config.learning_rate),
            ('-bs', config.batch_size),
            ('-es-', config.input_embedding_size),
            ('-el-', config.num_encoder_layers),
            ('-dl-', config.num_decoder_layers),
            ('-hs-', config.hidden_size),
            ('-cell-', config.cell_type),
            ('-dec_str-', config.decoding_strategy),
            ('-bs-', config.beam_sizes),
        )
        wandb.run.name = ''.join(label + str(value) for label, value in name_parts)

        model_transliteration = TransliterationModel(config)
        model_transliteration.train_and_evaluate(
            encoder_input_data,
            decoder_input_data,
            decoder_target_data,
            val_encoder_input_data,
            val_target_texts,
        )

**Only 15 sweep runs completed from this cell**

In [None]:
# Launch a sweep agent that calls spawn_fn for at most 50 runs of sweep "ajlstr1d".
# NOTE(review): this hard-coded ID differs from the ID printed by the sweep-creation
# cell — confirm whether `sweep_id` was meant here.
wandb.agent("ajlstr1d", function=spawn_fn, count=50)

[34m[1mwandb[0m: Agent Starting Run: 3khcbuep with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_size: 256
[34m[1mwandb[0m: 	input_embedding_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 1
[34m[1mwandb[0m: 	num_encoder_layers: 2


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='16.260 MB of 16.260 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▃▅▇█
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_accuracy,▁▃▆▇█
val_loss,█▆▃▂▁
validation_word_accuracy,▄▃▁▄▅▇▇▆▇▇█████▇▇▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▅▅▅▅▅▅▅▅
word_val_accuracy,▁

0,1
accuracy,0.71727
best_epoch,4.0
best_val_loss,0.04051
epoch,4.0
loss,0.36769
val_accuracy,0.74877
val_loss,0.04051
validation_word_accuracy,0.12851
word_val_accuracy,0.1285


[34m[1mwandb[0m: Agent Starting Run: wrva5utm with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 2


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='133.783 MB of 133.783 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0,…

0,1
accuracy,▁▂▃▄▄▅▆▆▆▇▇▇▇▇▇█████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▆▅▅▄▄▃▃▂▂▂▂▂▂▁▁▁▁▁▁
val_accuracy,▁▂▃▄▅▆▆▆▇▇▇▇████████
val_loss,█▇▅▄▄▃▃▂▂▂▂▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▂▃▁▄▆██▇██▇███▇▇▇▇▇▇████████▇▇▇▇▇▇▇▇▇▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.91007
best_epoch,19.0
best_val_loss,0.02277
epoch,19.0
loss,0.11228
val_accuracy,0.85692
val_loss,0.02277
validation_word_accuracy,0.32322
word_val_accuracy,0.32331


[34m[1mwandb[0m: Agent Starting Run: rw6vd4jf with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	input_embedding_size: 128
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 2


Epoch 1/15
Epoch 2/15
Epoch 3/15
Epoch 4/15
Epoch 5/15
Epoch 6/15
Epoch 7/15
Epoch 8/15
Epoch 9/15
Epoch 10/15
Epoch 11/15
Epoch 12/15
Epoch 13/15
Epoch 14/15
Epoch 15/15


VBox(children=(Label(value='2.103 MB of 2.103 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
accuracy,▁▃▄▄▅▆▆▇▇▇▇████
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▆▅▄▄▃▃▂▂▂▁▁▁▁▁
val_accuracy,▁▂▃▄▅▆▆▇▇▇▇████
val_loss,█▆▆▄▄▃▂▂▂▂▁▁▁▁▁
validation_word_accuracy,▁█▂▃▄▄▃▃▅▆▇█▇█▇███▇█▇█▇█████▇▇▇▇▇▇▇▇▇▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.77946
best_epoch,14.0
best_val_loss,0.03032
epoch,14.0
loss,0.28092
val_accuracy,0.81147
val_loss,0.03032
validation_word_accuracy,0.22989
word_val_accuracy,0.22946


[34m[1mwandb[0m: Agent Starting Run: oo3285pb with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: RNN
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	input_embedding_size: 128
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='0.750 MB of 0.750 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
accuracy,▁▅▆▇█
epoch,▁▃▅▆█
loss,█▄▃▂▁
val_accuracy,▁▄▆▇█
val_loss,█▅▃▂▁
validation_word_accuracy,▃█▃▂▁▁▂▂▂▂▂▂▃▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▂▁▁▁▁▁▁▁
word_val_accuracy,▁

0,1
accuracy,0.53797
best_epoch,4.0
best_val_loss,0.07258
epoch,4.0
loss,0.65402
val_accuracy,0.58395
val_loss,0.07258
validation_word_accuracy,0.01586
word_val_accuracy,0.01583


[34m[1mwandb[0m: Agent Starting Run: ur9u5vct with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: RNN
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.0003
[34m[1mwandb[0m: 	num_decoder_layers: 1
[34m[1mwandb[0m: 	num_encoder_layers: 4


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='0.595 MB of 0.595 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
accuracy,▁▆▇██
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_accuracy,▁▆▇██
val_loss,█▅▃▂▁
validation_word_accuracy,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁██▇▇▇▇▆▆▆▆▆▆▅▅▅▅▅▅▅▅
word_val_accuracy,▁

0,1
accuracy,0.3621
best_epoch,4.0
best_val_loss,0.1171
epoch,4.0
loss,0.96712
val_accuracy,0.3686
val_loss,0.1171
validation_word_accuracy,0.00023
word_val_accuracy,0.00023


[34m[1mwandb[0m: Agent Starting Run: jllt7kyx with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: RNN
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_size: 256
[34m[1mwandb[0m: 	input_embedding_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	num_decoder_layers: 3
[34m[1mwandb[0m: 	num_encoder_layers: 4


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='10.485 MB of 10.485 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▅▇▇█
epoch,▁▃▅▆█
loss,█▄▂▁▁
val_accuracy,▁▅▆▇█
val_loss,█▄▂▂▁
validation_word_accuracy,▃█▁▄▃▂▂▂▃▃▃▄▄▄▄▄▄▄▄▄▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃
word_val_accuracy,▁

0,1
accuracy,0.78406
best_epoch,4.0
best_val_loss,0.03784
epoch,4.0
loss,0.28301
val_accuracy,0.76795
val_loss,0.03784
validation_word_accuracy,0.17839
word_val_accuracy,0.17806


[34m[1mwandb[0m: Agent Starting Run: ex8e0fzf with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hidden_size: 256
[34m[1mwandb[0m: 	input_embedding_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.0003
[34m[1mwandb[0m: 	num_decoder_layers: 1
[34m[1mwandb[0m: 	num_encoder_layers: 3


Epoch 1/15
Epoch 2/15
Epoch 3/15
Epoch 4/15
Epoch 5/15
Epoch 6/15
Epoch 7/15
Epoch 8/15
Epoch 9/15
Epoch 10/15
Epoch 11/15
Epoch 12/15
Epoch 13/15
Epoch 14/15
Epoch 15/15


VBox(children=(Label(value='21.903 MB of 21.903 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▂▃▄▄▅▅▆▆▆▇▇▇██
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▆▅▅▄▄▃▃▃▂▂▂▁▁▁
val_accuracy,▁▂▂▃▄▅▅▆▆▆▇▇▇██
val_loss,█▇▆▅▅▄▄▃▃▂▂▂▂▁▁
validation_word_accuracy,▁▄▆▇▆▆▆▆▇▇▇███▇▇▇▇▇█████▇▇▇▆▆▆▆▆▇▇▆▆▆▆▇▆
word_val_accuracy,▁

0,1
accuracy,0.71767
best_epoch,14.0
best_val_loss,0.04484
epoch,14.0
loss,0.36668
val_accuracy,0.72265
val_loss,0.04484
validation_word_accuracy,0.08851
word_val_accuracy,0.08834


[34m[1mwandb[0m: Agent Starting Run: 817pb5g2 with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: RNN
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 128
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 4


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='46.743 MB of 46.743 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▅▆▇█
epoch,▁▃▅▆█
loss,█▄▃▂▁
val_accuracy,▁▄▅▇█
val_loss,█▅▃▁▁
validation_word_accuracy,▁▁▄▅▆█▇▆▆▆▆▇███▇▇▆▆▇▇▇▇▇▇▇▆▆▆▆▆▆▆▆▆▆▆▇▆▆
word_val_accuracy,▁

0,1
accuracy,0.63378
best_epoch,4.0
best_val_loss,0.06953
epoch,4.0
loss,0.48994
val_accuracy,0.59661
val_loss,0.06953
validation_word_accuracy,0.00667
word_val_accuracy,0.00665


[34m[1mwandb[0m: Agent Starting Run: 5ni4obj4 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_size: 256
[34m[1mwandb[0m: 	input_embedding_size: 256
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 4


Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


VBox(children=(Label(value='48.695 MB of 48.695 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▂▃▅▆▆▇▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▅▄▃▂▂▁▁▁
val_accuracy,▁▂▄▅▆▇▇███
val_loss,█▇▅▄▃▂▂▁▁▁
validation_word_accuracy,▁▃▃▇▆▇▆▆▆▇▇▇██▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.80219
best_epoch,9.0
best_val_loss,0.03079
epoch,9.0
loss,0.25094
val_accuracy,0.80221
val_loss,0.03079
validation_word_accuracy,0.22046
word_val_accuracy,0.22006


[34m[1mwandb[0m: Agent Starting Run: dkdeyqlu with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	input_embedding_size: 128
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 2
[34m[1mwandb[0m: 	num_encoder_layers: 2


Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


VBox(children=(Label(value='0.566 MB of 0.566 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
accuracy,▁▄▅▅▆▆▇▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▅▄▄▃▃▂▂▁▁
val_accuracy,▁▂▃▄▅▅▆▇▇█
val_loss,█▆▅▄▄▃▂▂▁▁
validation_word_accuracy,▁▇▄▅▄▄▆▆▇▇██▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▆▆▆
word_val_accuracy,▁

0,1
accuracy,0.55678
best_epoch,9.0
best_val_loss,0.07382
epoch,9.0
loss,0.60709
val_accuracy,0.56997
val_loss,0.07382
validation_word_accuracy,0.01287
word_val_accuracy,0.01285


[34m[1mwandb[0m: Agent Starting Run: fl3g8zoj with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	input_embedding_size: 256
[34m[1mwandb[0m: 	learning_rate: 0.0003
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 3


Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


VBox(children=(Label(value='1.245 MB of 1.245 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
accuracy,▁▂▃▄▆▆▇▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▅▄▄▃▂▂▁▁
val_accuracy,▁▁▃▄▅▆▇▇██
val_loss,█▇▆▅▄▃▂▂▁▁
validation_word_accuracy,▁█▅▄▅▅▄▄▄▄▅▄▅▄▄▄▅▅▄▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅
word_val_accuracy,▁

0,1
accuracy,0.47488
best_epoch,9.0
best_val_loss,0.08749
epoch,9.0
loss,0.73918
val_accuracy,0.49691
val_loss,0.08749
validation_word_accuracy,0.0069
word_val_accuracy,0.00688


[34m[1mwandb[0m: Agent Starting Run: 5omb6k9z with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 3
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='2.468 MB of 2.468 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
accuracy,▁▄▆▇█
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_accuracy,▁▄▅▇█
val_loss,█▆▄▂▁
validation_word_accuracy,▁▁▄█▆▅▅▄▄▃▄▄▄▄▄▃▄▄▃▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅
word_val_accuracy,▁

0,1
accuracy,0.47315
best_epoch,4.0
best_val_loss,0.08565
epoch,4.0
loss,0.74557
val_accuracy,0.51269
val_loss,0.08565
validation_word_accuracy,0.00506
word_val_accuracy,0.00505


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: lskdcqfk with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_size: 128
[34m[1mwandb[0m: 	input_embedding_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	num_decoder_layers: 2
[34m[1mwandb[0m: 	num_encoder_layers: 3


Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


VBox(children=(Label(value='7.265 MB of 7.265 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
accuracy,▁▃▅▆▇▇▇███
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▅▄▃▃▂▂▁▁▁
val_accuracy,▁▄▅▆▆▇▇▇██
val_loss,█▆▅▄▃▂▂▂▁▁
validation_word_accuracy,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁██▇▇▇▇▇▇▆▆▆
word_val_accuracy,▁

0,1
accuracy,0.40398
best_epoch,9.0
best_val_loss,0.10331
epoch,9.0
loss,0.84724
val_accuracy,0.41117
val_loss,0.10331
validation_word_accuracy,0.00023
word_val_accuracy,0.00023


[34m[1mwandb[0m: Agent Starting Run: vkioczb9 with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/15
Epoch 2/15
Epoch 3/15
Epoch 4/15
Epoch 5/15
Epoch 6/15
Epoch 7/15
Epoch 8/15
Epoch 9/15
Epoch 10/15
Epoch 11/15
Epoch 12/15
Epoch 13/15
Epoch 14/15
Epoch 15/15


In [None]:
# Attach a W&B sweep agent to sweep "ajlstr1d": each job the sweep controller
# hands out is executed by calling spawn_fn (defined outside this cell), and
# the agent stops after at most 20 runs.
wandb.agent(
    "ajlstr1d",
    function=spawn_fn,
    count=20,
)

[34m[1mwandb[0m: Agent Starting Run: n3t3hivm with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 3
[34m[1mwandb[0m: 	num_encoder_layers: 1
[34m[1mwandb[0m: Currently logged in as: [33mcs21s043[0m (use `wandb login --relogin` to force relogin)


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='97.110 MB of 97.110 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▆▇██
epoch,▁▃▅▆█
loss,█▃▂▁▁
val_accuracy,▁▆▇██
val_loss,█▃▂▁▁
validation_word_accuracy,▁█▄▇▅▅▅▅▅▄▃▃▄▅▅▅▅▆▅▅▅▅▅▅▅▅▄▅▅▅▅▅▅▅▅▅▅▅▅▅
word_val_accuracy,▁

0,1
accuracy,0.88585
best_epoch,4.0
best_val_loss,0.02157
epoch,4.0
loss,0.14348
val_accuracy,0.85762
val_loss,0.02157
validation_word_accuracy,0.32851
word_val_accuracy,0.3279


[34m[1mwandb[0m: Agent Starting Run: b3lhdphv with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.0003
[34m[1mwandb[0m: 	num_decoder_layers: 3
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/15
Epoch 2/15
Epoch 3/15
Epoch 4/15
Epoch 5/15
Epoch 6/15
Epoch 7/15
Epoch 8/15
Epoch 9/15
Epoch 10/15
Epoch 11/15
Epoch 12/15
Epoch 13/15
Epoch 14/15
Epoch 15/15


VBox(children=(Label(value='97.110 MB of 97.110 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▃▅▆▆▇▇▇▇██████
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▅▄▃▂▂▂▂▁▁▁▁▁▁▁
val_accuracy,▁▄▅▆▇▇▇████████
val_loss,█▄▃▂▂▂▂▁▁▁▁▁▁▁▁
validation_word_accuracy,▁▆▆█▇▇▇▇▇▇▇▇▇█▇█████████████████████████
word_val_accuracy,▁

0,1
accuracy,0.9155
best_epoch,14.0
best_val_loss,0.02074
epoch,14.0
loss,0.10742
val_accuracy,0.86561
val_loss,0.02074
validation_word_accuracy,0.35103
word_val_accuracy,0.35062


[34m[1mwandb[0m: Agent Starting Run: b14lzzpa with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


VBox(children=(Label(value='121.144 MB of 121.144 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0,…

0,1
accuracy,▁▅▆▇▇▇████
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▄▂▂▂▂▁▁▁▁
val_accuracy,▁▅▇▇▇█████
val_loss,█▄▂▂▁▁▁▁▁▁
validation_word_accuracy,▁▇▆▇█▇██▇▇▇▇▇█▇█████████████████████████
word_val_accuracy,▁

0,1
accuracy,0.95179
best_epoch,8.0
best_val_loss,0.02076
epoch,9.0
loss,0.0608
val_accuracy,0.87152
val_loss,0.02116
validation_word_accuracy,0.36253
word_val_accuracy,0.36209


[34m[1mwandb[0m: Agent Starting Run: 97jkzf33 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hidden_size: 256
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/15
Epoch 2/15
Epoch 3/15
Epoch 4/15
Epoch 5/15
Epoch 6/15
Epoch 7/15
Epoch 8/15
Epoch 9/15
Epoch 10/15
Epoch 11/15
Epoch 12/15
Epoch 13/15
Epoch 14/15
Epoch 15/15


VBox(children=(Label(value='33.698 MB of 33.698 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▃▅▆▆▇▇▇▇▇█████
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▆▄▃▂▂▂▂▂▁▁▁▁▁▁
val_accuracy,▁▄▆▆▇▇▇████████
val_loss,█▅▃▃▂▂▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁▅▂▇▇▆▅▃▅▅▅▄▅▅▅▅▅▇▇█▇▇▇█▇██████████▇▇▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.91729
best_epoch,13.0
best_val_loss,0.0241
epoch,14.0
loss,0.10905
val_accuracy,0.84625
val_loss,0.02417
validation_word_accuracy,0.30874
word_val_accuracy,0.3084


[34m[1mwandb[0m: Agent Starting Run: yjvjq7vh with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 2


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='145.181 MB of 145.181 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0,…

0,1
accuracy,▁▅▆▇▇▇██████████████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▄▃▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▅▇▇████████████████
val_loss,█▃▂▁▁▁▁▁▂▂▂▂▂▂▂▂▃▃▃▃
validation_word_accuracy,▁▆▆▇▇▇█▇▇▇▇▇▇▇▇▇▇███████████████████████
word_val_accuracy,▁

0,1
accuracy,0.98492
best_epoch,5.0
best_val_loss,0.02057
epoch,19.0
loss,0.0194
val_accuracy,0.87238
val_loss,0.02645
validation_word_accuracy,0.3577
word_val_accuracy,0.3575


[34m[1mwandb[0m: Agent Starting Run: 174veenp with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.0003
[34m[1mwandb[0m: 	num_decoder_layers: 3
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/15
Epoch 2/15
Epoch 3/15
Epoch 4/15
Epoch 5/15
Epoch 6/15
Epoch 7/15
Epoch 8/15
Epoch 9/15
Epoch 10/15
Epoch 11/15
Epoch 12/15
Epoch 13/15
Epoch 14/15
Epoch 15/15


VBox(children=(Label(value='73.157 MB of 73.157 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▄▆▆▇▇▇▇███████
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▄▃▂▂▂▂▁▁▁▁▁▁▁▁
val_accuracy,▁▅▆▇▇██████████
val_loss,█▄▂▂▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁▅▆▇████▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.94786
best_epoch,12.0
best_val_loss,0.01891
epoch,14.0
loss,0.06501
val_accuracy,0.88003
val_loss,0.01937
validation_word_accuracy,0.37954
word_val_accuracy,0.3793


[34m[1mwandb[0m: Agent Starting Run: gh46sicv with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='110.505 MB of 110.505 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0,…

0,1
accuracy,▁▃▅▆▆▇▇▇▇▇██████████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▆▄▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▄▆▇▇███████████████
val_loss,█▅▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁▄▅█▇███▇▇▇▇▇█▇█▇███▇██████████▇▇▇▇▇▇▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.96871
best_epoch,11.0
best_val_loss,0.01993
epoch,19.0
loss,0.0378
val_accuracy,0.87457
val_loss,0.02217
validation_word_accuracy,0.36437
word_val_accuracy,0.36416


[34m[1mwandb[0m: Agent Starting Run: 81q5x5vp with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 2
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='73.070 MB of 73.070 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▄▆▆▇▇▇▇▇███████████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▄▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▅▆▇▇███████████████
val_loss,█▄▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁▇██▇▇▇▇▇▆▆▆▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▆▇
word_val_accuracy,▁

0,1
accuracy,0.98084
best_epoch,9.0
best_val_loss,0.02075
epoch,19.0
loss,0.02609
val_accuracy,0.87002
val_loss,0.02318
validation_word_accuracy,0.35954
word_val_accuracy,0.35957


[34m[1mwandb[0m: Agent Starting Run: yud4fw4k with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 256
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='115.065 MB of 115.065 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0,…

0,1
accuracy,▁▅▆▇▇▇▇█████████████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▄▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▅▇▇████████████████
val_loss,█▃▂▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂
validation_word_accuracy,▁▄▆▇▇██▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.98324
best_epoch,6.0
best_val_loss,0.02041
epoch,19.0
loss,0.02099
val_accuracy,0.87509
val_loss,0.02569
validation_word_accuracy,0.36345
word_val_accuracy,0.36324


[34m[1mwandb[0m: Agent Starting Run: qw0fnj1i with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 256
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 3
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/15
Epoch 2/15
Epoch 3/15
Epoch 4/15
Epoch 5/15
Epoch 6/15
Epoch 7/15
Epoch 8/15
Epoch 9/15
Epoch 10/15
Epoch 11/15
Epoch 12/15
Epoch 13/15
Epoch 14/15
Epoch 15/15


VBox(children=(Label(value='68.577 MB of 68.577 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▃▅▆▇▇▇▇▇██████
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▅▄▃▂▂▂▂▁▁▁▁▁▁▁
val_accuracy,▁▄▆▇▇▇█████████
val_loss,█▅▃▂▂▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁▄▅▆▆▇▇▇▇▇▆▆▇███████████▇▇██████████████
word_val_accuracy,▁

0,1
accuracy,0.93834
best_epoch,14.0
best_val_loss,0.01887
epoch,14.0
loss,0.07689
val_accuracy,0.88101
val_loss,0.01887
validation_word_accuracy,0.38667
word_val_accuracy,0.38619


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 4u5i878i with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: RNN
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 2
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/15
Epoch 2/15
Epoch 3/15
Epoch 4/15
Epoch 5/15
Epoch 6/15
Epoch 7/15
Epoch 8/15
Epoch 9/15
Epoch 10/15
Epoch 11/15
Epoch 12/15
Epoch 13/15
Epoch 14/15
Epoch 15/15


VBox(children=(Label(value='19.018 MB of 19.018 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▄▅▆▆▆▇▇▇▇▇████
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▅▄▃▃▂▂▂▂▂▁▁▁▁▁
val_accuracy,▁▄▅▆▇▇▇████████
val_loss,█▄▃▂▁▁▁▁▁▁▂▂▂▂▃
validation_word_accuracy,▁▃▂▆▆▆▇▇█▇▆▆▇▇▇▇▆▇▇▇▇▆▆▆▇▇▆▆▆▆▆▆▆▆▆▆▆▆▆▆
word_val_accuracy,▁

0,1
accuracy,0.93983
best_epoch,4.0
best_val_loss,0.03087
epoch,14.0
loss,0.07219
val_accuracy,0.80807
val_loss,0.03443
validation_word_accuracy,0.22046
word_val_accuracy,0.22006


[34m[1mwandb[0m: Agent Starting Run: ojwyqs25 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 256
[34m[1mwandb[0m: 	learning_rate: 0.0003
[34m[1mwandb[0m: 	num_decoder_layers: 3
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='68.577 MB of 68.577 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▂▄▅▆▆▇▇▇▇▇▇▇███████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▆▅▄▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁
val_accuracy,▁▂▄▅▆▇▇▇████████████
val_loss,█▆▅▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁▇▆██▇▇▇▇▇▇▆▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.95028
best_epoch,19.0
best_val_loss,0.02088
epoch,19.0
loss,0.0677
val_accuracy,0.86944
val_loss,0.02088
validation_word_accuracy,0.35908
word_val_accuracy,0.35865


[34m[1mwandb[0m: Agent Starting Run: f4r6dym9 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: RNN
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/15
Epoch 2/15
Epoch 3/15
Epoch 4/15
Epoch 5/15
Epoch 6/15
Epoch 7/15
Epoch 8/15
Epoch 9/15
Epoch 10/15
Epoch 11/15
Epoch 12/15
Epoch 13/15
Epoch 14/15
Epoch 15/15


VBox(children=(Label(value='9.381 MB of 9.381 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
accuracy,▁▄▅▆▆▇▇▇▇▇█████
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
loss,█▄▃▃▂▂▂▂▂▁▁▁▁▁▁
val_accuracy,▁▄▆▆▇▇█████████
val_loss,█▄▃▂▂▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁▇▇██████▇▇▇▇▇▇▇▇█████████████████████▇▇
word_val_accuracy,▁

0,1
accuracy,0.93783
best_epoch,7.0
best_val_loss,0.02936
epoch,14.0
loss,0.07799
val_accuracy,0.81597
val_loss,0.03128
validation_word_accuracy,0.24368
word_val_accuracy,0.24323


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: fjdiiyto with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='91.202 MB of 91.202 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▅▆▇▇▇▇▇████████████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▃▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▆▇▇▇███████████████
val_loss,█▃▂▁▁▁▁▁▁▁▂▂▂▂▂▃▃▃▃▃
validation_word_accuracy,█▃▃▇▄▄▄▄▃▂▁▁▂▃▃▃▃▄▄▄▄▄▄▄▄▄▄▄▄▄▄▄▃▄▄▄▄▄▃▃
word_val_accuracy,▁

0,1
accuracy,0.97602
best_epoch,5.0
best_val_loss,0.01943
epoch,19.0
loss,0.02856
val_accuracy,0.88155
val_loss,0.02518
validation_word_accuracy,0.38161
word_val_accuracy,0.38137


[34m[1mwandb[0m: Agent Starting Run: ur7wftij with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 128
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='28.127 MB of 28.127 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▄▅▆▇▇▇▇▇▇██████████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▅▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▅▆▇▇███████████████
val_loss,█▄▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁▅▇█▇███▇▇▇▆▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.96313
best_epoch,11.0
best_val_loss,0.01989
epoch,19.0
loss,0.0434
val_accuracy,0.87553
val_loss,0.02248
validation_word_accuracy,0.36943
word_val_accuracy,0.36898


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: i8yvhk3p with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 3
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='73.157 MB of 73.157 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▅▆▇▇▇▇▇▇███████████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▄▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▆▇▇████████████████
val_loss,█▃▂▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂
validation_word_accuracy,▃▃▂█▅▅▇▅▄▃▂▁▂▄▃▃▄▅▆▅▆▆▆▆▅▅▅▅▄▅▄▄▄▅▅▅▅▅▅▅
word_val_accuracy,▁

0,1
accuracy,0.97756
best_epoch,8.0
best_val_loss,0.01886
epoch,19.0
loss,0.02719
val_accuracy,0.87867
val_loss,0.024
validation_word_accuracy,0.36644
word_val_accuracy,0.36622


[34m[1mwandb[0m: Agent Starting Run: hagwlhs9 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 256
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 2


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='104.672 MB of 104.672 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0,…

0,1
accuracy,▁▄▆▆▇▇▇▇▇███████████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▅▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▅▇▇▇███████████████
val_loss,█▄▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁▅▆▇▇▇▇▇▇▇▇▇▇████████████████████████▇▇█
word_val_accuracy,▁

0,1
accuracy,0.97262
best_epoch,9.0
best_val_loss,0.0195
epoch,19.0
loss,0.03339
val_accuracy,0.88129
val_loss,0.02182
validation_word_accuracy,0.37931
word_val_accuracy,0.37861


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: zzwembf9 with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: RNN
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 3


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20

[34m[1mwandb[0m: [32m[41mERROR[0m Error while calling W&B API: context deadline exceeded (<Response [500]>)


Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='40.331 MB of 40.331 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▄▅▆▆▇▇▇▇▇██████████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▄▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▅▆▆█████████▇▇▇▇▇█▇
val_loss,█▄▂▂▁▁▁▁▁▂▂▂▂▃▃▃▃▃▃▄
validation_word_accuracy,▁▅▆▇▇▇▇▇▇▆▆▆▆▇▇▇▇▇▇▇▇▇▇█████████████████
word_val_accuracy,▁

0,1
accuracy,0.94086
best_epoch,6.0
best_val_loss,0.02993
epoch,19.0
loss,0.06917
val_accuracy,0.80573
val_loss,0.03673
validation_word_accuracy,0.22667
word_val_accuracy,0.22625


[34m[1mwandb[0m: Agent Starting Run: agltfmht with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 3
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


VBox(children=(Label(value='73.157 MB of 73.157 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▅▆▇▇▇████
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▃▂▂▂▁▁▁▁▁
val_accuracy,▁▆▇▇██████
val_loss,█▃▂▁▁▁▁▁▁▁
validation_word_accuracy,▁▆▆▆▆▇▇▇▇▇▇▇▇▇▇▇█████████████████████▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.96859
best_epoch,6.0
best_val_loss,0.0201
epoch,9.0
loss,0.04103
val_accuracy,0.8759
val_loss,0.02147
validation_word_accuracy,0.36299
word_val_accuracy,0.36301


[34m[1mwandb[0m: Agent Starting Run: 42iy9gd7 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 256
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='115.065 MB of 115.065 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0,…

0,1
accuracy,▁▄▅▆▆▇▇▇▇▇██████████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▅▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▄▆▇▇▇██████████████
val_loss,█▄▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁██▇▆▆▆▆▅▅▅▅▅▅▅▅▅▆▆▆▆▆▆▆▆▅▅▅▆▆▆▆▆▆▆▆▆▆▆▆
word_val_accuracy,▁

0,1
accuracy,0.96683
best_epoch,12.0
best_val_loss,0.0211
epoch,19.0
loss,0.04204
val_accuracy,0.86872
val_loss,0.02247
validation_word_accuracy,0.35172
word_val_accuracy,0.35154


In [None]:
# Attach a W&B sweep agent to the existing sweep "ajlstr1d". The agent calls
# spawn_fn (defined outside this cell) once per configuration handed out by
# the sweep, and stops after at most 20 runs.
wandb.agent(
    "ajlstr1d",
    function=spawn_fn,
    count=20,
)

[34m[1mwandb[0m: Agent Starting Run: 182sh6tz with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 3
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='86.471 MB of 86.471 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▂▄▅▆▆▆▇▇▇▇▇▇███████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▆▅▄▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁
val_accuracy,▁▂▄▅▆▇▇▇████████████
val_loss,█▆▅▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁▇▄▆▄▄▆▆▅▆▅▅▆▆▆▆▇▇▇▇██▇██▇▇▇██████████▇█
word_val_accuracy,▁

0,1
accuracy,0.93276
best_epoch,19.0
best_val_loss,0.02005
epoch,19.0
loss,0.08368
val_accuracy,0.87452
val_loss,0.02005
validation_word_accuracy,0.36322
word_val_accuracy,0.36301


[34m[1mwandb[0m: Agent Starting Run: ied1rsb5 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 256
[34m[1mwandb[0m: 	learning_rate: 0.0003
[34m[1mwandb[0m: 	num_decoder_layers: 1
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='32.481 MB of 32.481 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▂▃▄▅▅▆▆▇▇▇▇▇███████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▆▆▅▄▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁
val_accuracy,▁▂▃▄▅▆▇▇▇▇██████████
val_loss,█▇▆▅▄▃▂▂▂▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▃▁▃█▃▄▆▅▄▄▁▁▂▄▃▄▅▅▅▅▅▆▅▆▅▆▆▆▆▆▆▆▆▆▆▆▆▅▅▅
word_val_accuracy,▁

0,1
accuracy,0.92014
best_epoch,19.0
best_val_loss,0.02083
epoch,19.0
loss,0.10207
val_accuracy,0.86875
val_loss,0.02083
validation_word_accuracy,0.3531
word_val_accuracy,0.35268


[34m[1mwandb[0m: Agent Starting Run: rvt2797a with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 256
[34m[1mwandb[0m: 	input_embedding_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 4


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='34.994 MB of 34.994 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▄▆▆▇▇▇▇▇███████████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▅▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▅▇▇████████████████
val_loss,█▄▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂
validation_word_accuracy,▁▅▅█▆▆▆▅▃▃▃▃▄▅▄▄▄▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅
word_val_accuracy,▁

0,1
accuracy,0.98076
best_epoch,7.0
best_val_loss,0.02185
epoch,19.0
loss,0.02405
val_accuracy,0.86223
val_loss,0.0283
validation_word_accuracy,0.32874
word_val_accuracy,0.32836


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: pqk5fk1g with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 128
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 3


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='120.432 MB of 120.432 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0,…

0,1
accuracy,▁▆▇▇▇███████████████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▃▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▆▇█████████████████
val_loss,█▃▁▁▁▁▂▂▂▂▃▃▃▃▃▄▄▄▄▄
validation_word_accuracy,▁█▇█▇▇▇▇▇▆▆▆▆▆▆▆▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.98502
best_epoch,3.0
best_val_loss,0.02016
epoch,19.0
loss,0.01962
val_accuracy,0.87625
val_loss,0.02688
validation_word_accuracy,0.37241
word_val_accuracy,0.37219


[34m[1mwandb[0m: Agent Starting Run: p5ebszqd with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='91.202 MB of 91.202 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▄▆▆▇▇▇▇▇███████████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▅▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▅▇▇▇███████████████
val_loss,█▄▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁█▅▇▆▆▇▆▆▆▅▄▅▆▅▅▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▅▅▅▅
word_val_accuracy,▁

0,1
accuracy,0.98439
best_epoch,8.0
best_val_loss,0.02039
epoch,19.0
loss,0.02062
val_accuracy,0.87253
val_loss,0.02477
validation_word_accuracy,0.35747
word_val_accuracy,0.35727


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: yos76c1v with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='91.202 MB of 91.202 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▄▅▆▇▇▇▇▇▇██████████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▅▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▅▆▇▇███████████████
val_loss,█▄▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▅▁▃▆▄▅▅▅▄▄▄▃▄▅▅▆▆▇▇██▇█▇▇▇▇▇▇▇▇▇▇▇██████
word_val_accuracy,▁

0,1
accuracy,0.97313
best_epoch,9.0
best_val_loss,0.01946
epoch,19.0
loss,0.0336
val_accuracy,0.87853
val_loss,0.02207
validation_word_accuracy,0.37241
word_val_accuracy,0.37219


[34m[1mwandb[0m: Agent Starting Run: 4lykdz6u with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 256
[34m[1mwandb[0m: 	learning_rate: 0.0003
[34m[1mwandb[0m: 	num_decoder_layers: 1
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='32.481 MB of 32.481 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▄▆▆▇▇▇▇▇▇██████████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▅▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▅▇▇▇███████████████
val_loss,█▄▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂
validation_word_accuracy,▁▆██▇▇▇▇▇▇▆▆▇▇▆▇▇▇▇▇▇▇▇▇▇▇▆▆▇▇▇▇▇▇▇▇▇▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.98139
best_epoch,8.0
best_val_loss,0.02062
epoch,19.0
loss,0.02457
val_accuracy,0.86837
val_loss,0.02592
validation_word_accuracy,0.3469
word_val_accuracy,0.34672


[34m[1mwandb[0m: Agent Starting Run: o5w6jnmp with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 128
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='84.333 MB of 84.333 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▃▄▄▄▄▅▅▅▆▆▆▆▇▇▇▇███
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▆▅▅▄▄▄▃▃▃▃▃▂▂▂▂▁▁▁▁
val_accuracy,▁▂▂▃▃▄▄▄▅▅▅▆▆▆▇▇▇███
val_loss,█▇▆▆▅▅▄▄▄▃▃▃▃▂▂▂▂▁▁▁
validation_word_accuracy,▁▄▆▆██████▇▇▇▇▇▇▇▇▇▇▇▇██████████████████
word_val_accuracy,▁

0,1
accuracy,0.67079
best_epoch,19.0
best_val_loss,0.05811
epoch,19.0
loss,0.44375
val_accuracy,0.65562
val_loss,0.05811
validation_word_accuracy,0.03448
word_val_accuracy,0.03442


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: zk822sv9 with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 256
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 3
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


[34m[1mwandb[0m: [32m[41mERROR[0m Error while calling W&B API: Error 1040: Too many connections (<Response [500]>)
[34m[1mwandb[0m: Network error (HTTPError), entering retry loop.
[34m[1mwandb[0m: [32m[41mERROR[0m Error while calling W&B API: Error 1040: Too many connections (<Response [500]>)


VBox(children=(Label(value='68.577 MB of 68.577 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▅▆▇▇▇██████████████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▆▇█████████████████
val_loss,█▃▂▁▁▁▁▁▁▂▂▂▂▂▂▃▃▃▃▃
validation_word_accuracy,▁█▅▇▄▆▇█▇▇▅▄▅▆▆▇▇█▇█▇▇▇▇▇▇▆▆▆▆▆▆▆▆▇▆▆▆▆▇
word_val_accuracy,▁

0,1
accuracy,0.98532
best_epoch,4.0
best_val_loss,0.02026
epoch,19.0
loss,0.01896
val_accuracy,0.87778
val_loss,0.02649
validation_word_accuracy,0.37195
word_val_accuracy,0.3715


[34m[1mwandb[0m: Agent Starting Run: 7hzwoppv with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: RNN
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 1
[34m[1mwandb[0m: 	num_encoder_layers: 4


Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


VBox(children=(Label(value='28.292 MB of 28.292 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▄▆▆▇▇▇███
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▄▃▃▂▂▂▁▁▁
val_accuracy,▁▄▅▆▇█████
val_loss,█▄▃▂▁▁▁▁▁▁
validation_word_accuracy,▁▆▁▄▂▂▄▂▅▅▅▆▅▇▆▆▆▆▆▆▆▇▆▇▇▇▇▇▇▇█████▇▇▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.84667
best_epoch,7.0
best_val_loss,0.0374
epoch,9.0
loss,0.18765
val_accuracy,0.77104
val_loss,0.03773
validation_word_accuracy,0.16322
word_val_accuracy,0.16315


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: ugzu8ubm with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 256
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 1
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


VBox(children=(Label(value='32.481 MB of 32.481 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▅▆▇▇▇████
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▃▂▂▂▁▁▁▁▁
val_accuracy,▁▆▇▇██████
val_loss,█▃▂▁▁▁▁▁▁▁
validation_word_accuracy,▁█▆▆▆▆▇▆▅▅▅▄▅▅▅▆▅▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆
word_val_accuracy,▁

0,1
accuracy,0.96511
best_epoch,6.0
best_val_loss,0.02045
epoch,9.0
loss,0.04465
val_accuracy,0.87183
val_loss,0.02249
validation_word_accuracy,0.35448
word_val_accuracy,0.35475


[34m[1mwandb[0m: Agent Starting Run: xe6meklv with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 256
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 3
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


VBox(children=(Label(value='91.031 MB of 91.031 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▄▆▆▇▇▇▇▇███████████
epoch,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
loss,█▄▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▅▇▇▇███████████████
val_loss,█▄▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▂█▄▅▃▅▄▃▄▃▂▂▂▃▃▃▃▃▃▃▂▂▂▂▂▁▁▁▁▁▂▂▁▁▁▁▁▁▁▁
word_val_accuracy,▁

0,1
accuracy,0.97638
best_epoch,9.0
best_val_loss,0.01949
epoch,19.0
loss,0.0289
val_accuracy,0.87861
val_loss,0.02261
validation_word_accuracy,0.37471
word_val_accuracy,0.37448


[34m[1mwandb[0m: Agent Starting Run: 6dgfj91b with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 128
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


VBox(children=(Label(value='84.333 MB of 84.333 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▄▇██
epoch,▁▃▅▆█
loss,█▄▂▁▁
val_accuracy,▁▅▇██
val_loss,█▃▂▁▁
validation_word_accuracy,▁▇▄█▆▇▅▆▆▅▄▄▄▅▄▅▅▆▇▆▇██▇▇██████▇▇██▇▇▇▆▆
word_val_accuracy,▁

0,1
accuracy,0.86567
best_epoch,4.0
best_val_loss,0.02477
epoch,4.0
loss,0.17065
val_accuracy,0.8438
val_loss,0.02477
validation_word_accuracy,0.30782
word_val_accuracy,0.30748


[34m[1mwandb[0m: Agent Starting Run: 3zp3srti with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 20
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.0005
[34m[1mwandb[0m: 	num_decoder_layers: 1
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/20
Epoch 2/20
Epoch 3/20

In [None]:
# Attach a W&B sweep agent to the existing sweep "96qio1zu". The agent calls
# spawn_fn (defined outside this cell) once per configuration handed out by
# the sweep, and stops after at most 20 runs.
wandb.agent(
    "96qio1zu",
    function=spawn_fn,
    count=20,
)

[34m[1mwandb[0m: Agent Starting Run: yux58zfg with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 30
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 128
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 3
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/30
Epoch 2/30
Epoch 3/30
Epoch 4/30
Epoch 5/30
Epoch 6/30
Epoch 7/30
Epoch 8/30
Epoch 9/30
Epoch 10/30
Epoch 11/30
Epoch 12/30
Epoch 13/30
Epoch 14/30
Epoch 15/30
Epoch 16/30
Epoch 17/30
Epoch 18/30
Epoch 19/30
Epoch 20/30
Epoch 21/30
Epoch 22/30
Epoch 23/30
Epoch 24/30
Epoch 25/30
Epoch 26/30
Epoch 27/30
Epoch 28/30
Epoch 29/30
Epoch 30/30


VBox(children=(Label(value='66.288 MB of 66.288 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▅▆▇▇▇▇███████████████████████
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▆▇███████████████████████████
val_loss,█▃▂▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▃
validation_word_accuracy,▁▁▄▃▆▆▆█▇█▇███▇████▇▇▇▇▇██▇▇▇▇▇▇██▇▇▇▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.97291
best_epoch,5.0
best_val_loss,0.01962
epoch,29.0
loss,0.0316
val_accuracy,0.87558
val_loss,0.02788
validation_word_accuracy,0.36575
word_val_accuracy,0.36553


[34m[1mwandb[0m: Agent Starting Run: 7huyo8sj with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: RNN
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 30
[34m[1mwandb[0m: 	hidden_size: 256
[34m[1mwandb[0m: 	input_embedding_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	num_decoder_layers: 2
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/30
Epoch 2/30
Epoch 3/30
Epoch 4/30
Epoch 5/30
Epoch 6/30
Epoch 7/30
Epoch 8/30
Epoch 9/30
Epoch 10/30
Epoch 11/30
Epoch 12/30
Epoch 13/30
Epoch 14/30
Epoch 15/30

[34m[1mwandb[0m: Network error (HTTPError), entering retry loop.


Epoch 16/30
Epoch 17/30
Epoch 18/30
Epoch 19/30
Epoch 20/30
Epoch 21/30
Epoch 22/30
Epoch 23/30
Epoch 24/30
Epoch 25/30
Epoch 26/30
Epoch 27/30
Epoch 28/30
Epoch 29/30
Epoch 30/30


VBox(children=(Label(value='4.420 MB of 4.420 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
accuracy,▁▃▄▅▅▆▆▆▆▇▇▇▇▇▇▇▇▇▇███████████
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▆▅▄▃▃▃▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▃▄▅▅▆▆▆▇▇▇▇▇▇▇▇▇▇████████████
val_loss,█▆▅▄▃▃▃▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁█▆▆█▇▇▇███▇█▇▇█████████████████████████
word_val_accuracy,▁

0,1
accuracy,0.79056
best_epoch,29.0
best_val_loss,0.031
epoch,29.0
loss,0.262
val_accuracy,0.80308
val_loss,0.031
validation_word_accuracy,0.2131
word_val_accuracy,0.21294


[34m[1mwandb[0m: Agent Starting Run: homttswc with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 30
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 128
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 3
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/30
Epoch 2/30
Epoch 3/30
Epoch 4/30
Epoch 5/30
Epoch 6/30
Epoch 7/30
Epoch 8/30
Epoch 9/30
Epoch 10/30
Epoch 11/30
Epoch 12/30
Epoch 13/30
Epoch 14/30
Epoch 15/30
Epoch 16/30
Epoch 17/30
Epoch 18/30
Epoch 19/30
Epoch 20/30
Epoch 21/30
Epoch 22/30
Epoch 23/30
Epoch 24/30
Epoch 25/30
Epoch 26/30
Epoch 27/30
Epoch 28/30
Epoch 29/30
Epoch 30/30


VBox(children=(Label(value='66.288 MB of 66.288 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▅▆▇▇▇▇███████████████████████
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▄▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▆▇▇██████████████████████████
val_loss,█▃▂▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▃▃▃▃▃▃▃
validation_word_accuracy,▁▇▆▄█▇▇▇▆▆▆▆▆▇▆▇▇▇▇▇▇▇▇▇▇▆▆▆▆▆▆▆▇▆▆▆▆▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.97046
best_epoch,4.0
best_val_loss,0.01971
epoch,29.0
loss,0.03381
val_accuracy,0.87835
val_loss,0.02763
validation_word_accuracy,0.37379
word_val_accuracy,0.37425


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: xdu9pir3 with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 30
[34m[1mwandb[0m: 	hidden_size: 256
[34m[1mwandb[0m: 	input_embedding_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/30
Epoch 2/30
Epoch 3/30
Epoch 4/30
Epoch 5/30
Epoch 6/30
Epoch 7/30
Epoch 8/30
Epoch 9/30
Epoch 10/30
Epoch 11/30
Epoch 12/30
Epoch 13/30
Epoch 14/30
Epoch 15/30
Epoch 16/30
Epoch 17/30
Epoch 18/30
Epoch 19/30
Epoch 20/30
Epoch 21/30
Epoch 22/30
Epoch 23/30
Epoch 24/30
Epoch 25/30
Epoch 26/30
Epoch 27/30
Epoch 28/30
Epoch 29/30
Epoch 30/30


VBox(children=(Label(value='21.110 MB of 21.110 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▄▅▆▇▇▇▇▇▇▇███████████████████
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▅▃▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▅▆▇▇▇████████████████████████
val_loss,█▄▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁█▅▄▆▆▆▆▆▆▅▅▆▆▅▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆▆
word_val_accuracy,▁

0,1
accuracy,0.94267
best_epoch,11.0
best_val_loss,0.02097
epoch,29.0
loss,0.06585
val_accuracy,0.87238
val_loss,0.02422
validation_word_accuracy,0.35632
word_val_accuracy,0.35659


[34m[1mwandb[0m: Agent Starting Run: 13dgtu0p with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 30
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 3
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/30
Epoch 2/30
Epoch 3/30
Epoch 4/30
Epoch 5/30

[34m[1mwandb[0m: [32m[41mERROR[0m Error while calling W&B API: driver: bad connection (<Response [500]>)


Epoch 6/30
Epoch 7/30
Epoch 8/30
Epoch 9/30
Epoch 10/30
Epoch 11/30
Epoch 12/30
Epoch 13/30
Epoch 14/30
Epoch 15/30
Epoch 16/30
Epoch 17/30
Epoch 18/30
Epoch 19/30
Epoch 20/30
Epoch 21/30
Epoch 22/30
Epoch 23/30
Epoch 24/30
Epoch 25/30
Epoch 26/30
Epoch 27/30
Epoch 28/30
Epoch 29/30
Epoch 30/30


VBox(children=(Label(value='65.143 MB of 65.143 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▃▅▆▆▇▇▇▇▇████████████████████
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▅▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▅▆▇▇█████████████████████████
val_loss,█▄▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂
validation_word_accuracy,▁▆▇▆█▇▅▆▆▆▆▆▇▆▅▇▆▇█▇▇▇▇▇▇▇▇▇▇▆▇▇▇▇▇▇▇███
word_val_accuracy,▁

0,1
accuracy,0.97476
best_epoch,10.0
best_val_loss,0.02027
epoch,29.0
loss,0.02976
val_accuracy,0.87481
val_loss,0.02632
validation_word_accuracy,0.35908
word_val_accuracy,0.35888


[34m[1mwandb[0m: Agent Starting Run: y4fl5o3g with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 30
[34m[1mwandb[0m: 	hidden_size: 256
[34m[1mwandb[0m: 	input_embedding_size: 128
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/30
Epoch 2/30
Epoch 3/30
Epoch 4/30
Epoch 5/30
Epoch 6/30
Epoch 7/30
Epoch 8/30
Epoch 9/30
Epoch 10/30
Epoch 11/30
Epoch 12/30
Epoch 13/30
Epoch 14/30
Epoch 15/30
Epoch 16/30
Epoch 17/30
Epoch 18/30
Epoch 19/30
Epoch 20/30
Epoch 21/30
Epoch 22/30
Epoch 23/30
Epoch 24/30
Epoch 25/30
Epoch 26/30
Epoch 27/30
Epoch 28/30
Epoch 29/30
Epoch 30/30


VBox(children=(Label(value='21.984 MB of 21.984 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▄▆▆▇▇▇▇▇▇▇▇██████████████████
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▅▃▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▅▇▇▇█████████████████████████
val_loss,█▄▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁▅█▄▇▆▅▆▇▇▇▆▆▇▇▇▇▇▇▇▇▆▆▆▆▇▇▆▆▆▆▆▇▆▆▆▆▆▇▇
word_val_accuracy,▁

0,1
accuracy,0.95662
best_epoch,9.0
best_val_loss,0.01975
epoch,29.0
loss,0.0498
val_accuracy,0.87535
val_loss,0.02386
validation_word_accuracy,0.37126
word_val_accuracy,0.37127


[34m[1mwandb[0m: Agent Starting Run: u1kpdrzy with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 30
[34m[1mwandb[0m: 	hidden_size: 256
[34m[1mwandb[0m: 	input_embedding_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 2


Epoch 1/30
Epoch 2/30
Epoch 3/30
Epoch 4/30
Epoch 5/30
Epoch 6/30
Epoch 7/30
Epoch 8/30
Epoch 9/30
Epoch 10/30
Epoch 11/30
Epoch 12/30
Epoch 13/30
Epoch 14/30
Epoch 15/30
Epoch 16/30
Epoch 17/30
Epoch 18/30
Epoch 19/30
Epoch 20/30
Epoch 21/30
Epoch 22/30
Epoch 23/30
Epoch 24/30
Epoch 25/30
Epoch 26/30
Epoch 27/30
Epoch 28/30
Epoch 29/30
Epoch 30/30


VBox(children=(Label(value='25.933 MB of 25.933 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▃▅▆▆▇▇▇▇▇▇▇▇█████████████████
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▆▄▃▃▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▄▆▇▇▇████████████████████████
val_loss,█▅▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁▄▅▅▆▇▇▇▇███████████████████████████████
word_val_accuracy,▁

0,1
accuracy,0.94833
best_epoch,15.0
best_val_loss,0.01973
epoch,29.0
loss,0.06054
val_accuracy,0.8776
val_loss,0.02172
validation_word_accuracy,0.37379
word_val_accuracy,0.37357


[34m[1mwandb[0m: Agent Starting Run: vn73k0g3 with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 30
[34m[1mwandb[0m: 	hidden_size: 256
[34m[1mwandb[0m: 	input_embedding_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.0001
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 4


Epoch 1/30
Epoch 2/30
Epoch 3/30
Epoch 4/30
Epoch 5/30
Epoch 6/30
Epoch 7/30
Epoch 8/30
Epoch 9/30
Epoch 10/30
Epoch 11/30
Epoch 12/30
Epoch 13/30
Epoch 14/30
Epoch 15/30
Epoch 16/30
Epoch 17/30
Epoch 18/30
Epoch 19/30
Epoch 20/30
Epoch 21/30
Epoch 22/30
Epoch 23/30
Epoch 24/30
Epoch 25/30
Epoch 26/30
Epoch 27/30
Epoch 28/30
Epoch 29/30
Epoch 30/30


VBox(children=(Label(value='34.994 MB of 34.994 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▂▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇▇████
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▇▆▅▅▅▅▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▂▂▁▁▁▁▁
val_accuracy,▁▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇█████
val_loss,█▇▆▆▆▅▅▅▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▂▂▁▁▁▁▁
validation_word_accuracy,▁▆▄▄█▇▇▇▇▇▇▇▇▇▆▇████▇▇▇▇▇▇▇█████████████
word_val_accuracy,▁

0,1
accuracy,0.76101
best_epoch,29.0
best_val_loss,0.03574
epoch,29.0
loss,0.31208
val_accuracy,0.78595
val_loss,0.03574
validation_word_accuracy,0.18437
word_val_accuracy,0.18449


[34m[1mwandb[0m: Agent Starting Run: y9gdbnx7 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 40
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 256
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 1
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/40
Epoch 2/40
Epoch 3/40
Epoch 4/40
Epoch 5/40
Epoch 6/40
Epoch 7/40
Epoch 8/40
Epoch 9/40
Epoch 10/40
Epoch 11/40
Epoch 12/40
Epoch 13/40
Epoch 14/40
Epoch 15/40
Epoch 16/40
Epoch 17/40
Epoch 18/40
Epoch 19/40
Epoch 20/40
Epoch 21/40
Epoch 22/40
Epoch 23/40
Epoch 24/40
Epoch 25/40
Epoch 26/40
Epoch 27/40
Epoch 28/40
Epoch 29/40
Epoch 30/40
Epoch 31/40
Epoch 32/40
Epoch 33/40
Epoch 34/40
Epoch 35/40
Epoch 36/40
Epoch 37/40
Epoch 38/40
Epoch 39/40
Epoch 40/40


VBox(children=(Label(value='32.481 MB of 32.481 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▄▆▆▇▇▇▇▇███████████████████████████████
epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
loss,█▄▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▆▇█████████████████████████████████████
val_loss,█▃▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂
validation_word_accuracy,▁█▇▃█▇▅█▇▇▆▆▇▆▅▆▅▆▆▅▅▅▅▆▆▆▆▆▆▆▆▅▆▅▅▅▅▅▅▅
word_val_accuracy,▁

0,1
accuracy,0.98692
best_epoch,7.0
best_val_loss,0.02011
epoch,39.0
loss,0.01579
val_accuracy,0.8701
val_loss,0.03074
validation_word_accuracy,0.34529
word_val_accuracy,0.34534


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 50iehbp6 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 35
[34m[1mwandb[0m: 	hidden_size: 256
[34m[1mwandb[0m: 	input_embedding_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/35
Epoch 2/35
Epoch 3/35
Epoch 4/35
Epoch 5/35
Epoch 6/35
Epoch 7/35
Epoch 8/35
Epoch 9/35
Epoch 10/35
Epoch 11/35
Epoch 12/35
Epoch 13/35
Epoch 14/35
Epoch 15/35
Epoch 16/35
Epoch 17/35
Epoch 18/35
Epoch 19/35
Epoch 20/35
Epoch 21/35
Epoch 22/35
Epoch 23/35
Epoch 24/35
Epoch 25/35
Epoch 26/35
Epoch 27/35
Epoch 28/35
Epoch 29/35
Epoch 30/35
Epoch 31/35
Epoch 32/35
Epoch 33/35
Epoch 34/35
Epoch 35/35


VBox(children=(Label(value='21.401 MB of 21.401 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▂▄▅▅▆▆▇▇▇▇▇▇▇▇▇▇██████████████████
epoch,▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇███
loss,█▆▅▄▃▃▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▃▅▆▆▇▇▇███████████████████████████
val_loss,█▆▄▃▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁▄▅▅▇▇▆▇▇▇▇▆▇▇▇▇▇▇█████████▇█▇▇▇▇▇▇▇▇███
word_val_accuracy,▁

0,1
accuracy,0.94885
best_epoch,19.0
best_val_loss,0.02008
epoch,34.0
loss,0.05962
val_accuracy,0.87432
val_loss,0.02276
validation_word_accuracy,0.36759
word_val_accuracy,0.36783


[34m[1mwandb[0m: Agent Starting Run: upghza5l with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 30
[34m[1mwandb[0m: 	hidden_size: 256
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/30
Epoch 2/30
Epoch 3/30
Epoch 4/30
Epoch 5/30
Epoch 6/30
Epoch 7/30
Epoch 8/30
Epoch 9/30
Epoch 10/30
Epoch 11/30
Epoch 12/30
Epoch 13/30
Epoch 14/30
Epoch 15/30
Epoch 16/30
Epoch 17/30
Epoch 18/30
Epoch 19/30
Epoch 20/30
Epoch 21/30
Epoch 22/30
Epoch 23/30
Epoch 24/30
Epoch 25/30
Epoch 26/30
Epoch 27/30
Epoch 28/30
Epoch 29/30
Epoch 30/30


VBox(children=(Label(value='25.477 MB of 25.477 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▄▆▆▇▇▇▇▇▇▇▇██████████████████
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▅▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▅▆▇▇▇████████████████████████
val_loss,█▄▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▅▁▅▄█▆▅▆▅▅▅▅▆▅▅▅▅▅▆▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅▅
word_val_accuracy,▁

0,1
accuracy,0.96329
best_epoch,12.0
best_val_loss,0.01951
epoch,29.0
loss,0.04313
val_accuracy,0.87694
val_loss,0.02355
validation_word_accuracy,0.38023
word_val_accuracy,0.38068


[34m[1mwandb[0m: Agent Starting Run: 8xohvqz6 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 35
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 3
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/35
Epoch 2/35
Epoch 3/35
Epoch 4/35
Epoch 5/35
Epoch 6/35
Epoch 7/35
Epoch 8/35
Epoch 9/35
Epoch 10/35
Epoch 11/35
Epoch 12/35
Epoch 13/35
Epoch 14/35
Epoch 15/35
Epoch 16/35
Epoch 17/35
Epoch 18/35
Epoch 19/35
Epoch 20/35
Epoch 21/35
Epoch 22/35
Epoch 23/35
Epoch 24/35
Epoch 25/35
Epoch 26/35
Epoch 27/35
Epoch 28/35
Epoch 29/35
Epoch 30/35
Epoch 31/35
Epoch 32/35
Epoch 33/35
Epoch 34/35
Epoch 35/35


VBox(children=(Label(value='73.157 MB of 73.157 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▅▆▇▇▇▇████████████████████████████
epoch,▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇███
loss,█▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▆▇▇███████████████████████████████
val_loss,█▃▂▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▂▃▃▃▃▃▃▃
validation_word_accuracy,▄▅▄▂█▆▂▄▃▂▃▂▃▃▂▃▂▃▃▃▂▂▂▂▂▂▂▁▁▁▂▁▂▁▁▁▁▁▁▂
word_val_accuracy,▁

0,1
accuracy,0.98407
best_epoch,5.0
best_val_loss,0.01913
epoch,34.0
loss,0.01917
val_accuracy,0.87939
val_loss,0.02803
validation_word_accuracy,0.36966
word_val_accuracy,0.37012


[34m[1mwandb[0m: Agent Starting Run: ko2e5ks9 with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 30
[34m[1mwandb[0m: 	hidden_size: 256
[34m[1mwandb[0m: 	input_embedding_size: 128
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/30
Epoch 2/30
Epoch 3/30
Epoch 4/30
Epoch 5/30
Epoch 6/30
Epoch 7/30
Epoch 8/30
Epoch 9/30
Epoch 10/30
Epoch 11/30
Epoch 12/30
Epoch 13/30
Epoch 14/30
Epoch 15/30
Epoch 16/30
Epoch 17/30
Epoch 18/30
Epoch 19/30
Epoch 20/30
Epoch 21/30
Epoch 22/30
Epoch 23/30
Epoch 24/30
Epoch 25/30
Epoch 26/30
Epoch 27/30
Epoch 28/30
Epoch 29/30
Epoch 30/30


VBox(children=(Label(value='21.984 MB of 21.984 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▄▆▆▇▇▇▇▇▇▇███████████████████
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▄▃▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▅▇▇▇█████████████████████████
val_loss,█▄▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂
validation_word_accuracy,▁█▄▄▇▆▆█▇▇▆▆▇▇▇▇▇▇██▇█▇▇▇█▇▇████████████
word_val_accuracy,▁

0,1
accuracy,0.96445
best_epoch,9.0
best_val_loss,0.02006
epoch,29.0
loss,0.04065
val_accuracy,0.87233
val_loss,0.02585
validation_word_accuracy,0.3623
word_val_accuracy,0.36255


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: extn7301 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 35
[34m[1mwandb[0m: 	hidden_size: 256
[34m[1mwandb[0m: 	input_embedding_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/35
Epoch 2/35
Epoch 3/35
Epoch 4/35
Epoch 5/35
Epoch 6/35
Epoch 7/35
Epoch 8/35
Epoch 9/35
Epoch 10/35
Epoch 11/35
Epoch 12/35
Epoch 13/35
Epoch 14/35
Epoch 15/35
Epoch 16/35
Epoch 17/35
Epoch 18/35
Epoch 19/35
Epoch 20/35
Epoch 21/35
Epoch 22/35
Epoch 23/35
Epoch 24/35
Epoch 25/35
Epoch 26/35
Epoch 27/35
Epoch 28/35
Epoch 29/35
Epoch 30/35
Epoch 31/35
Epoch 32/35
Epoch 33/35
Epoch 34/35
Epoch 35/35


VBox(children=(Label(value='7.150 MB of 7.150 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
accuracy,▁▂▄▅▆▆▆▇▇▇▇▇▇▇▇▇███████████████████
epoch,▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇███
loss,█▆▅▄▃▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▃▅▆▇▇▇▇███████████████████████████
val_loss,█▆▄▃▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▃█▅▁▂▃▂▃▄▄▃▃▃▃▃▄▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▂▂▂▂▃▃▃▃
word_val_accuracy,▁

0,1
accuracy,0.95047
best_epoch,17.0
best_val_loss,0.0202
epoch,34.0
loss,0.05849
val_accuracy,0.87342
val_loss,0.02273
validation_word_accuracy,0.36207
word_val_accuracy,0.36209


[34m[1mwandb[0m: Agent Starting Run: x2puhth7 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 5
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	epochs: 40
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 512
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/40
Epoch 2/40
Epoch 3/40
Epoch 4/40
Epoch 5/40
Epoch 6/40
Epoch 7/40
Epoch 8/40
Epoch 9/40
Epoch 10/40
Epoch 11/40
Epoch 12/40
Epoch 13/40
Epoch 14/40
Epoch 15/40
Epoch 16/40
Epoch 17/40
Epoch 18/40
Epoch 19/40
Epoch 20/40
Epoch 21/40
Epoch 22/40
Epoch 23/40
Epoch 24/40
Epoch 25/40
Epoch 26/40
Epoch 27/40
Epoch 28/40
Epoch 29/40
Epoch 30/40
Epoch 31/40
Epoch 32/40
Epoch 33/40
Epoch 34/40
Epoch 35/40
Epoch 36/40
Epoch 37/40
Epoch 38/40
Epoch 39/40
Epoch 40/40


VBox(children=(Label(value='91.202 MB of 91.202 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▅▆▇▇▇▇█████████████████████████████████
epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
loss,█▄▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▆▇▇████████████████████████████████████
val_loss,█▃▂▁▁▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▃▂▃▃▃▃▃▃▃
validation_word_accuracy,▁█▇▄▇▅▅▅▅▅▄▄▅▅▅▅▅▅▅▅▄▄▅▅▅▅▅▅▅▅▅▅▅▄▄▄▄▄▄▄
word_val_accuracy,▁

0,1
accuracy,0.9836
best_epoch,5.0
best_val_loss,0.01985
epoch,39.0
loss,0.01936
val_accuracy,0.87668
val_loss,0.02916
validation_word_accuracy,0.3692
word_val_accuracy,0.36921


[34m[1mwandb[0m: Agent Starting Run: 8dxxg0c0 with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	epochs: 30
[34m[1mwandb[0m: 	hidden_size: 128
[34m[1mwandb[0m: 	input_embedding_size: 256
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/30
Epoch 2/30
Epoch 3/30
Epoch 4/30
Epoch 5/30
Epoch 6/30
Epoch 7/30
Epoch 8/30
Epoch 9/30
Epoch 10/30
Epoch 11/30
Epoch 12/30
Epoch 13/30
Epoch 14/30
Epoch 15/30
Epoch 16/30
Epoch 17/30
Epoch 18/30
Epoch 19/30
Epoch 20/30
Epoch 21/30
Epoch 22/30
Epoch 23/30
Epoch 24/30
Epoch 25/30
Epoch 26/30
Epoch 27/30
Epoch 28/30
Epoch 29/30
Epoch 30/30


VBox(children=(Label(value='6.598 MB of 6.598 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
accuracy,▁▃▄▅▆▆▆▇▇▇▇▇▇▇▇▇▇█████████████
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▆▅▄▃▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▃▄▆▆▇▇▇▇█████████████████████
val_loss,█▆▄▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁█▆▅▆▆▅▆▆▆▆▆▇▇▆▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▆▆▆▆▆▆▆▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.95448
best_epoch,17.0
best_val_loss,0.02251
epoch,29.0
loss,0.05888
val_accuracy,0.85228
val_loss,0.02548
validation_word_accuracy,0.30276
word_val_accuracy,0.30289


[34m[1mwandb[0m: Agent Starting Run: 7qrr3p7z with config:
[34m[1mwandb[0m: 	batch_size: 256
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: LSTM
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 40
[34m[1mwandb[0m: 	hidden_size: 256
[34m[1mwandb[0m: 	input_embedding_size: 128
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/40
Epoch 2/40
Epoch 3/40
Epoch 4/40
Epoch 5/40
Epoch 6/40
Epoch 7/40
Epoch 8/40
Epoch 9/40
Epoch 10/40
Epoch 11/40
Epoch 12/40
Epoch 13/40
Epoch 14/40
Epoch 15/40
Epoch 16/40
Epoch 17/40
Epoch 18/40
Epoch 19/40
Epoch 20/40
Epoch 21/40
Epoch 22/40
Epoch 23/40
Epoch 24/40
Epoch 25/40
Epoch 26/40
Epoch 27/40
Epoch 28/40
Epoch 29/40
Epoch 30/40
Epoch 31/40
Epoch 32/40
Epoch 33/40
Epoch 34/40
Epoch 35/40
Epoch 36/40
Epoch 37/40
Epoch 38/40
Epoch 39/40
Epoch 40/40


VBox(children=(Label(value='29.080 MB of 29.080 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▃▅▅▆▆▇▇▇▇▇▇▇▇▇▇████████████████████████
epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
loss,█▅▄▃▃▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▄▆▆▇▇▇█████████████████████████████████
val_loss,█▅▃▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▁▇▆▄██▇█▇▇▆▆▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▆▆▇▆▇▇▆▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.97455
best_epoch,15.0
best_val_loss,0.02087
epoch,39.0
loss,0.02998
val_accuracy,0.86976
val_loss,0.02642
validation_word_accuracy,0.35172
word_val_accuracy,0.35154


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: kz2rqupn with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 7
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: greedy
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 35
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 256
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 2


Epoch 1/35
Epoch 2/35
Epoch 3/35
Epoch 4/35
Epoch 5/35
Epoch 6/35
Epoch 7/35
Epoch 8/35
Epoch 9/35
Epoch 10/35
Epoch 11/35
Epoch 12/35
Epoch 13/35
Epoch 14/35
Epoch 15/35
Epoch 16/35
Epoch 17/35
Epoch 18/35
Epoch 19/35
Epoch 20/35
Epoch 21/35
Epoch 22/35
Epoch 23/35
Epoch 24/35
Epoch 25/35
Epoch 26/35
Epoch 27/35
Epoch 28/35
Epoch 29/35
Epoch 30/35
Epoch 31/35
Epoch 32/35
Epoch 33/35
Epoch 34/35
Epoch 35/35


VBox(children=(Label(value='104.672 MB of 104.672 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0,…

0,1
accuracy,▁▆▇▇▇▇█████████████████████████████
epoch,▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇███
loss,█▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▆▇████████████████████████████████
val_loss,█▃▁▁▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▃▃▄▄▄▄▄▄▄▄▄▄▄▄▄▄
validation_word_accuracy,▁▅▅▄▇█▇██▇▇██▇▇▇▇▇█▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇
word_val_accuracy,▁

0,1
accuracy,0.96648
best_epoch,3.0
best_val_loss,0.01949
epoch,34.0
loss,0.03861
val_accuracy,0.87651
val_loss,0.02726
validation_word_accuracy,0.37149
word_val_accuracy,0.37196


[34m[1mwandb[0m: Agent Starting Run: vsbhks4k with config:
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 35
[34m[1mwandb[0m: 	hidden_size: 512
[34m[1mwandb[0m: 	input_embedding_size: 256
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/35
Epoch 2/35
Epoch 3/35
Epoch 4/35
Epoch 5/35
Epoch 6/35
Epoch 7/35
Epoch 8/35
Epoch 9/35
Epoch 10/35
Epoch 11/35
Epoch 12/35
Epoch 13/35
Epoch 14/35
Epoch 15/35
Epoch 16/35
Epoch 17/35
Epoch 18/35
Epoch 19/35
Epoch 20/35
Epoch 21/35
Epoch 22/35
Epoch 23/35
Epoch 24/35
Epoch 25/35
Epoch 26/35
Epoch 27/35
Epoch 28/35
Epoch 29/35
Epoch 30/35
Epoch 31/35
Epoch 32/35
Epoch 33/35
Epoch 34/35
Epoch 35/35


VBox(children=(Label(value='86.623 MB of 86.623 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▆▇▇▇▇█████████████████████████████
epoch,▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇███
loss,█▃▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▆▇▇███████▇██▇█▇█▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇
val_loss,█▃▂▁▁▁▂▂▃▃▃▄▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▆▇▆▆▆▆
validation_word_accuracy,▁▇█▃▅▄▃▄▅▅▄▄▄▅▄▅▅▅▅▅▅▅▅▅▅▅▅▄▅▅▅▅▅▅▅▅▅▅▅▅
word_val_accuracy,▁

0,1
accuracy,0.94589
best_epoch,4.0
best_val_loss,0.02003
epoch,34.0
loss,0.06269
val_accuracy,0.86474
val_loss,0.02779
validation_word_accuracy,0.33632
word_val_accuracy,0.33685


[34m[1mwandb[0m: Agent Starting Run: k9r60n8i with config:
[34m[1mwandb[0m: 	batch_size: 128
[34m[1mwandb[0m: 	beam_sizes: 3
[34m[1mwandb[0m: 	cell_type: GRU
[34m[1mwandb[0m: 	decoding_strategy: beam_search
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	epochs: 30
[34m[1mwandb[0m: 	hidden_size: 256
[34m[1mwandb[0m: 	input_embedding_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	num_decoder_layers: 4
[34m[1mwandb[0m: 	num_encoder_layers: 1


Epoch 1/30
Epoch 2/30
Epoch 3/30
Epoch 4/30
Epoch 5/30
Epoch 6/30
Epoch 7/30
Epoch 8/30
Epoch 9/30
Epoch 10/30
Epoch 11/30
Epoch 12/30
Epoch 13/30
Epoch 14/30
Epoch 15/30
Epoch 16/30
Epoch 17/30
Epoch 18/30
Epoch 19/30
Epoch 20/30
Epoch 21/30
Epoch 22/30
Epoch 23/30
Epoch 24/30
Epoch 25/30
Epoch 26/30
Epoch 27/30
Epoch 28/30
Epoch 29/30
Epoch 30/30


VBox(children=(Label(value='21.110 MB of 21.110 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, m…

0,1
accuracy,▁▃▅▆▆▆▇▇▇▇▇▇▇▇████████████████
epoch,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇███
loss,█▆▄▃▃▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
val_accuracy,▁▄▆▇▇▇████████████████████████
val_loss,█▅▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_word_accuracy,▂▆▃▁▅▅▅▇▇▇▇▇▇▇▇▇▇▇██▇▇█▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▆▆
word_val_accuracy,▁

0,1
accuracy,0.94633
best_epoch,13.0
best_val_loss,0.02068
epoch,29.0
loss,0.0633
val_accuracy,0.87506
val_loss,0.02331
validation_word_accuracy,0.37839
word_val_accuracy,0.37838
