#### Library Imports

In [1]:
import torch
from torch import nn
import pandas as pd
import torch.optim as optim
import torch.nn.functional as F
import copy
from torch.utils.data import Dataset, DataLoader
import random
import wandb

#### WanDB login

In [2]:
wandb.login(key="b4dc866a06ba17317c20de0d13c1a64cc23096dd")

[34m[1mwandb[0m: Using wandb-core as the SDK backend.  Please refer to https://wandb.me/wandb-core for more information.
[34m[1mwandb[0m: No netrc file found, creating one.
[34m[1mwandb[0m: Appending key for api.wandb.ai to your netrc file: /root/.netrc
[34m[1mwandb[0m: Currently logged in as: [33mcs23s025[0m ([33mcs23s025-indian-institute-of-technology-madras[0m) to [32mhttps://api.wandb.ai[0m. Use [1m`wandb login --relogin`[0m to force relogin


True

#### check and use GPU if available

In [3]:
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

#### Paths for loading data-sets (train/test/validate)

In [None]:

train_csv = "/kaggle/input/dakshina-dataset-hindi/DakshinaDataSet_Hindi/hindi_Train_dataset.csv"
test_csv = "/kaggle/input/dakshina-dataset-hindi/DakshinaDataSet_Hindi/hindi_Test_dataset.csv"
val_csv = "/kaggle/input/dakshina-dataset-hindi/DakshinaDataSet_Hindi/hindi_Validation_dataset.csv"

In [5]:
# Data loading
train_data = pd.read_csv(train_csv, header=None)
train_input = train_data[0].to_numpy()
train_output = train_data[1].to_numpy()
val_data = pd.read_csv(val_csv, header=None)
val_input = val_data[0].to_numpy()
val_output = val_data[1].to_numpy()
test_data = pd.read_csv(test_csv, header=None)

In [6]:
def pre_processing(train_input, train_output):
    data = {
        "all_characters": [],
        "char_num_map": {},
        "num_char_map": {},
        "source_charToNum": torch.zeros(len(train_input), 30, dtype=torch.int, device=device),
        "source_data": train_input,
        "all_characters_2": [],
        "char_num_map_2": {},
        "num_char_map_2": {},
        "val_charToNum": torch.zeros(len(train_output), 23, dtype=torch.int, device=device),
        "target_data": train_output,
        "source_len": 0,
        "target_len": 0
    }
    
    for i in range(len(train_input)):
        train_input[i] = "{" + train_input[i] + "}" * (29 - len(train_input[i]))
        charToNum = []
        for char in train_input[i]:
            if char not in data["all_characters"]:
                data["all_characters"].append(char)
                index = len(data["all_characters"]) - 1
                data["char_num_map"][char] = index
                data["num_char_map"][index] = char
            else:
                index = data["char_num_map"][char]
            charToNum.append(index)
        data["source_charToNum"][i] = torch.tensor(charToNum, device=device)

        train_output[i] = "{" + train_output[i] + "}" * (22 - len(train_output[i]))
        charToNum1 = []
        for char in train_output[i]:
            if char not in data["all_characters_2"]:
                data["all_characters_2"].append(char)
                index = len(data["all_characters_2"]) - 1
                data["char_num_map_2"][char] = index
                data["num_char_map_2"][index] = char
            else:
                index = data["char_num_map_2"][char]
            charToNum1.append(index)
        data["val_charToNum"][i] = torch.tensor(charToNum1, device=device)
    
    data["source_len"] = len(data["all_characters"])
    data["target_len"] = len(data["all_characters_2"])
    return data

data = pre_processing(copy.copy(train_input), copy.copy(train_output))

In [7]:
def pre_processing_validation(val_input, val_output):
    data2 = {
        "source_charToNum": torch.zeros(len(val_input), 30, dtype=torch.int, device=device),
        "val_charToNum": torch.zeros(len(val_output), 23, dtype=torch.int, device=device)
    }
    m1 = data["char_num_map"]
    m2 = data["char_num_map_2"]
    
    for i in range(len(val_input)):
        val_input[i] = "{" + val_input[i] + "}" * (29 - len(val_input[i]))
        charToNum = [m1[char] for char in val_input[i]]
        data2["source_charToNum"][i] = torch.tensor(charToNum, device=device)
        
        val_output[i] = "{" + val_output[i] + "}" * (22 - len(val_output[i]))
        charToNum1 = [m2[char] for char in val_output[i]]
        data2["val_charToNum"][i] = torch.tensor(charToNum1, device=device)
    
    return data2

data2 = pre_processing_validation(copy.copy(val_input), copy.copy(val_output))

In [8]:
class MyDataset(Dataset):
    def __init__(self, x, y):
        self.source = x
        self.target = y
    
    def __len__(self):
        return len(self.source)
    
    def __getitem__(self, idx):
        return self.source[idx], self.target[idx]

def dataLoaderFun(dataName, batch_size):
    if dataName == 'train':
        dataset = MyDataset(data["source_charToNum"], data['val_charToNum'])
    else:
        dataset = MyDataset(data2["source_charToNum"], data2['val_charToNum'])
    return DataLoader(dataset, batch_size=batch_size, shuffle=True)

class Encoder(nn.Module):
    def __init__(self, inputDim, embSize, encoderLayers, hiddenLayerNuerons, cellType, bidirection):
        super(Encoder, self).__init__()
        self.embedding = nn.Embedding(inputDim, embSize)
        self.encoderLayers = encoderLayers
        self.hiddenLayerNuerons = hiddenLayerNuerons
        self.bidirection = bidirection
        self.num_directions = 2 if bidirection == "Yes" else 1

        if cellType == 'GRU':
            self.rnn = nn.GRU(embSize, hiddenLayerNuerons, 
                            num_layers=encoderLayers,
                            bidirectional=(bidirection == "Yes"),
                            batch_first=True)
        elif cellType == 'LSTM':
            self.rnn = nn.LSTM(embSize, hiddenLayerNuerons,
                             num_layers=encoderLayers,
                             bidirectional=(bidirection == "Yes"),
                             batch_first=True)
        else:
            self.rnn = nn.RNN(embSize, hiddenLayerNuerons,
                            num_layers=encoderLayers,
                            bidirectional=(bidirection == "Yes"),
                            batch_first=True)

    def forward(self, currentInput, prevState):
        embdInput = self.embedding(currentInput)
        return self.rnn(embdInput, prevState)

    def getInitialState(self, batch_size):
        return torch.zeros(self.encoderLayers * self.num_directions, 
                          batch_size, 
                          self.hiddenLayerNuerons, 
                          device=device)

class Decoder(nn.Module):
    def __init__(self, outputDim, embSize, hiddenLayerNuerons, decoderLayers, cellType, dropout_p):
        super(Decoder, self).__init__()
        self.embedding = nn.Embedding(outputDim, embSize)
        self.decoderLayers = decoderLayers

        if cellType == 'GRU':
            self.rnn = nn.GRU(embSize, hiddenLayerNuerons,
                            num_layers=decoderLayers,
                            batch_first=True)
        elif cellType == 'LSTM':
            self.rnn = nn.LSTM(embSize, hiddenLayerNuerons,
                             num_layers=decoderLayers,
                             batch_first=True)
        else:
            self.rnn = nn.RNN(embSize, hiddenLayerNuerons,
                            num_layers=decoderLayers,
                            batch_first=True)

        self.fc = nn.Linear(hiddenLayerNuerons, outputDim)
        self.softmax = nn.LogSoftmax(dim=2)
        self.dropout = nn.Dropout(dropout_p)

    def forward(self, currentInput, prevState):
        embdInput = self.embedding(currentInput)
        output, prevState = self.rnn(embdInput, prevState)
        output = self.dropout(output)
        output = self.softmax(self.fc(output))
        return output, prevState

def init_decoder_state(encoder_state, encoderLayers, decoderLayers, cellType):
    if cellType == 'LSTM':
        h, c = encoder_state
        if encoderLayers >= decoderLayers:
            h_dec = h[-decoderLayers:]
            c_dec = c[-decoderLayers:]
        else:
            h_dec = torch.cat([h] + [h[-1:]]*(decoderLayers-encoderLayers), dim=0)
            c_dec = torch.cat([c] + [c[-1:]]*(decoderLayers-encoderLayers), dim=0)
        return (h_dec, c_dec)
    else:
        h = encoder_state
        if encoderLayers >= decoderLayers:
            h_dec = h[-decoderLayers:]
        else:
            h_dec = torch.cat([h] + [h[-1:]]*(decoderLayers-encoderLayers), dim=0)
        return h_dec

def train(embSize, encoderLayers, decoderLayers, hiddenLayerNuerons, cellType, bidirection, dropout, epochs, batchsize, learningRate, optimizer, tf_ratio):
    dataLoader = dataLoaderFun("train", batchsize)
    lossFunction = nn.NLLLoss()
    
    encoder = Encoder(data["source_len"], embSize, encoderLayers, 
                     hiddenLayerNuerons, cellType, bidirection).to(device)
    decoder = Decoder(data["target_len"], embSize, hiddenLayerNuerons,
                     decoderLayers, cellType, dropout).to(device)

    if optimizer == 'Adam':
        encoderOptimizer = optim.Adam(encoder.parameters(), lr=learningRate)
        decoderOptimizer = optim.Adam(decoder.parameters(), lr=learningRate)
    else:
        encoderOptimizer = optim.NAdam(encoder.parameters(), lr=learningRate)
        decoderOptimizer = optim.NAdam(decoder.parameters(), lr=learningRate)

    for epoch in range(epochs):
        train_accuracy = 0
        train_loss = 0
        total_samples = 0
        
        for batch_num, (sourceBatch, targetBatch) in enumerate(dataLoader):
            current_batch_size = sourceBatch.size(0)
            encoderInitialState = encoder.getInitialState(current_batch_size)
            
            if bidirection == "Yes":
                reversed_batch = torch.flip(sourceBatch, dims=[1])
                sourceBatch = (sourceBatch + reversed_batch) // 2
            
            if cellType == 'LSTM':
                encoderInitialState = (encoderInitialState, 
                                      torch.zeros_like(encoderInitialState))

            encoder_output, encoderCurrentState = encoder(sourceBatch, encoderInitialState)
            
            # Handle bidirectional state reduction
            if bidirection == "Yes":
                if cellType == 'LSTM':
                    encoderCurrentState = (
                        encoderCurrentState[0].view(encoderLayers, 2, current_batch_size, -1).sum(1),
                        encoderCurrentState[1].view(encoderLayers, 2, current_batch_size, -1).sum(1)
                    )
                else:
                    encoderCurrentState = encoderCurrentState.view(
                        encoderLayers, 2, current_batch_size, -1
                    ).sum(1)
            
            # Initialize decoder state
            decoderCurrState = init_decoder_state(
                encoderCurrentState, encoderLayers, decoderLayers, cellType
            )
            
            loss = 0
            sequenceLen = targetBatch.shape[1]
            Output = []
            randNumber = random.random()

            for i in range(sequenceLen):
                if i == 0:
                    decoderInput = targetBatch[:, i].reshape(current_batch_size, 1)
                else:
                    if randNumber < tf_ratio:
                        decoderInput = targetBatch[:, i].reshape(current_batch_size, 1)
                    else:
                        decoderInput = decoderInput.reshape(current_batch_size, 1)

                decoderOutput, decoderCurrState = decoder(decoderInput, decoderCurrState)
                _, topIndeces = decoderOutput.topk(1)
                decoderOutput = decoderOutput[:, -1, :]
                targetChars = targetBatch[:, i].type(dtype=torch.long)
                loss += lossFunction(decoderOutput, targetChars)
                decoderInput = topIndeces.squeeze().detach()
                Output.append(decoderInput)

            tensor_2d = torch.stack(Output)
            Output = tensor_2d.t()
            train_accuracy += (Output == targetBatch).all(dim=1).sum().item()
            train_loss += (loss.item() / sequenceLen)
            total_samples += targetBatch.size(0)

            encoderOptimizer.zero_grad()
            decoderOptimizer.zero_grad()
            loss.backward()
            encoderOptimizer.step()
            decoderOptimizer.step()
        
        val_acc, val_loss = validationAccuracy(encoder, decoder, batchsize, tf_ratio, cellType, bidirection)

        wandb.log({
            "epoch": epoch + 1,
            "train_loss": train_loss / len(dataLoader),
            "train_accuracy": train_accuracy / total_samples,
            "validation_loss": val_loss / len(dataLoaderFun("validation", batchsize)),
            "validation_accuracy": val_acc / sum(len(b) for b, _ in dataLoaderFun("validation", batchsize))
        })

def validationAccuracy(encoder, decoder, batchsize, tf_ratio, cellType, bidirection):
    dataLoader = dataLoaderFun("validation", batchsize)
    encoder.eval()
    decoder.eval()
    validation_accuracy = 0
    validation_loss = 0
    total_samples = 0
    lossFunction = nn.NLLLoss()

    for batch_num, (sourceBatch, targetBatch) in enumerate(dataLoader):
        current_batch_size = sourceBatch.size(0)
        encoderInitialState = encoder.getInitialState(current_batch_size)
        
        if cellType == 'LSTM':
            encoderInitialState = (encoderInitialState, 
                                  torch.zeros_like(encoderInitialState))
        
        if bidirection == "Yes":
            reversed_batch = torch.flip(sourceBatch, dims=[1])
            sourceBatch = (sourceBatch + reversed_batch) // 2

        encoder_output, encoderCurrentState = encoder(sourceBatch, encoderInitialState)
        
        # Handle bidirectional state reduction
        if bidirection == "Yes":
            if cellType == 'LSTM':
                encoderCurrentState = (
                    encoderCurrentState[0].view(encoder.encoderLayers, 2, current_batch_size, -1).sum(1),
                    encoderCurrentState[1].view(encoder.encoderLayers, 2, current_batch_size, -1).sum(1)
                )
            else:
                encoderCurrentState = encoderCurrentState.view(
                    encoder.encoderLayers, 2, current_batch_size, -1
                ).sum(1)
        
        decoderCurrState = init_decoder_state(
            encoderCurrentState, encoder.encoderLayers, decoder.decoderLayers, cellType
        )
        
        loss = 0
        outputSeqLen = targetBatch.shape[1]
        Output = []
        randNumber = random.random()

        for i in range(outputSeqLen):
            if i == 0:
                decoderInputensor = targetBatch[:, i].reshape(current_batch_size, 1)
            else:
                if randNumber < tf_ratio:
                    decoderInputensor = targetBatch[:, i].reshape(current_batch_size, 1)
                else:
                    decoderInputensor = decoderInputensor.reshape(current_batch_size, 1)

            decoderOutput, decoderCurrState = decoder(decoderInputensor, decoderCurrState)
            _, topIndeces = decoderOutput.topk(1)
            decoderOutput = decoderOutput[:, -1, :]
            curr_target_chars = targetBatch[:, i].type(dtype=torch.long)
            loss += lossFunction(decoderOutput, curr_target_chars)
            decoderInputensor = topIndeces.squeeze().detach()
            Output.append(decoderInputensor)

        tensor_2d = torch.stack(Output)
        Output = tensor_2d.t()
        validation_accuracy += (Output == targetBatch).all(dim=1).sum().item()
        validation_loss += (loss.item() / outputSeqLen)
        total_samples += targetBatch.size(0)

    encoder.train()
    decoder.train()
    return validation_accuracy, validation_loss

In [9]:
def main_fun():
    wandb.init(project='CS23S025-Assignment-3-DL')
    params = wandb.config
    train(params.embSize, params.encoderLayers, params.decoderLayers,
          params.hiddenLayerNuerons, params.cellType, params.bidirection,
          params.dropout, params.epochs, params.batchsize, params.learningRate,
          params.optimizer, params.tf_ratio)

sweep_params = {
    'method': 'bayes',
    'name': 'Assignment_3_WITHOUT_Attention_2',
    'metric': {
        'goal': 'maximize',
        'name': 'validation_accuracy',
    },
    'parameters': {
        'embSize': {'values': [32, 64,128,256]},
        'encoderLayers': {'values': [2,3,4,5,7]},
        'decoderLayers': {'values': [2,3,4,5]},
        'hiddenLayerNuerons': {'values': [64, 256, 512]},
        'cellType': {'values': ['GRU', 'RNN', 'LSTM']},
        'bidirection': {'values': ['no', 'Yes']},
        'dropout': {'values': [0, 0.2, 0.3,0.5]},
        'epochs': {'values': [10, 15,20,25]},
        'batchsize': {'values': [32, 64,128]},
        'learningRate': {'values': [1e-2, 1e-3, 1e-4]},
        'optimizer': {'values': ['Adam', 'Nadam']},
        'tf_ratio': {'values': [0.2, 0.4, 0.5,0.7]}
    }
}

In [10]:
sweepId = wandb.sweep(sweep_params, project='CS23S025-Assignment-3-DL')
wandb.agent(sweepId, function=main_fun, count=50, entity="cs23s025-indian-institute-of-technology-madras", project="CS23S025-Assignment-3-DL")

Create sweep with ID: wfnp37oj
Sweep URL: https://wandb.ai/cs23s025-indian-institute-of-technology-madras/CS23S025-Assignment-3-DL/sweeps/wfnp37oj


[34m[1mwandb[0m: Agent Starting Run: 390l47mo with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 5
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embSize: 32
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 256
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.4


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▂▅▆▆▆▆▇▇▇█████
train_loss,█▅▃▂▂▂▂▂▁▁▁▁▁▁▁
validation_accuracy,▁▅▆▇▆▇▇▇▇▇▇▇█▇█
validation_loss,█▃▂▂▂▂▂▁▂▁▁▁▁▁▁

0,1
epoch,15.0
train_accuracy,0.60764
train_loss,0.123
validation_accuracy,0.55851
validation_loss,0.19666


[34m[1mwandb[0m: Agent Starting Run: hw2v6dsb with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: GRU
[34m[1mwandb[0m: 	decoderLayers: 5
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embSize: 16
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.0001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.4


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▁▃▆▇█▇▇▇▇▇██▇▇
train_loss,█▇▄▃▃▂▂▂▂▂▁▁▁▁▁
validation_accuracy,▁▁▅▇▆█▇█▇▇▆▆▇██
validation_loss,█▆▄▃▄▂▂▂▂▂▃▂▂▁▁

0,1
epoch,15.0
train_accuracy,0.37987
train_loss,0.42844
validation_accuracy,0.43575
validation_loss,0.36092


[34m[1mwandb[0m: Agent Starting Run: o0p52m5d with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: Yes
[34m[1mwandb[0m: 	cellType: GRU
[34m[1mwandb[0m: 	decoderLayers: 10
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 32
[34m[1mwandb[0m: 	encoderLayers: 5
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hiddenLayerNuerons: 64
[34m[1mwandb[0m: 	learningRate: 0.01
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▂▃▃▄▅▆▆▇█
train_accuracy,█▆▃▃▃▆▃██▁
train_loss,▄▁▁▁▁▁▆█▆▄
validation_accuracy,▁▁▁▁▁▁▁▁▁▁
validation_loss,▁▁▁▁▁▁█▄▆▂

0,1
epoch,10.0
train_accuracy,0.0
train_loss,1.17127
validation_accuracy,0.0
validation_loss,1.03836


[34m[1mwandb[0m: Agent Starting Run: 3mm2w4i6 with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: Yes
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 5
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 256
[34m[1mwandb[0m: 	learningRate: 0.0001
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▁▁▂▂▃▄▅▆▇▇████
train_loss,█▅▄▃▃▂▂▂▂▁▁▁▁▁▁
validation_accuracy,▁▁▁▂▃▄▅▆▆▆▇▇█▇█
validation_loss,█▆▅▄▃▃▂▂▂▂▁▂▁▁▁

0,1
epoch,15.0
train_accuracy,0.49903
train_loss,0.23241
validation_accuracy,0.50872
validation_loss,0.22314


[34m[1mwandb[0m: Agent Starting Run: wfbqshl1 with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: Yes
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 5
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.0001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.4


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▁▂▃▄▅▅▆▆▇▇▇███
train_loss,█▅▄▃▃▂▂▂▂▂▂▁▁▁▁
validation_accuracy,▁▁▂▄▅▅▆▇▇█▇████
validation_loss,█▅▄▂▂▂▂▁▁▁▁▁▁▁▁

0,1
epoch,15.0
train_accuracy,0.50864
train_loss,0.16872
validation_accuracy,0.42336
validation_loss,0.27545


[34m[1mwandb[0m: Agent Starting Run: wq6ec8gr with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: Yes
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 256
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▅▆▅▅▆▆▆▆▇▇▇█▇█
train_loss,█▄▃▃▃▂▂▂▂▂▂▂▁▁▁
validation_accuracy,▆▁▂▅▄▃▄█▇▁▆▆▆▆▆
validation_loss,▆█▆▄▄▅▅▁▂▆▂▃▃▃▃

0,1
epoch,15.0
train_accuracy,0.59312
train_loss,0.15522
validation_accuracy,0.57067
validation_loss,0.19636


[34m[1mwandb[0m: Agent Starting Run: cslk6k5k with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 5
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 64
[34m[1mwandb[0m: 	learningRate: 0.0001
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.4


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▁▃▅▆▇▇▇███████
train_loss,█▄▃▂▂▂▂▂▁▁▁▁▁▁▁
validation_accuracy,▁▂▄▅▆▅▇█▇▆▆▇█▇▇
validation_loss,█▆▄▄▃▃▂▁▂▃▂▂▁▂▂

0,1
epoch,15.0
train_accuracy,0.40711
train_loss,0.55989
validation_accuracy,0.37219
validation_loss,0.56132


[34m[1mwandb[0m: Agent Starting Run: ojt1fj7k with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: Yes
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.0001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▆▇▇▇▇██▇▇▇████
train_loss,█▄▃▂▂▂▂▁▂▁▁▁▁▁▁
validation_accuracy,▁▃▄▅▅▅▇▅▅▆▆▇▅█▆
validation_loss,█▆▄▃▃▃▂▃▃▂▂▂▂▁▂

0,1
epoch,15.0
train_accuracy,0.53312
train_loss,0.21023
validation_accuracy,0.53924
validation_loss,0.21192


[34m[1mwandb[0m: Agent Starting Run: l47mo22v with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 5
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embSize: 16
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.0001
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.4


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▁▁▁▂▃▄▅▆▇▇█▇█▇
train_loss,█▆▅▄▂▂▂▁▁▁▁▁▁▁▁
validation_accuracy,▁▁▁▁▂▃▄▄▇▇▇▆█▇▇
validation_loss,█▇▆▄▃▂▃▃▂▂▂▂▁▃▂

0,1
epoch,15.0
train_accuracy,0.30171
train_loss,0.5995
validation_accuracy,0.36806
validation_loss,0.54163


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: gaovofrg with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 5
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.4


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▃▅▅▆▆▆▇▇▇▇████
train_loss,█▄▃▂▂▂▂▂▁▁▁▁▁▁▁
validation_accuracy,▁▄▆▇▇█▇▇▇▇▇█▇██
validation_loss,█▃▂▁▁▁▁▁▁▁▁▁▂▁▁

0,1
epoch,15.0
train_accuracy,0.71757
train_loss,0.0739
validation_accuracy,0.53534
validation_loss,0.22388


[34m[1mwandb[0m: Agent Starting Run: 28kpj1et with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▃▄▅▅▅▆▆▆▇▇▇███
train_loss,█▅▃▂▂▂▂▂▂▁▁▁▁▁▁
validation_accuracy,▂▁▁▅▃▆▅▅▇▅▅▄█▆▇
validation_loss,█▅▃▂▂▁▂▂▁▂▂▂▁▂▂

0,1
epoch,15.0
train_accuracy,0.75524
train_loss,0.07273
validation_accuracy,0.67003
validation_loss,0.13855


[34m[1mwandb[0m: Agent Starting Run: o5oowe9c with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 256
[34m[1mwandb[0m: 	learningRate: 0.01
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▃▆▃▆▅▇▅▇▆▇▆▇█▇
train_loss,█▅▃▃▂▂▂▂▁▂▁▁▁▁▁
validation_accuracy,▂▇▄▃▇▇▅▄▁█▄▃▆▆▅
validation_loss,█▄▄▄▂▂▂▃▃▁▂▃▂▁▂

0,1
epoch,15.0
train_accuracy,0.55328
train_loss,0.22282
validation_accuracy,0.55507
validation_loss,0.21941


[34m[1mwandb[0m: Agent Starting Run: vx4hm9m4 with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.01
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.4


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▆▅▆▆▆▇▇▇▇██▇██
train_loss,█▃▃▂▂▂▂▂▁▁▁▁▁▁▁
validation_accuracy,▁▃▁▄▅▃▂▄▆█▃▇▅▃▄
validation_loss,█▅▅▃▂▃▂▂▁▁▂▁▂▂▂

0,1
epoch,15.0
train_accuracy,0.48292
train_loss,0.22384
validation_accuracy,0.43506
validation_loss,0.26262


[34m[1mwandb[0m: Agent Starting Run: cx436swr with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 10
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 5
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.01
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁█▁▆▃▃▁▃▁██▁▃▁▁
train_loss,█▃▂▂▁▂▂▁▂▂▁▂▁▂▂
validation_accuracy,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
validation_loss,▇▆▃█▆▅▃▁▆▃▃▄▃▄▂

0,1
epoch,15.0
train_accuracy,0.0
train_loss,1.10019
validation_accuracy,0.0
validation_loss,1.02253


[34m[1mwandb[0m: Agent Starting Run: kgcrz73n with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 5
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▅▆▆▆▆▆▆▇▇▇▇███
train_loss,█▅▄▄▃▃▂▂▂▂▂▁▁▁▁
validation_accuracy,▁▅▆▆▆▇▇▆▇█▇▇▇█▇
validation_loss,█▆▅▄▄▃▂▂▂▁▁▂▂▁▂

0,1
epoch,15.0
train_accuracy,0.70368
train_loss,0.09033
validation_accuracy,0.54543
validation_loss,0.21429


[34m[1mwandb[0m: Agent Starting Run: cg5rotdt with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 32
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.4


0,1
epoch,▁▂▃▃▄▅▆▆▇█
train_accuracy,▁▄▄▅▆▆▇▇██
train_loss,█▄▃▂▂▂▁▁▁▁
validation_accuracy,▁▂▄▄▄▅▆▅█▇
validation_loss,█▅▃▂▂▂▂▂▁▁

0,1
epoch,10.0
train_accuracy,0.63063
train_loss,0.12057
validation_accuracy,0.57136
validation_loss,0.17939


[34m[1mwandb[0m: Agent Starting Run: socc60v9 with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 5
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embSize: 32
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.4


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▅▅▅▅▅▆▆▇▇▇▇███
train_loss,█▆▅▅▄▃▂▂▂▂▂▁▁▁▁
validation_accuracy,▁▅▂▃▄▅▇▅▅▅▆▆███
validation_loss,█▇▆▅▃▂▁▂▂▂▁▁▁▁▁

0,1
epoch,15.0
train_accuracy,0.59624
train_loss,0.12397
validation_accuracy,0.49541
validation_loss,0.22263


[34m[1mwandb[0m: Agent Starting Run: m142928d with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hiddenLayerNuerons: 256
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▂▃▃▄▅▆▆▇█
train_accuracy,▁▅▅▅▆▆▇▇██
train_loss,█▅▄▃▂▂▂▁▁▁
validation_accuracy,▁▂▂▃▂▇█▅▅▇
validation_loss,█▆▄▃▃▂▁▂▂▁

0,1
epoch,10.0
train_accuracy,0.59138
train_loss,0.16835
validation_accuracy,0.61726
validation_loss,0.14971


[34m[1mwandb[0m: Agent Starting Run: 1s7i17ar with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: Yes
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embSize: 32
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▅▄▄▆▆▆▆▇▇▇▇███
train_loss,█▃▃▃▂▂▂▂▂▁▁▁▁▁▁
validation_accuracy,▇▅▃█▇▅▆▇▆▇▂▅▃▁▂
validation_loss,▇▄▅▁▂▂▂▁▃▂▆▄▆██

0,1
epoch,15.0
train_accuracy,0.66173
train_loss,0.10466
validation_accuracy,0.48531
validation_loss,0.26666


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 9eyp8qwf with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 32
[34m[1mwandb[0m: 	encoderLayers: 5
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁███▆▇▇▇█▇▇██▇▇
train_loss,█▃▃▃▄▃▃▃▂▂▂▁▁▁▁
validation_accuracy,▅▄▆▆▇▅▅▅▅█▆█▇▁▅
validation_loss,▇█▅▅▄▆▆▅▅▁▂▁▁▆▃

0,1
epoch,15.0
train_accuracy,0.4826
train_loss,0.36633
validation_accuracy,0.47017
validation_loss,0.36685


[34m[1mwandb[0m: Agent Starting Run: 8rmjkmp2 with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 5
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.0001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▅▇█▇████▇█████
train_loss,█▄▃▂▂▂▁▁▁▁▁▁▁▁▁
validation_accuracy,▁▄▆▆▅▆▆▆▆▇▆▅█▆▆
validation_loss,█▅▃▄▄▃▃▃▃▂▃▃▁▂▂

0,1
epoch,15.0
train_accuracy,0.49061
train_loss,0.37415
validation_accuracy,0.51606
validation_loss,0.33331


[34m[1mwandb[0m: Agent Starting Run: yef6l17o with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: RNN
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.0001
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▂▃▃▄▅▆▆▇█
train_accuracy,▁▆▇▇▇█▇██▇
train_loss,█▃▃▂▂▂▂▁▁▂
validation_accuracy,▁▆▅▆▆▅█▆▆▆
validation_loss,█▄▄▃▄▄▁▄▃▄

0,1
epoch,10.0
train_accuracy,0.46086
train_loss,0.59593
validation_accuracy,0.49954
validation_loss,0.51225


[34m[1mwandb[0m: Agent Starting Run: ncb87gpm with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 5
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▇█▇▇▇▇▇▆▇▆▇▇▇▇
train_loss,█▅▃▃▃▃▃▂▃▂▂▂▁▁▁
validation_accuracy,▃▃▄█▇▂▇▄▁█▃▅▃▇▅
validation_loss,██▅▂▃▅▂▄▅▁▃▂▃▁▂

0,1
epoch,15.0
train_accuracy,0.5117
train_loss,0.29467
validation_accuracy,0.52019
validation_loss,0.27842


[34m[1mwandb[0m: Agent Starting Run: fgr6rt4w with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hiddenLayerNuerons: 256
[34m[1mwandb[0m: 	learningRate: 0.01
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▂▃▃▄▅▆▆▇█
train_accuracy,▁▅▃▂▅▆▇▆█▆
train_loss,█▄▄▃▂▂▁▁▁▁
validation_accuracy,▃█▁▅▅▇▃▆▂▃
validation_loss,█▂▅▂▂▁▂▁▂▂

0,1
epoch,10.0
train_accuracy,0.52448
train_loss,0.25765
validation_accuracy,0.4922
validation_loss,0.26231


[34m[1mwandb[0m: Agent Starting Run: 6waxcmb4 with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 32
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▂▃▃▄▅▆▆▇█
train_accuracy,▁▄▅▅▆▆▇▇▇█
train_loss,█▄▃▂▂▂▁▁▁▁
validation_accuracy,▁▄▅▇▆▇▇▆▇█
validation_loss,█▄▂▂▂▁▁▂▁▁

0,1
epoch,10.0
train_accuracy,0.67642
train_loss,0.11358
validation_accuracy,0.66361
validation_loss,0.13143


[34m[1mwandb[0m: Agent Starting Run: u4k3uqev with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: Yes
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 256
[34m[1mwandb[0m: 	learningRate: 0.01
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.4


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁█▅▆▇▇█▇▇▆▅▆▇▇▇
train_loss,█▃▃▂▂▁▁▁▁▂▂▁▁▁▁
validation_accuracy,▁▅▄▆▄▄▄▄▄▃▄▃▅█▃
validation_loss,█▄▄▃▄▃▃▄▃▄▃▃▃▁▄

0,1
epoch,15.0
train_accuracy,0.42376
train_loss,0.29986
validation_accuracy,0.39123
validation_loss,0.30956


[34m[1mwandb[0m: Agent Starting Run: 86u0cni5 with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embSize: 32
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 256
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▅▆▅▆▆▆▇▇▇▇▇██▇
train_loss,█▅▄▃▂▂▂▂▁▁▁▁▁▁▁
validation_accuracy,▁▁▁▃▇▂▃▅▃█▅▆▆▇▇
validation_loss,█▆▅▃▂▃▂▂▂▁▂▁▁▁▁

0,1
epoch,15.0
train_accuracy,0.60884
train_loss,0.14079
validation_accuracy,0.66269
validation_loss,0.13239


[34m[1mwandb[0m: Agent Starting Run: euypiz81 with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: RNN
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 32
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 256
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▆█▆▇▇▆▇▆▇▅█▆▆▇
train_loss,█▄▂▃▂▂▃▂▃▂▄▁▃▃▂
validation_accuracy,▃▅▅▄█▃▇▅▁█▂▄▄▆▆
validation_loss,▆▅▄▅▂▅▂▄█▁█▅▄▃▃

0,1
epoch,15.0
train_accuracy,0.50023
train_loss,0.55516
validation_accuracy,0.52272
validation_loss,0.48756


[34m[1mwandb[0m: Agent Starting Run: 4c7r3nw9 with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 256
[34m[1mwandb[0m: 	learningRate: 0.0001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▃▅▇███▇███████
train_loss,█▄▃▂▂▂▂▂▂▂▂▁▁▁▁
validation_accuracy,▁▄▆▇▇▆▇▆▇▇█▇█▆▇
validation_loss,█▄▃▂▂▃▂▃▂▂▁▁▁▂▁

0,1
epoch,15.0
train_accuracy,0.49593
train_loss,0.40789
validation_accuracy,0.51331
validation_loss,0.36937


[34m[1mwandb[0m: Agent Starting Run: yar5a4d7 with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 256
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▄▄▄▅▆▆▆▇▇▇▇▇██
train_loss,█▄▃▃▂▂▂▂▁▁▁▁▁▁▁
validation_accuracy,▃▁▃▃▄▃▄▇█▅▆▆▆▆▅
validation_loss,█▆▄▃▃▃▂▁▁▂▂▂▂▂▂

0,1
epoch,15.0
train_accuracy,0.66929
train_loss,0.11407
validation_accuracy,0.58238
validation_loss,0.17434


[34m[1mwandb[0m: Agent Starting Run: m2quewjj with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.0001
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▅▇▇▇█▇█▇██████
train_loss,█▄▃▃▃▃▃▂▃▂▂▂▁▁▁
validation_accuracy,▁▅▆▇██▆▇▆▆▅▆▇▅▇
validation_loss,█▅▄▄▃▃▄▃▄▄▄▃▂▂▁

0,1
epoch,15.0
train_accuracy,0.52421
train_loss,0.281
validation_accuracy,0.52455
validation_loss,0.26351


[34m[1mwandb[0m: Agent Starting Run: wsge53v6 with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 16
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.4


0,1
epoch,▁▂▃▃▄▅▆▆▇█
train_accuracy,▁▅▅▅▆▆▇▇██
train_loss,█▅▄▃▂▂▂▁▁▁
validation_accuracy,▂▁▂▅▄▆▆▆▇█
validation_loss,█▆▄▂▂▁▂▁▁▁

0,1
epoch,10.0
train_accuracy,0.57016
train_loss,0.15578
validation_accuracy,0.59615
validation_loss,0.16072


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: gbt29be1 with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: RNN
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embSize: 32
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.0001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▄▇█▇▇█▇███▇███
train_loss,█▃▂▂▂▂▁▂▁▁▁▂▁▁▁
validation_accuracy,▁▆▆▆▇█▇█▇█▇█▇▇▇
validation_loss,█▃▄▄▃▁▄▂▃▁▂▁▄▃▃

0,1
epoch,15.0
train_accuracy,0.49468
train_loss,0.55573
validation_accuracy,0.46948
validation_loss,0.53235


[34m[1mwandb[0m: Agent Starting Run: m4bya6h2 with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 32
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 256
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▅▅▆▆▇▇▇▇▇▇▇███
train_loss,█▄▄▃▂▂▂▂▁▁▁▁▁▁▁
validation_accuracy,▃▅▆▅▁▁▆▇▅▅▅██▆▅
validation_loss,█▅▄▃▄▄▂▂▂▂▂▁▁▂▂

0,1
epoch,15.0
train_accuracy,0.6059
train_loss,0.15218
validation_accuracy,0.56815
validation_loss,0.17188


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: feho8ox5 with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.01
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▆▆▆▆▅▅▇█▃▅▇█▇▃
train_loss,█▆▅▄▃▂▂▂▁▂▂▁▁▁▂
validation_accuracy,▄▁▄▇▂▄▃▅▄██▁▅▂█
validation_loss,██▆▃▄▃▃▃▃▂▁▃▂▃▁

0,1
epoch,15.0
train_accuracy,0.47819
train_loss,0.33061
validation_accuracy,0.55599
validation_loss,0.25865


[34m[1mwandb[0m: Agent Starting Run: jg53uf0f with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.01
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▂▃▃▄▅▆▆▇█
train_accuracy,▁▆▃█▆▅▇█▇▇
train_loss,█▆▆▃▃▂▂▁▁▁
validation_accuracy,▇▁▇██▇█▇▇▇
validation_loss,▃█▂▁▁▂▁▁▁▁

0,1
epoch,10.0
train_accuracy,0.51007
train_loss,0.37512
validation_accuracy,0.4424
validation_loss,0.38284


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 92a1qwdr with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hiddenLayerNuerons: 64
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.4


0,1
epoch,▁▂▃▃▄▅▆▆▇█
train_accuracy,▁▇▇███████
train_loss,█▄▃▂▂▂▁▁▁▁
validation_accuracy,▁▂▂▃█▆▆▄▃▄
validation_loss,█▇▆▄▁▂▂▁▂▁

0,1
epoch,10.0
train_accuracy,0.41668
train_loss,0.40942
validation_accuracy,0.38825
validation_loss,0.39402


[34m[1mwandb[0m: Agent Starting Run: i9hswjif with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 5
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	embSize: 32
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▂▃▃▄▅▆▆▇█
train_accuracy,▁▁▄▇▇▇▇▇██
train_loss,█▅▅▄▃▃▂▂▁▁
validation_accuracy,▁▂▇█▇████▇
validation_loss,█▆▄▄▄▂▂▁▁▁

0,1
epoch,10.0
train_accuracy,0.53274
train_loss,0.20896
validation_accuracy,0.46352
validation_loss,0.21072


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: s4dqpfy9 with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 16
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.0001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▂▃▃▄▅▆▆▇█
train_accuracy,▁▁▂▄▆▇▇▇██
train_loss,█▅▄▃▂▁▁▁▁▁
validation_accuracy,▁▂▃▅▆▇▇▇██
validation_loss,█▆▄▄▃▂▂▂▁▁

0,1
epoch,10.0
train_accuracy,0.48328
train_loss,0.49905
validation_accuracy,0.52524
validation_loss,0.42897


[34m[1mwandb[0m: Agent Starting Run: y7sd2ars with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: Yes
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 32
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▅▅▅▅▅▆▆▆▇█▇███
train_loss,█▄▃▃▃▂▂▂▂▁▁▁▁▁▁
validation_accuracy,▃▁▂▄▂▂▃▃▃▃▂▄▃▆█
validation_loss,█▇▅▃▄▅▃▃▄▄▅▃▅▃▁

0,1
epoch,15.0
train_accuracy,0.66554
train_loss,0.10535
validation_accuracy,0.62643
validation_loss,0.18455


[34m[1mwandb[0m: Agent Starting Run: 5s1g52d6 with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: Yes
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▄▄▄▅▅▆▆▆▆▇▇▇██
train_loss,█▄▃▃▃▂▂▂▂▂▁▁▁▁▁
validation_accuracy,▂▃▄▁▆▇▃▇▅█▁▅▅▆▂
validation_loss,█▅▃▅▁▁▄▂▃▁▆▄▃▃▅

0,1
epoch,15.0
train_accuracy,0.67578
train_loss,0.10433
validation_accuracy,0.48256
validation_loss,0.25426


[34m[1mwandb[0m: Agent Starting Run: cq2qx525 with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embSize: 16
[34m[1mwandb[0m: 	encoderLayers: 5
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.01
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▃▄▅▆▅▇▅▄▄▄▅▅█▅
train_loss,█▅█▄▃▃▂▃▄▄▄▄▄▁▃
validation_accuracy,▃█▄▄█▆▆▃▄▆▁▃▇▇▅
validation_loss,█▂▆▆▁▄▅█▇▄▇▇▃▃▅

0,1
epoch,15.0
train_accuracy,0.499
train_loss,0.53651
validation_accuracy,0.49931
validation_loss,0.51208


[34m[1mwandb[0m: Agent Starting Run: nnrul050 with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 256
[34m[1mwandb[0m: 	learningRate: 0.01
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▄▄▆▄▅▄▆█▆▅▆▇▇▆
train_loss,█▄▃▂▂▂▂▂▁▁▂▁▁▁▁
validation_accuracy,▄▃▅▁▆▇▂▁▆▇▃▇▃▂█
validation_loss,█▇▄▆▂▂▄▄▂▂▃▁▃▄▁

0,1
epoch,15.0
train_accuracy,0.51995
train_loss,0.2624
validation_accuracy,0.60005
validation_loss,0.21072


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: bp9gvplf with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 256
[34m[1mwandb[0m: 	learningRate: 0.0001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▃▅▆▇█▇▇██▇▇███
train_loss,█▄▃▃▃▂▂▂▂▂▂▁▁▁▁
validation_accuracy,▁▄▅▇▅▆▆█▇▇▆█▇▇█
validation_loss,█▅▅▃▅▄▃▂▂▂▂▁▁▂▁

0,1
epoch,15.0
train_accuracy,0.51756
train_loss,0.27929
validation_accuracy,0.57458
validation_loss,0.23342


[34m[1mwandb[0m: Agent Starting Run: 0ora7crn with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: RNN
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▅▇▅▆▄█▄▅▇▇▆▄█▇
train_loss,█▅▂▄▃▄▁▄▃▂▂▃▅▁▂
validation_accuracy,▄▆▃▃▅▅▆▅▆▄█▃▁▃▆
validation_loss,▇▃▇▇▄▄▃▄▄▆▁▆█▆▃

0,1
epoch,15.0
train_accuracy,0.51495
train_loss,0.53197
validation_accuracy,0.57412
validation_loss,0.43366


[34m[1mwandb[0m: Agent Starting Run: pv4tfg3l with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 16
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 256
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▇▇▇▇▆▆▇▇▇▇▇▇▇█
train_loss,█▄▄▃▃▃▃▂▂▂▂▂▁▁▁
validation_accuracy,▂▂▂▆▅▄▅▁▅▅▄█▆▅▆
validation_loss,█▇▆▃▃▄▃▄▂▂▂▁▁▂▁

0,1
epoch,15.0
train_accuracy,0.59481
train_loss,0.17314
validation_accuracy,0.57297
validation_loss,0.17802


[34m[1mwandb[0m: Agent Starting Run: iectolku with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: RNN
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.2
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.0001
[34m[1mwandb[0m: 	optimizer: Nadam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▆███▇▇██▇█▇▇█▇
train_loss,█▃▁▁▁▂▂▁▁▂▁▂▂▁▂
validation_accuracy,▁▅▄▆▃▇▆▆▇█▇▅██▇
validation_loss,█▅▇▄█▃▄▄▂▁▃▅▂▁▃

0,1
epoch,15.0
train_accuracy,0.48876
train_loss,0.55836
validation_accuracy,0.5296
validation_loss,0.46598


[34m[1mwandb[0m: Agent Starting Run: 9tmu6t2w with config:
[34m[1mwandb[0m: 	batchsize: 32
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 16
[34m[1mwandb[0m: 	encoderLayers: 5
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 256
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


[34m[1mwandb[0m: [32m[41mERROR[0m Error while calling W&B API: context deadline exceeded (<Response [500]>)
[34m[1mwandb[0m: [32m[41mERROR[0m Error while calling W&B API: context deadline exceeded (<Response [500]>)


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▇▇███▇█▇█▇████
train_loss,█▄▄▃▃▃▃▃▃▂▃▂▁▁▁
validation_accuracy,▂▆█▅▅▅▄▅▁▁▃▃▄▆▃
validation_loss,█▅▃▄▄▄▄▃▅▆▄▃▂▁▂

0,1
epoch,15.0
train_accuracy,0.50934
train_loss,0.35777
validation_accuracy,0.47912
validation_loss,0.3603


[34m[1mwandb[0m: Agent Starting Run: 1kz9jdkp with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: LSTM
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0
[34m[1mwandb[0m: 	embSize: 64
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 64
[34m[1mwandb[0m: 	learningRate: 0.001
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▆▇▇▇▇▇██▇▇██▇█
train_loss,█▄▃▃▂▂▂▂▂▂▁▁▁▁▁
validation_accuracy,▁▃▄▃▇▇█▃▂▇▂▅▃▇▃
validation_loss,█▆▅▄▃▂▂▄▃▂▃▂▂▁▂

0,1
epoch,15.0
train_accuracy,0.51774
train_loss,0.26211
validation_accuracy,0.4548
validation_loss,0.28015


[34m[1mwandb[0m: Agent Starting Run: xwrs58yo with config:
[34m[1mwandb[0m: 	batchsize: 64
[34m[1mwandb[0m: 	bidirection: no
[34m[1mwandb[0m: 	cellType: RNN
[34m[1mwandb[0m: 	decoderLayers: 1
[34m[1mwandb[0m: 	dropout: 0.3
[34m[1mwandb[0m: 	embSize: 16
[34m[1mwandb[0m: 	encoderLayers: 1
[34m[1mwandb[0m: 	epochs: 15
[34m[1mwandb[0m: 	hiddenLayerNuerons: 512
[34m[1mwandb[0m: 	learningRate: 0.01
[34m[1mwandb[0m: 	optimizer: Adam
[34m[1mwandb[0m: 	tf_ratio: 0.5


[34m[1mwandb[0m: [32m[41mERROR[0m Error while calling W&B API: context deadline exceeded (<Response [500]>)


0,1
epoch,▁▁▂▃▃▃▄▅▅▅▆▇▇▇█
train_accuracy,▁▁▁▂▃▂▂▃▂▂▂▃▂▃█
train_loss,▅█▅▂▁▄▂▁▇▄▃▂▂▂▁
validation_accuracy,▂▁▁▁▃▁▁▄▁▁▂▁▁▃█
validation_loss,▁█▂▁▄▁▁▁▂▃▁▂▂▁▁

0,1
epoch,15.0
train_accuracy,0.00333
train_loss,1.11643
validation_accuracy,0.00688
validation_loss,0.99111
