Q1. Download the fashion-MNIST dataset and plot 1 sample image for each class as shown in the grid below. Use from keras.datasets import fashion_mnist for getting the fashion mnist dataset.

In [4]:
import pandas as pd
import numpy as np
from keras.datasets import fashion_mnist
import wandb

In [5]:
wandb.init(project="Assignment - 1", entity="da24m014-iit-madras")

# Load the Fashion-MNIST dataset
(x_train, y_train), (x_test, y_test) = fashion_mnist.load_data()



# Class names for Fashion-MNIST
class_names = ['T-shirt/top', 'Trouser', 'Pullover', 'Dress', 'Coat', 
               'Sandal', 'Shirt', 'Sneaker', 'Bag', 'Ankle boot']

# Log sample images to wandb
sample_images = []
unique_classes = np.unique(y_train)

for cls in unique_classes:
    sample_idx = np.where(y_train == cls)[0][0]  # Find an example for the class
    img = x_train[sample_idx]
    
    sample_images.append(wandb.Image(img, caption=class_names[cls]))

# Log images to wandb
wandb.log({"Sample Images": sample_images})

# Finish wandb run
wandb.finish()

[34m[1mwandb[0m: Using wandb-core as the SDK backend.  Please refer to https://wandb.me/wandb-core for more information.
[34m[1mwandb[0m: Currently logged in as: [33mda24m014[0m ([33mda24m014-iit-madras[0m) to [32mhttps://api.wandb.ai[0m. Use [1m`wandb login --relogin`[0m to force relogin


In [6]:
x_train, x_test = x_train / 255.0, x_test / 255.0
x_train, x_test = x_train.reshape(x_train.shape[0], -1), x_test.reshape(x_test.shape[0], -1)
num_classes = 10

In [7]:
def one_hot_encode(y, num_classes):
    encoded = np.zeros((y.size,num_classes))
    encoded[np.arange(y.size),y] = 1
    return encoded

y_train, y_test = one_hot_encode(y_train,num_classes), one_hot_encode(y_test, num_classes)

In [8]:
split_idx = int(0.9*len(x_train))
x_train, x_val = x_train[:split_idx], x_train[split_idx:]
y_train, y_val = y_train[:split_idx], y_train[split_idx:]

In [9]:
# Activation Functions
def relu(Z):
    return np.maximum(0, Z)

def sigmoid(Z):
    return 1 / (1 + np.exp(-Z))

def tanh(Z):
    return np.tanh(Z)

def softmax(Z):
    expZ = np.exp(Z - np.max(Z, axis=1, keepdims=True))
    return expZ / np.sum(expZ, axis=1, keepdims=True)

activation_functions = {"relu": relu, "sigmoid": sigmoid, "tanh": tanh}

In [10]:
# Optimizers
def optimizer_update(weights, biases, grads_W, grads_b, learning_rate, optimizer, velocity, momentum=0.9):
    if optimizer == "sgd":
        for i in range(len(weights)):
            weights[i] -= learning_rate * grads_W[i]
            biases[i] -= learning_rate * grads_b[i]
    elif optimizer == "momentum":
        for i in range(len(weights)):
            velocity[i] = momentum * velocity[i] - learning_rate * grads_W[i]
            weights[i] += velocity[i]
            biases[i] -= learning_rate * grads_b[i]
    elif optimizer == "nesterov":
        for i in range(len(weights)):
            prev_velocity = velocity[i]
            velocity[i] = momentum * velocity[i] - learning_rate * grads_W[i]
            weights[i] += -momentum * prev_velocity + (1 + momentum) * velocity[i]
            biases[i] -= learning_rate * grads_b[i]
    elif optimizer == "rmsprop":
        epsilon = 1e-8
        decay_rate = 0.99
        for i in range(len(weights)):
            velocity[i] = decay_rate * velocity[i] + (1 - decay_rate) * (grads_W[i] ** 2)
            weights[i] -= learning_rate * grads_W[i] / (np.sqrt(velocity[i]) + epsilon)
            biases[i] -= learning_rate * grads_b[i]
    elif optimizer == "adam" or optimizer == "nadam":
        beta1, beta2, epsilon = 0.9, 0.999, 1e-8
        for i in range(len(weights)):
            velocity[i] = beta1 * velocity[i] + (1 - beta1) * grads_W[i]
            velocity_corrected = velocity[i] / (1 - beta1)
            biases[i] -= learning_rate * grads_b[i]
            weights[i] -= learning_rate * velocity_corrected

In [15]:
class NeuralNetwork:
    def __init__(self,layers, learning_rate=0.001,activation="relu",optimizer="sgd",weight_init="random"):
        self.layers = layers
        self.activation = activation
        self.optimizer = optimizer
        self.learning_rate = learning_rate
        self.weight_init = weight_init
        self.init_weights(weight_init)
        self.velocity = [np.zeros_like(W) for W in self.weights]

    def init_weights(self, method):
        self.weights = []
        self.biases = []
        for i in range(len(self.layers) - 1):
            if method == "xavier":
                limit = np.sqrt(6 / (self.layers[i] + self.layers[i+1]))
            else:  # Default to "random"
                limit = 0.1
            W = np.random.uniform(-limit, limit, (self.layers[i], self.layers[i+1]))
            self.weights.append(W)
            self.biases.append(np.zeros((1, self.layers[i+1])))

    def forward(self, X):
        self.A = [X]
        for i in range(len(self.weights) - 1):
            Z = self.A[-1] @ self.weights[i] + self.biases[i]
            A = activation_functions[self.activation](Z)
            self.A.append(A)
        Z = self.A[-1] @ self.weights[-1] + self.biases[-1]
        A = softmax(Z)
        self.A.append(A)
        return A
    
    def compute_loss(self, y_true, y_pred):
        return -np.mean(np.sum(y_true * np.log(y_pred + 1e-8), axis=1))
    
    def backward(self, X, y):
        grads_W, grads_b = [], []
        if not hasattr(self, 'A') or len(self.A) == 0:
            raise ValueError("Activations A are not stored correctly. Check forward propagation.")

        dA = self.A[-1] - y
        for i in reversed(range(len(self.weights))):
            dW = self.A[i].T @ dA / X.shape[0]
            db = np.sum(dA, axis=0, keepdims=True) / X.shape[0]
            grads_W.append(dW)
            grads_b.append(db)
            if i > 0:
                dA = (dA @ self.weights[i].T) * (self.A[i] > 0)
        return grads_W[::-1], grads_b[::-1]
    

    def train(self, X_train, y_train, X_test, y_test, epochs, batch_size):
        for epoch in range(epochs):
            y_pred= self.forward(x_train)
            train_loss = self.compute_loss(y_train, y_pred)
            train_accuracy = np.mean(np.argmax(y_pred, axis=1) == np.argmax(y_train,axis=1))
            grads_W, grads_b = self.backward(X_train, y_train)
            optimizer_update(self.weights, self.biases, grads_W, grads_b, self.learning_rate, self.optimizer, self.velocity)
            y_pred_val = self.forward(x_val)
            val_loss = self.compute_loss(y_val, y_pred_val)
            val_accuracy = np.mean(np.argmax(y_pred_val, axis=1) == np.argmax(y_val, axis=1))
            wandb.log({"epoch": epoch+1,"loss": train_loss,"accuracy":train_accuracy,"val_loss": val_loss,"val_accuracy": val_accuracy})





In [16]:
sweep_config = {
    'method': 'random',
    'metric': {'name': 'loss', 'goal': 'minimize'},
    'parameters': {
        'learning_rate': {'values': [0.001, 0.01, 0.1]},
        'batch_size': {'values': [16, 32, 64]},
        'epochs': {'values': [5, 10]},
        'hidden_layers': {'values': [2, 3]},
        'hidden_size': {'values': [32, 64]},
        'activation': {'values': ['relu', 'sigmoid']},
        'optimizer': {'values': ['sgd', 'momentum']},
        'weight_init': {'values': ['random', 'xavier']}
    }
}

# wandb.init(project="Assignment - 1")  # Ensure WandB is initialized before using config
sweep_id = wandb.sweep(sweep_config)

Create sweep with ID: z5v1zv1m
Sweep URL: https://wandb.ai/da24m014-iit-madras/uncategorized/sweeps/z5v1zv1m


In [17]:
def train_with_wandb():
    wandb.init(project="Assignment - 1")  # Ensure WandB is initialized before using config
    config = wandb.config
    model = NeuralNetwork([784] + [config.hidden_size] * config.hidden_layers + [10],
                          learning_rate=config.learning_rate,
                          activation=config.activation,
                          optimizer=config.optimizer,
                          weight_init=config.weight_init)
    model.train(x_train, y_train, x_test, y_test, config.epochs, config.batch_size)

wandb.agent(sweep_id, function=train_with_wandb)

[34m[1mwandb[0m: Agent Starting Run: 205tiuxp with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.1003
epoch,5.0
loss,2.31052
val_accuracy,0.09733
val_loss,2.31307


[34m[1mwandb[0m: Agent Starting Run: p5rwy30i with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▂▂▂▃▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▂▂▃▅▆▇▇█
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.12348
epoch,10.0
loss,2.30111
val_accuracy,0.1245
val_loss,2.30101


[34m[1mwandb[0m: Agent Starting Run: 3t8xhcft with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▇▆▅▄▃▂▂▁

0,1
accuracy,0.10017
epoch,10.0
loss,2.30994
val_accuracy,0.0985
val_loss,2.31002


[34m[1mwandb[0m: Agent Starting Run: pq70mvyu with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▆▆▅▄▃▂▁

0,1
accuracy,0.09944
epoch,10.0
loss,2.44928
val_accuracy,0.105
val_loss,2.41979


[34m[1mwandb[0m: Agent Starting Run: pbwy5tb9 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random
[34m[1mwandb[0m: W&B API key is configured. Use [1m`wandb login --relogin`[0m to force relogin


0,1
accuracy,▁▃▅▅▇█▇▅▅▆
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,█▄▄██▄▄▁▄▄
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.10313
epoch,10.0
loss,2.29922
val_accuracy,0.1085
val_loss,2.2988


[34m[1mwandb[0m: Agent Starting Run: mzh1w8m3 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_accuracy,▁▁▁▁▁
val_loss,█▅▃▂▁

0,1
accuracy,0.1003
epoch,5.0
loss,2.35531
val_accuracy,0.09733
val_loss,2.33458


[34m[1mwandb[0m: Agent Starting Run: rhf7ducz with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▄▄▅▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▃▃▂▂▁
val_accuracy,▁▂▃▄▄▅▆▇▇█
val_loss,█▇▆▅▄▄▃▂▂▁

0,1
accuracy,0.16031
epoch,10.0
loss,2.23035
val_accuracy,0.17533
val_loss,2.21473


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 20ylq4fb with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▂▃▄▅▆▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▆▅▄▃▂▁
val_accuracy,▁▂▂▃▅▆▇▇██
val_loss,█▇▇▆▅▄▃▂▂▁

0,1
accuracy,0.18448
epoch,10.0
loss,2.30285
val_accuracy,0.18417
val_loss,2.30126


[34m[1mwandb[0m: Agent Starting Run: d6ygj0eu with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▃▁▂▄▄▅▇█▆▆
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.14083
epoch,10.0
loss,2.30197
val_accuracy,0.13967
val_loss,2.30222


[34m[1mwandb[0m: Agent Starting Run: k57q32jl with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁█
epoch,▁▃▅▆█
loss,█▄▂▂▁
val_accuracy,▁▁▁▆█
val_loss,█▅▃▂▁

0,1
accuracy,0.12463
epoch,5.0
loss,2.32182
val_accuracy,0.13617
val_loss,2.30051


[34m[1mwandb[0m: Agent Starting Run: 6d21qtht with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10065
epoch,10.0
loss,2.30507
val_accuracy,0.09417
val_loss,2.30589


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: bmldvnak with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▂▃▄▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▇▆▅▄▃▁
val_accuracy,▁▁▁▁▂▃▄▅▇█
val_loss,██▇▇▇▆▅▄▃▁

0,1
accuracy,0.44413
epoch,10.0
loss,1.95372
val_accuracy,0.50233
val_loss,1.84084


[34m[1mwandb[0m: Agent Starting Run: 44te3upj with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▃▅▆▇▇▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▅▄▃▃▂▂▁▁
val_accuracy,▁▂▄▅▅▆▆▇▇█
val_loss,█▆▅▄▄▃▂▂▁▁

0,1
accuracy,0.42002
epoch,10.0
loss,2.14363
val_accuracy,0.45883
val_loss,2.12765


[34m[1mwandb[0m: Agent Starting Run: q8ze8vfc with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▄▄▅▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▄▅▆▆▆▆▆▆█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10856
epoch,10.0
loss,2.30555
val_accuracy,0.11083
val_loss,2.30535


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: brztrox2 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.09939
epoch,5.0
loss,2.32201
val_accuracy,0.1055
val_loss,2.32074


[34m[1mwandb[0m: Agent Starting Run: zzk4at76 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▄▃▂▁
val_accuracy,▁▁▁▁█
val_loss,█▅▃▂▁

0,1
accuracy,0.1003
epoch,5.0
loss,2.29653
val_accuracy,0.10017
val_loss,2.28891


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 0h1meyhq with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁██▂
epoch,▁▃▅▆█
loss,█▆▄▂▁
val_accuracy,█▁▁▇█
val_loss,█▅▂▁▁

0,1
accuracy,0.09952
epoch,5.0
loss,2.30251
val_accuracy,0.105
val_loss,2.30002


[34m[1mwandb[0m: Agent Starting Run: olas44yu with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▆▆▅▄▃▂▁

0,1
accuracy,0.0997
epoch,10.0
loss,2.50511
val_accuracy,0.10267
val_loss,2.47535


[34m[1mwandb[0m: Agent Starting Run: 6hoqw54b with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.0997
epoch,5.0
loss,2.41752
val_accuracy,0.10267
val_loss,2.41517


[34m[1mwandb[0m: Agent Starting Run: f314mbgi with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▄▆█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▃▆▇█
val_loss,█▇▅▃▁

0,1
accuracy,0.1103
epoch,5.0
loss,2.30263
val_accuracy,0.1095
val_loss,2.30291


[34m[1mwandb[0m: Agent Starting Run: ws9sk6jr with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,██▆▆▃▃▃▃▃▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.11461
epoch,10.0
loss,2.30282
val_accuracy,0.11483
val_loss,2.30337


[34m[1mwandb[0m: Agent Starting Run: 8d46apio with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁██▆
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▅▃▁

0,1
accuracy,0.10033
epoch,5.0
loss,2.30159
val_accuracy,0.0935
val_loss,2.30188


[34m[1mwandb[0m: Agent Starting Run: p221i3gy with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁█
epoch,▁▃▅▆█
loss,█▆▃▁▁
val_accuracy,▁▁▁█▂
val_loss,█▄▂▁▂

0,1
accuracy,0.15185
epoch,5.0
loss,2.30283
val_accuracy,0.10317
val_loss,2.30475


[34m[1mwandb[0m: Agent Starting Run: 8hsft09f with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,█▆▆▃▆▁▆▃▁▃
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▅▅█████▅▁▁
val_loss,█▇▇▆▅▄▃▃▂▁

0,1
accuracy,0.08363
epoch,10.0
loss,2.30293
val_accuracy,0.07517
val_loss,2.30299


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: fz9ic8x6 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.09944
epoch,10.0
loss,2.33227
val_accuracy,0.105
val_loss,2.32392


[34m[1mwandb[0m: Agent Starting Run: 4y3v7wc4 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▃▅▆▆▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▅▄▃▂▂▁▁▁▁
val_accuracy,▁▂▃▅▆▆▇███
val_loss,█▅▄▃▂▂▂▁▁▁

0,1
accuracy,0.35722
epoch,10.0
loss,2.27549
val_accuracy,0.36267
val_loss,2.27322


[34m[1mwandb[0m: Agent Starting Run: ws5aim9f with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09996
epoch,10.0
loss,2.31601
val_accuracy,0.10033
val_loss,2.31339


[34m[1mwandb[0m: Agent Starting Run: vogedgx8 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▄▃▂▂▂▁▁▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▆▄▃▂▂▁▁▁▁

0,1
accuracy,0.09939
epoch,10.0
loss,2.30288
val_accuracy,0.1055
val_loss,2.30248


[34m[1mwandb[0m: Agent Starting Run: jfzs3i52 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.0997
epoch,5.0
loss,2.30723
val_accuracy,0.10267
val_loss,2.30597


[34m[1mwandb[0m: Agent Starting Run: l7alvfks with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▂▄▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▅▃▃▂▂▁▁▁▁
val_accuracy,▁▁▁▁▁▂▃▅▇█
val_loss,█▅▄▃▂▂▂▁▁▁

0,1
accuracy,0.26741
epoch,10.0
loss,2.26709
val_accuracy,0.30083
val_loss,2.2628


[34m[1mwandb[0m: Agent Starting Run: mg453y7m with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.09991
epoch,5.0
loss,2.36464
val_accuracy,0.10083
val_loss,2.36474


[34m[1mwandb[0m: Agent Starting Run: i2xl3ofw with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▂▃▄▃▁▄▆▇█▇
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▂▂▂▄▅██
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.09633
epoch,10.0
loss,2.30064
val_accuracy,0.09133
val_loss,2.30078


[34m[1mwandb[0m: Agent Starting Run: 8zo6kzmt with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_accuracy,▁▁▁▁▁
val_loss,█▅▃▂▁

0,1
accuracy,0.10065
epoch,5.0
loss,2.37328
val_accuracy,0.09417
val_loss,2.35538


[34m[1mwandb[0m: Agent Starting Run: c2t54twt with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,█▅▂▂▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁█
val_loss,█▇▅▃▁

0,1
accuracy,0.03663
epoch,5.0
loss,2.307
val_accuracy,0.03633
val_loss,2.30693


[34m[1mwandb[0m: Agent Starting Run: 4qi7jdf5 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▅▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▇▆▅▄▃▂▂▁

0,1
accuracy,0.09939
epoch,10.0
loss,2.30404
val_accuracy,0.1055
val_loss,2.303


[34m[1mwandb[0m: Agent Starting Run: ltatgbjn with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▄▅█
val_loss,█▇▅▃▁

0,1
accuracy,0.14622
epoch,5.0
loss,2.35157
val_accuracy,0.149
val_loss,2.35275


[34m[1mwandb[0m: Agent Starting Run: xzirj3gw with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▃▅█
val_loss,█▇▅▃▁

0,1
accuracy,0.11243
epoch,5.0
loss,2.35518
val_accuracy,0.12233
val_loss,2.34874


[34m[1mwandb[0m: Agent Starting Run: c2cnbypo with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▂▃▅█
val_loss,█▆▄▃▁

0,1
accuracy,0.05898
epoch,5.0
loss,2.32125
val_accuracy,0.0665
val_loss,2.31126


[34m[1mwandb[0m: Agent Starting Run: px3bv1qf with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▃▅▅█
val_loss,█▇▅▃▁

0,1
accuracy,0.15441
epoch,5.0
loss,2.29494
val_accuracy,0.158
val_loss,2.29373


[34m[1mwandb[0m: Agent Starting Run: 9dfdj855 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▆█
epoch,▁▃▅▆█
loss,█▅▂▁▁
val_accuracy,▁▂▇█▅
val_loss,█▄▂▂▁

0,1
accuracy,0.30376
epoch,5.0
loss,2.23322
val_accuracy,0.22067
val_loss,2.21506


[34m[1mwandb[0m: Agent Starting Run: rvg4r7vh with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.10065
epoch,5.0
loss,2.30648
val_accuracy,0.09417
val_loss,2.30712


[34m[1mwandb[0m: Agent Starting Run: g5idp97i with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.0997
epoch,5.0
loss,2.32835
val_accuracy,0.10267
val_loss,2.32336


[34m[1mwandb[0m: Agent Starting Run: 7k9v2um6 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▄▅▆▇▇▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▅▄▃▂▂▂▁▁
val_accuracy,▁▃▄▅▆▇▇▇██
val_loss,█▆▅▄▃▃▂▂▁▁

0,1
accuracy,0.19115
epoch,10.0
loss,2.24489
val_accuracy,0.19667
val_loss,2.23702


[34m[1mwandb[0m: Agent Starting Run: hhz56v0z with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▄▄▅▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▃▃▄▄▆▇▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10472
epoch,10.0
loss,2.30368
val_accuracy,0.0985
val_loss,2.30393


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 2ur1dc3s with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▅▇█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▄▅▆█
val_loss,█▆▅▃▁

0,1
accuracy,0.30102
epoch,5.0
loss,2.11846
val_accuracy,0.36567
val_loss,2.0145


[34m[1mwandb[0m: Agent Starting Run: ch6zguyz with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▄▅▄▄▅▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▆▆▅▄▄▃▂▁
val_accuracy,▁▂▃▄▄▄▅▆▇█
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.40031
epoch,10.0
loss,1.79069
val_accuracy,0.45117
val_loss,1.6689


[34m[1mwandb[0m: Agent Starting Run: dwuug075 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,█▃▂▁▂
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.03333
epoch,5.0
loss,2.3173
val_accuracy,0.033
val_loss,2.31667


[34m[1mwandb[0m: Agent Starting Run: 3q2pu7rh with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▅▇█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▃▅▇█
val_loss,█▆▄▃▁

0,1
accuracy,0.35211
epoch,5.0
loss,2.05605
val_accuracy,0.3995
val_loss,2.00034


[34m[1mwandb[0m: Agent Starting Run: bkq9cfd9 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▃▇█▅▃▂▂▂▂
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▆▅▄▃▁
val_accuracy,▂▆█▄▂▁▁▁▁▁
val_loss,██▇▇▆▆▅▄▃▁

0,1
accuracy,0.10091
epoch,10.0
loss,2.24384
val_accuracy,0.10717
val_loss,2.22327


[34m[1mwandb[0m: Agent Starting Run: bacpv92k with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▂▃▃▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▃▄▄▅▅▆▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.08622
epoch,10.0
loss,2.30384
val_accuracy,0.09183
val_loss,2.3038


[34m[1mwandb[0m: Agent Starting Run: meljl0n1 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▃▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▅▄▃▃▂▂▁

0,1
accuracy,0.09991
epoch,10.0
loss,2.45344
val_accuracy,0.10083
val_loss,2.44743


[34m[1mwandb[0m: Agent Starting Run: f1y5cnfu with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.10065
epoch,5.0
loss,2.31486
val_accuracy,0.09417
val_loss,2.31473


[34m[1mwandb[0m: Agent Starting Run: tm8xryy6 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▂▃▄▅▆▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▂▂▁
val_accuracy,▁▂▂▃▄▅▆▆▇█
val_loss,█▇▆▆▅▄▃▂▂▁

0,1
accuracy,0.13213
epoch,10.0
loss,2.30194
val_accuracy,0.13017
val_loss,2.30188


[34m[1mwandb[0m: Agent Starting Run: 61rqq6cx with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▂▃▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▂▃▄▆▇██
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.23743
epoch,10.0
loss,2.29861
val_accuracy,0.25183
val_loss,2.29777


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: os8gezdf with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▂▃▃▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▂▃▄▄▅▆▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.083
epoch,10.0
loss,2.30162
val_accuracy,0.0825
val_loss,2.30079


[34m[1mwandb[0m: Agent Starting Run: r40t8rsq with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▃▄▅▆▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▄▃▂▂▁
val_accuracy,▁▂▂▃▄▄▅▆▇█
val_loss,█▇▆▅▄▄▃▂▂▁

0,1
accuracy,0.2202
epoch,10.0
loss,2.26963
val_accuracy,0.22533
val_loss,2.25848


[34m[1mwandb[0m: Agent Starting Run: fqaovcpj with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.09996
epoch,10.0
loss,2.50223
val_accuracy,0.10033
val_loss,2.49834


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 46cwyl98 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▃▇█
val_loss,█▇▅▃▁

0,1
accuracy,0.08422
epoch,5.0
loss,2.29563
val_accuracy,0.08667
val_loss,2.29427


[34m[1mwandb[0m: Agent Starting Run: 8z9ncz9g with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.10065
epoch,5.0
loss,2.30614
val_accuracy,0.09417
val_loss,2.30873


[34m[1mwandb[0m: Agent Starting Run: j9zhj0bd with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁██▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▅▃▁▁▁▁▂▁▁
val_accuracy,▂▂▁▁▁██▁▁▁
val_loss,█▄▂▁▂▂▃▃▂▁

0,1
accuracy,0.1003
epoch,10.0
loss,2.31086
val_accuracy,0.09733
val_loss,2.30226


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: m5wn6p0c with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▃▃▃▃▁▃▆▆▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▇▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.05472
epoch,10.0
loss,2.30256
val_accuracy,0.0555
val_loss,2.30261


[34m[1mwandb[0m: Agent Starting Run: 77128h03 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.10065
epoch,10.0
loss,2.32026
val_accuracy,0.09417
val_loss,2.32563


[34m[1mwandb[0m: Agent Starting Run: npazg6mg with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▅▅▄▃▂▂▁

0,1
accuracy,0.0997
epoch,10.0
loss,2.38201
val_accuracy,0.10267
val_loss,2.37457


[34m[1mwandb[0m: Agent Starting Run: sc3it45z with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▂▄▆▆▆▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▅▄▃▂▂▂▁▁▁
val_accuracy,▁▁▂▄▅▅▅▆▇█
val_loss,█▆▄▃▃▂▂▂▁▁

0,1
accuracy,0.32494
epoch,10.0
loss,2.26591
val_accuracy,0.358
val_loss,2.26143


[34m[1mwandb[0m: Agent Starting Run: m83ek415 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.10083
epoch,10.0
loss,2.30765
val_accuracy,0.0925
val_loss,2.30846


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 69a51wzs with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▃▅▇█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁██
val_loss,█▆▄▃▁

0,1
accuracy,0.16031
epoch,5.0
loss,2.3236
val_accuracy,0.15817
val_loss,2.3238


[34m[1mwandb[0m: Agent Starting Run: s4wkxcir with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▂▃▃▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▇▆▅▄▄▃▂▁
val_accuracy,▁▂▂▃▄▅▆▆▇█
val_loss,█▇▇▆▅▄▄▃▂▁

0,1
accuracy,0.19902
epoch,10.0
loss,2.2882
val_accuracy,0.21833
val_loss,2.2862


[34m[1mwandb[0m: Agent Starting Run: ip85ug40 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.10065
epoch,5.0
loss,2.5703
val_accuracy,0.09417
val_loss,2.56011


[34m[1mwandb[0m: Agent Starting Run: gvsw6agv with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▆█▂▁▁▄▇
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▄▄▃▂▁
val_accuracy,▁▁▅▆▂▁▁▃▆█
val_loss,█▇▆▆▆▆▅▄▃▁

0,1
accuracy,0.20563
epoch,10.0
loss,2.2728
val_accuracy,0.242
val_loss,2.26496


[34m[1mwandb[0m: Agent Starting Run: 01q9bxci with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁█▅
epoch,▁▃▅▆█
loss,█▅▂▁▁
val_accuracy,▁▁█▅▁
val_loss,█▃▁▁▂

0,1
accuracy,0.20285
epoch,5.0
loss,2.29392
val_accuracy,0.105
val_loss,2.30893


[34m[1mwandb[0m: Agent Starting Run: s9nxuyw8 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▃▃▁▃█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.09826
epoch,5.0
loss,2.3014
val_accuracy,0.09883
val_loss,2.30084


[34m[1mwandb[0m: Agent Starting Run: auczrjrx with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_accuracy,▁▁▁▁▁
val_loss,█▅▃▂▁

0,1
accuracy,0.09965
epoch,5.0
loss,2.30551
val_accuracy,0.10317
val_loss,2.30409


[34m[1mwandb[0m: Agent Starting Run: 5wi6uh7j with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▆▆▅▄▃▂▁

0,1
accuracy,0.10083
epoch,10.0
loss,2.46093
val_accuracy,0.0925
val_loss,2.45721


[34m[1mwandb[0m: Agent Starting Run: jqwqcqau with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▂▃▄▅▆▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▃▄▅▆▆▆██
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.1172
epoch,10.0
loss,2.29246
val_accuracy,0.10967
val_loss,2.29324


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 06fohi91 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.0997
epoch,5.0
loss,2.44324
val_accuracy,0.10267
val_loss,2.42677


[34m[1mwandb[0m: Agent Starting Run: imkwy5b3 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▂▂▃▄▅▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▂▃▃▃▅▆█
val_loss,██▇▆▆▅▄▃▂▁

0,1
accuracy,0.10693
epoch,10.0
loss,2.29586
val_accuracy,0.109
val_loss,2.29462


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: rvquakw2 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▆█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▄▅█
val_loss,█▇▅▃▁

0,1
accuracy,0.13976
epoch,5.0
loss,2.30185
val_accuracy,0.15117
val_loss,2.30137


[34m[1mwandb[0m: Agent Starting Run: 7wt6u5ux with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▁▁▄█
val_loss,█▆▄▂▁

0,1
accuracy,0.10756
epoch,5.0
loss,2.30225
val_accuracy,0.11483
val_loss,2.30152


[34m[1mwandb[0m: Agent Starting Run: 4ya4iv5d with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▃▅▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▃▄▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.13669
epoch,5.0
loss,2.27551
val_accuracy,0.15983
val_loss,2.26551


[34m[1mwandb[0m: Agent Starting Run: a1t71tm4 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.09965
epoch,5.0
loss,2.38857
val_accuracy,0.10317
val_loss,2.37341


[34m[1mwandb[0m: Agent Starting Run: jwmzudzj with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▅█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▄▄█
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.10102
epoch,10.0
loss,2.29025
val_accuracy,0.09467
val_loss,2.29124


[34m[1mwandb[0m: Agent Starting Run: vm8tjs8g with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▄▅▅▆▇▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▄▅▅▆▆▇██
val_loss,█▇▆▆▅▄▄▃▂▁

0,1
accuracy,0.3448
epoch,10.0
loss,2.23388
val_accuracy,0.3585
val_loss,2.22454


[34m[1mwandb[0m: Agent Starting Run: orqc5rwr with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▂▂▃▄▅▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▃▃▂▂▁
val_accuracy,▁▁▁▂▃▄▄▅▇█
val_loss,█▇▆▅▄▃▃▂▂▁

0,1
accuracy,0.2233
epoch,10.0
loss,2.09339
val_accuracy,0.24617
val_loss,2.05529


[34m[1mwandb[0m: Agent Starting Run: dmckja43 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▆█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▂▄█
val_loss,█▇▅▃▁

0,1
accuracy,0.10226
epoch,5.0
loss,2.30345
val_accuracy,0.10183
val_loss,2.30317


[34m[1mwandb[0m: Agent Starting Run: kc63v7mo with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.0997
epoch,5.0
loss,2.31087
val_accuracy,0.10267
val_loss,2.31036


[34m[1mwandb[0m: Agent Starting Run: kq73sr5j with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▄▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▃▅▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.16187
epoch,5.0
loss,2.30916
val_accuracy,0.17183
val_loss,2.298


[34m[1mwandb[0m: Agent Starting Run: rk31zijs with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▄▆▇█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▄▆▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.14861
epoch,5.0
loss,2.3026
val_accuracy,0.14667
val_loss,2.30177


[34m[1mwandb[0m: Agent Starting Run: oacextp6 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▂▃▄▅▆▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▂▃▅▆▇▇▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10487
epoch,10.0
loss,2.30032
val_accuracy,0.1075
val_loss,2.30067


[34m[1mwandb[0m: Agent Starting Run: ciwq7k4x with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▅▃▁

0,1
accuracy,0.09996
epoch,5.0
loss,2.30929
val_accuracy,0.10033
val_loss,2.307


[34m[1mwandb[0m: Agent Starting Run: 0e98ju97 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▄▆▇▇▇▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▇▆▅▄▃▂▁▁
val_accuracy,▁▃▆▆▇▆▆███
val_loss,██▇▆▅▄▃▂▁▁

0,1
accuracy,0.59422
epoch,10.0
loss,1.09269
val_accuracy,0.58683
val_loss,1.0321


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: qu6y8vcu with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.09944
epoch,5.0
loss,2.31608
val_accuracy,0.105
val_loss,2.31328


[34m[1mwandb[0m: Agent Starting Run: 2ovbr7gp with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▃▃▃▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▂▄▆▇██
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.11361
epoch,10.0
loss,2.30196
val_accuracy,0.10583
val_loss,2.30203


[34m[1mwandb[0m: Agent Starting Run: 4hqekmya with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▄▅▆▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▅▅▆▆▆▆▆█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10085
epoch,10.0
loss,2.3039
val_accuracy,0.10483
val_loss,2.30343


[34m[1mwandb[0m: Agent Starting Run: e099e51n with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10017
epoch,10.0
loss,2.30659
val_accuracy,0.0985
val_loss,2.30902


[34m[1mwandb[0m: Agent Starting Run: jao4ybbj with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▂▄▆██
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▂▄▆███
val_loss,██▇▆▅▅▄▃▂▁

0,1
accuracy,0.23007
epoch,10.0
loss,2.29854
val_accuracy,0.21883
val_loss,2.29769


[34m[1mwandb[0m: Agent Starting Run: 4wznukn5 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▄▇▇█
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_accuracy,▁▅▆▇█
val_loss,█▆▄▃▁

0,1
accuracy,0.27267
epoch,5.0
loss,2.13646
val_accuracy,0.2945
val_loss,2.08984


[34m[1mwandb[0m: Agent Starting Run: 7j4kwrwe with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▄▄▄██
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09985
epoch,10.0
loss,2.30041
val_accuracy,0.10267
val_loss,2.30051


[34m[1mwandb[0m: Agent Starting Run: ncv7yqxg with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▂█
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_accuracy,▁▁▂▅█
val_loss,█▅▄▂▁

0,1
accuracy,0.18785
epoch,5.0
loss,2.24947
val_accuracy,0.24533
val_loss,2.22281


[34m[1mwandb[0m: Agent Starting Run: 23r32oup with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▂▂▃▄▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▂▁▂▄▇███
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.08748
epoch,10.0
loss,2.30227
val_accuracy,0.086
val_loss,2.30216


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 6dhho403 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▂▅▅▅▅▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▃▃▂▂▁
val_accuracy,▁▁▂▄▅▄▅▅▇█
val_loss,█▇▅▄▄▃▃▂▂▁

0,1
accuracy,0.27957
epoch,10.0
loss,2.09896
val_accuracy,0.32733
val_loss,2.06562


[34m[1mwandb[0m: Agent Starting Run: m6yi0xyi with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▂▃▄▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▂▃▄▄▅▆▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.07963
epoch,10.0
loss,2.30416
val_accuracy,0.07817
val_loss,2.30399


[34m[1mwandb[0m: Agent Starting Run: pto20h67 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▄▆█
val_loss,█▇▅▃▁

0,1
accuracy,0.11876
epoch,5.0
loss,2.29852
val_accuracy,0.11683
val_loss,2.29582


[34m[1mwandb[0m: Agent Starting Run: h7mtzwyr with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▄▃▂▂▂▁▁▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▆▄▃▂▂▂▁▁▁

0,1
accuracy,0.10017
epoch,10.0
loss,2.30237
val_accuracy,0.0985
val_loss,2.30233


[34m[1mwandb[0m: Agent Starting Run: 6sa3d3oq with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▂▃▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▄▃▂▂▁
val_accuracy,▁▁▂▃▃▄▅▆▇█
val_loss,█▇▆▅▄▄▃▂▂▁

0,1
accuracy,0.1353
epoch,10.0
loss,2.25727
val_accuracy,0.14967
val_loss,2.24832


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 03endd16 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▂▄▄▆▇▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▄▅█████
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.1168
epoch,10.0
loss,2.31869
val_accuracy,0.12367
val_loss,2.31234


[34m[1mwandb[0m: Agent Starting Run: o6dy1y2y with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▄▅▅▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▅▄▃▃▂▂▁▁
val_accuracy,▁▂▃▄▅▅▆▆▇█
val_loss,█▆▅▄▄▃▃▂▂▁

0,1
accuracy,0.51339
epoch,10.0
loss,2.18385
val_accuracy,0.55367
val_loss,2.16895


[34m[1mwandb[0m: Agent Starting Run: lck6n7cv with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▆█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▂▄▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.18128
epoch,5.0
loss,2.26759
val_accuracy,0.2045
val_loss,2.23539


[34m[1mwandb[0m: Agent Starting Run: w326jxqm with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▆█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▃▅█
val_loss,█▇▅▃▁

0,1
accuracy,0.15365
epoch,5.0
loss,2.30868
val_accuracy,0.144
val_loss,2.31204


[34m[1mwandb[0m: Agent Starting Run: dyiircfx with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁███▇▂▂▂
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▅▃▂▁▁▁▂▃
val_accuracy,██▁▁▁▂▇▇▇▇
val_loss,█▆▄▂▁▁▁▂▂▂

0,1
accuracy,0.09991
epoch,10.0
loss,2.30459
val_accuracy,0.10083
val_loss,2.30426


[34m[1mwandb[0m: Agent Starting Run: 6ptwijyj with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▃▄▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▃▅▇█
val_loss,█▆▄▃▁

0,1
accuracy,0.15985
epoch,5.0
loss,2.30121
val_accuracy,0.16183
val_loss,2.30022


[34m[1mwandb[0m: Agent Starting Run: 9rzb0gaa with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▂▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▂▁

0,1
accuracy,0.10065
epoch,5.0
loss,2.30542
val_accuracy,0.09417
val_loss,2.30533


[34m[1mwandb[0m: Agent Starting Run: ewi8sb2t with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▄▅▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▃▄▆█
val_loss,█▆▅▃▁

0,1
accuracy,0.23017
epoch,5.0
loss,2.19333
val_accuracy,0.26567
val_loss,2.15814


[34m[1mwandb[0m: Agent Starting Run: w3z74otb with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▃█▂
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▄▃▂▂▁▁▁▁
val_accuracy,▆▆▆▆▆▆██▁▁
val_loss,█▆▄▃▂▂▂▁▁▁

0,1
accuracy,0.10083
epoch,10.0
loss,2.30294
val_accuracy,0.0925
val_loss,2.30348


[34m[1mwandb[0m: Agent Starting Run: g4bdkkn5 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▂▃▄▅▆▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▂▂▁
val_accuracy,▁▂▃▄▄▅▅▆▇█
val_loss,█▇▆▆▅▄▃▂▂▁

0,1
accuracy,0.14152
epoch,10.0
loss,2.49333
val_accuracy,0.142
val_loss,2.49186


[34m[1mwandb[0m: Agent Starting Run: xfof92wb with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.09991
epoch,10.0
loss,2.31127
val_accuracy,0.10083
val_loss,2.30784


[34m[1mwandb[0m: Agent Starting Run: jho8ahgq with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▃▃▃▁█
epoch,▁▃▅▆█
loss,█▇▆▃▁
val_accuracy,▁▁▁▁█
val_loss,█▇▅▃▁

0,1
accuracy,0.09978
epoch,5.0
loss,2.42885
val_accuracy,0.11233
val_loss,2.39763


[34m[1mwandb[0m: Agent Starting Run: jqt4y5gy with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▂▂▃▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▃█▆▄▆▆▄▄▆
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.14952
epoch,10.0
loss,2.30339
val_accuracy,0.14
val_loss,2.30362


[34m[1mwandb[0m: Agent Starting Run: 2p7mlw4r with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▄▄▅▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▃▃▄▅▅▆▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.14965
epoch,10.0
loss,2.29438
val_accuracy,0.15717
val_loss,2.29317


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: uu34f9sl with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▂▂▁

0,1
accuracy,0.09944
epoch,10.0
loss,2.30997
val_accuracy,0.105
val_loss,2.30646


[34m[1mwandb[0m: Agent Starting Run: l919b6ef with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁█▄▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▅▄▂▁▁▁▁▁
val_accuracy,▁▁▂▁█▅▁▁▁▁
val_loss,█▆▄▃▂▂▂▂▂▁

0,1
accuracy,0.0997
epoch,10.0
loss,2.29754
val_accuracy,0.10267
val_loss,2.29669


[34m[1mwandb[0m: Agent Starting Run: ln7vsml3 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▅█▇
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_accuracy,▁▅█▇▅
val_loss,█▅▃▂▁

0,1
accuracy,0.2405
epoch,5.0
loss,2.27909
val_accuracy,0.187
val_loss,2.26521


[34m[1mwandb[0m: Agent Starting Run: rudx0o77 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▃▃█
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,███▁▁
val_loss,█▆▅▃▁

0,1
accuracy,0.11394
epoch,5.0
loss,2.30398
val_accuracy,0.11967
val_loss,2.30379


[34m[1mwandb[0m: Agent Starting Run: 15rf2o5s with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.10083
epoch,5.0
loss,2.32523
val_accuracy,0.0925
val_loss,2.32807


[34m[1mwandb[0m: Agent Starting Run: 4j64twtw with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▄▄▅▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▂▃▄▆▆▇▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.08146
epoch,10.0
loss,2.30558
val_accuracy,0.0785
val_loss,2.3053


[34m[1mwandb[0m: Agent Starting Run: f3bchold with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▄▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▃▅▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.10143
epoch,5.0
loss,2.32269
val_accuracy,0.1095
val_loss,2.3142


[34m[1mwandb[0m: Agent Starting Run: py37kmmt with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,▁▄▄▄█
val_loss,█▆▅▃▁

0,1
accuracy,0.07531
epoch,5.0
loss,2.30027
val_accuracy,0.07133
val_loss,2.30059


[34m[1mwandb[0m: Agent Starting Run: 60zsq5th with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▄▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁██
val_loss,█▇▅▃▁

0,1
accuracy,0.10291
epoch,5.0
loss,2.2936
val_accuracy,0.1035
val_loss,2.29443


[34m[1mwandb[0m: Agent Starting Run: az51g2q4 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▅▅▆▇▇███
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▅▅▄▃▃▂▂▁
val_accuracy,▁▃▄▅▆▆▇▇██
val_loss,█▇▆▆▅▄▄▃▂▁

0,1
accuracy,0.40087
epoch,10.0
loss,1.93174
val_accuracy,0.39417
val_loss,1.88756


[34m[1mwandb[0m: Agent Starting Run: rpl5wlg8 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▄▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▃█▆
val_loss,█▇▅▃▁

0,1
accuracy,0.10641
epoch,5.0
loss,2.30371
val_accuracy,0.10167
val_loss,2.30404


[34m[1mwandb[0m: Agent Starting Run: za61yamo with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,█████▆▆▆▃▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▅▅▄▃▂▂▁

0,1
accuracy,0.09959
epoch,10.0
loss,2.31198
val_accuracy,0.10267
val_loss,2.30835


[34m[1mwandb[0m: Agent Starting Run: ofnsq0ql with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▃▄▅█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▃██
val_loss,█▆▅▃▁

0,1
accuracy,0.0567
epoch,5.0
loss,2.30752
val_accuracy,0.0605
val_loss,2.3075


[34m[1mwandb[0m: Agent Starting Run: jn01ggf6 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▂▃▅▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▅▄▃▂▂▁
val_accuracy,▁▁▁▁▂▃▄▆▇█
val_loss,█▇▇▆▅▄▃▂▂▁

0,1
accuracy,0.32294
epoch,10.0
loss,2.25645
val_accuracy,0.35567
val_loss,2.23706


[34m[1mwandb[0m: Agent Starting Run: web4jfg9 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,█▆▆▆▆▆▆▅▄▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,███████▅▅▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.09448
epoch,10.0
loss,2.29769
val_accuracy,0.099
val_loss,2.29669


[34m[1mwandb[0m: Agent Starting Run: 0721vjkp with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▄▃▂▂▁▁▁▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▆▄▃▂▂▁▁▁▁

0,1
accuracy,0.10065
epoch,10.0
loss,2.30277
val_accuracy,0.09417
val_loss,2.30243


[34m[1mwandb[0m: Agent Starting Run: u0cbw18l with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▂▃▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▂▃▃▄▅▆▇█
val_loss,██▇▆▅▅▄▃▂▁

0,1
accuracy,0.20772
epoch,10.0
loss,2.23491
val_accuracy,0.21067
val_loss,2.22601


[34m[1mwandb[0m: Agent Starting Run: lmuk7vos with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▄▆█
epoch,▁▃▅▆█
loss,█▆▄▂▁
val_accuracy,▁▃▄▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.07311
epoch,5.0
loss,2.32921
val_accuracy,0.08233
val_loss,2.31893


[34m[1mwandb[0m: Agent Starting Run: 49o9zcor with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10083
epoch,10.0
loss,2.60183
val_accuracy,0.0925
val_loss,2.60519


[34m[1mwandb[0m: Agent Starting Run: 6qp0tu3e with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▄▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▂▄▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.0983
epoch,5.0
loss,2.30134
val_accuracy,0.10333
val_loss,2.30116


[34m[1mwandb[0m: Agent Starting Run: lep0yjkc with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▄▅▅▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▄▄▅▆▆▇██
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.13478
epoch,10.0
loss,2.30335
val_accuracy,0.13783
val_loss,2.30249


[34m[1mwandb[0m: Agent Starting Run: ad5grvmi with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▅▇██▆▅▄
epoch,▁▂▃▃▄▅▆▆▇█
loss,███▇▇▆▅▄▃▁
val_accuracy,▁▂▅▇██▆▅▄▃
val_loss,██▇▇▇▆▅▄▃▁

0,1
accuracy,0.1645
epoch,10.0
loss,2.23632
val_accuracy,0.15617
val_loss,2.21086


[34m[1mwandb[0m: Agent Starting Run: 0i1sngbm with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▂▄█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▂█
val_loss,█▇▅▃▁

0,1
accuracy,0.05257
epoch,5.0
loss,2.30301
val_accuracy,0.05433
val_loss,2.30252


[34m[1mwandb[0m: Agent Starting Run: vjtmvglv with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▅▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▆▆▁▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.09931
epoch,5.0
loss,2.31045
val_accuracy,0.1015
val_loss,2.30945


[34m[1mwandb[0m: Agent Starting Run: y8m3eq6y with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▃▄▆▇▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▇▅▄▃▃▂▂▁
val_accuracy,▁▁▂▄▅▅▅▆▆█
val_loss,█▇▆▅▄▄▃▂▂▁

0,1
accuracy,0.21352
epoch,10.0
loss,2.15057
val_accuracy,0.23267
val_loss,2.12467


[34m[1mwandb[0m: Agent Starting Run: 61x8zoda with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▄▃▂▂▁▁▁▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▅▄▃▂▂▁▁▁▁

0,1
accuracy,0.09939
epoch,10.0
loss,2.30222
val_accuracy,0.1055
val_loss,2.30193


[34m[1mwandb[0m: Agent Starting Run: fz9xxt96 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▄▅▆▇▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▇▆▅▅▄▃▂▁
val_accuracy,▁▂▃▅▅▆▆▇▇█
val_loss,█▇▇▆▅▅▄▃▂▁

0,1
accuracy,0.4242
epoch,10.0
loss,2.00598
val_accuracy,0.47067
val_loss,1.94933


[34m[1mwandb[0m: Agent Starting Run: zdzzoo6y with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▅▃▁

0,1
accuracy,0.0997
epoch,5.0
loss,2.31138
val_accuracy,0.10267
val_loss,2.3111


[34m[1mwandb[0m: Agent Starting Run: f40x8j19 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▅▁▅█
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,▁▁▁▅█
val_loss,█▆▄▃▁

0,1
accuracy,0.04602
epoch,5.0
loss,2.30478
val_accuracy,0.0405
val_loss,2.30501


[34m[1mwandb[0m: Agent Starting Run: s28zbhyj with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▂▂▃▄▅▆▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▂▂▃▃▃▄▅▆█
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.1423
epoch,10.0
loss,2.30373
val_accuracy,0.143
val_loss,2.3034


[34m[1mwandb[0m: Agent Starting Run: igkgv7at with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▄▇█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▅▅▅▁█
val_loss,█▇▅▃▁

0,1
accuracy,0.10004
epoch,5.0
loss,2.38214
val_accuracy,0.10267
val_loss,2.38296


[34m[1mwandb[0m: Agent Starting Run: 5npqhaec with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.10083
epoch,5.0
loss,2.31867
val_accuracy,0.0925
val_loss,2.32073


[34m[1mwandb[0m: Agent Starting Run: wl9pl8s6 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▂▃▃▄▅▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▄▃▂▂▁
val_accuracy,▁▁▂▂▃▃▄▅▆█
val_loss,█▇▆▅▄▄▃▂▂▁

0,1
accuracy,0.11254
epoch,10.0
loss,2.25838
val_accuracy,0.11733
val_loss,2.24752


[34m[1mwandb[0m: Agent Starting Run: zdss3f92 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▃▄▄▅▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▄▃▂▂▁
val_accuracy,▁▂▃▃▄▅▆▇▇█
val_loss,█▇▆▅▄▄▃▂▂▁

0,1
accuracy,0.33022
epoch,10.0
loss,2.03838
val_accuracy,0.3615
val_loss,1.98445


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: flxbqme3 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▂▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▂▁

0,1
accuracy,0.10017
epoch,5.0
loss,2.31138
val_accuracy,0.0985
val_loss,2.30884


[34m[1mwandb[0m: Agent Starting Run: d325jv7o with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,████▁
val_loss,█▆▄▂▁

0,1
accuracy,0.09991
epoch,5.0
loss,2.3045
val_accuracy,0.10033
val_loss,2.30345


[34m[1mwandb[0m: Agent Starting Run: 4laje0xr with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▆▆▅▄▃▂▁

0,1
accuracy,0.0997
epoch,10.0
loss,2.47877
val_accuracy,0.10267
val_loss,2.47365


[34m[1mwandb[0m: Agent Starting Run: cmw24t6c with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▂▃▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▄▃▂▂▁
val_accuracy,▁▂▂▃▃▄▅▆▇█
val_loss,█▇▆▅▄▄▃▂▂▁

0,1
accuracy,0.09246
epoch,10.0
loss,2.37913
val_accuracy,0.09633
val_loss,2.3699


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 8oc2e7hw with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▂▃▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▆▆█▄▄▄▃▂▂▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.115
epoch,10.0
loss,2.29645
val_accuracy,0.11833
val_loss,2.29592


[34m[1mwandb[0m: Agent Starting Run: dkwcc77a with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▅▅▅▅█▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▃▁▁▂▃▄▃▂
val_accuracy,▄▄▄▁██████
val_loss,█▄▂▁▃▅▅▄▂▁

0,1
accuracy,0.0997
epoch,10.0
loss,2.30645
val_accuracy,0.10267
val_loss,2.30255


[34m[1mwandb[0m: Agent Starting Run: v94y1t98 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▂▃▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▆▅▄▄▃▂▂▁
val_accuracy,▁▁▂▃▄▅▆▇██
val_loss,█▇▆▅▅▄▃▃▂▁

0,1
accuracy,0.60554
epoch,10.0
loss,1.701
val_accuracy,0.635
val_loss,1.62511


[34m[1mwandb[0m: Agent Starting Run: mhz4ee4p with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▂▃▄▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▂▃▃▅▆▇██
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.16983
epoch,10.0
loss,2.30101
val_accuracy,0.17333
val_loss,2.30075


[34m[1mwandb[0m: Agent Starting Run: pa95wigi with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▃▅█
val_loss,█▇▅▃▁

0,1
accuracy,0.08394
epoch,5.0
loss,2.30333
val_accuracy,0.0985
val_loss,2.30068


[34m[1mwandb[0m: Agent Starting Run: 19fnf5hz with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▅▇█
epoch,▁▃▅▆█
loss,█▅▄▃▁
val_accuracy,▁▄▆▇█
val_loss,█▆▅▃▁

0,1
accuracy,0.28394
epoch,5.0
loss,2.18665
val_accuracy,0.30217
val_loss,2.12691


[34m[1mwandb[0m: Agent Starting Run: 1f1dzjh8 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▅▄▃▃▂▂▁▁
val_accuracy,▁▁▁▁▁▁▁▁▁█
val_loss,█▇▅▄▃▃▂▂▁▁

0,1
accuracy,0.09996
epoch,10.0
loss,2.30505
val_accuracy,0.1005
val_loss,2.3047


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 6tyiek5q with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▃▄█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁█▁
val_loss,█▇▅▃▁

0,1
accuracy,0.08685
epoch,5.0
loss,2.30258
val_accuracy,0.0895
val_loss,2.30246


[34m[1mwandb[0m: Agent Starting Run: 6h0y0e4c with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁█▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▄▃▃▃▃▃▃▂▁
val_accuracy,▁▁▂▄▁▁▁▁▁█
val_loss,█▅▅▅▆▆▅▃▂▁

0,1
accuracy,0.10031
epoch,10.0
loss,2.23951
val_accuracy,0.26583
val_loss,2.2161


[34m[1mwandb[0m: Agent Starting Run: fkb3a8ko with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09965
epoch,10.0
loss,2.39903
val_accuracy,0.10317
val_loss,2.39087


[34m[1mwandb[0m: Agent Starting Run: 58rzbtt8 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▇▆▅▄▃▂▂▁

0,1
accuracy,0.09965
epoch,10.0
loss,2.30099
val_accuracy,0.10317
val_loss,2.29925


[34m[1mwandb[0m: Agent Starting Run: ae7uvjok with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▃▄▆▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▅▄▃▂▂▁
val_accuracy,▁▂▃▄▅▆▆▇▇█
val_loss,█▇▆▅▄▄▃▂▂▁

0,1
accuracy,0.25087
epoch,10.0
loss,2.1205
val_accuracy,0.27717
val_loss,2.08663


[34m[1mwandb[0m: Agent Starting Run: 5kvvyrhj with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▂▁▄▆▆▆▇█▇▆
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▅▅▁▅▅▅▅▅█
val_loss,█▇▆▆▅▄▃▂▂▁

0,1
accuracy,0.11048
epoch,10.0
loss,2.30255
val_accuracy,0.102
val_loss,2.30266


[34m[1mwandb[0m: Agent Starting Run: ctmmr32p with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▂▂▁

0,1
accuracy,0.1003
epoch,10.0
loss,2.30838
val_accuracy,0.09733
val_loss,2.31024


[34m[1mwandb[0m: Agent Starting Run: vohb9j2m with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▆█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▃▄█
val_loss,█▇▅▃▁

0,1
accuracy,0.10904
epoch,5.0
loss,2.27127
val_accuracy,0.102
val_loss,2.27101


[34m[1mwandb[0m: Agent Starting Run: hjc79skt with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.09944
epoch,5.0
loss,2.30626
val_accuracy,0.105
val_loss,2.30379


[34m[1mwandb[0m: Agent Starting Run: 0shcmlcq with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.09996
epoch,5.0
loss,2.35308
val_accuracy,0.10033
val_loss,2.33348


[34m[1mwandb[0m: Agent Starting Run: bseftwnj with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▅▅▄▃▂▂▁

0,1
accuracy,0.10065
epoch,10.0
loss,2.3193
val_accuracy,0.09417
val_loss,2.32157


[34m[1mwandb[0m: Agent Starting Run: jgdh7d4n with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▄▄▅█▁
epoch,▁▃▅▆█
loss,█▄▁▁▂
val_accuracy,▅▁█▂▇
val_loss,█▂▁▃▄

0,1
accuracy,0.09352
epoch,5.0
loss,2.32423
val_accuracy,0.10517
val_loss,2.33496


[34m[1mwandb[0m: Agent Starting Run: i4ry8662 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▄▅▅▆▆▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▄▃▂▂▁
val_accuracy,▁▃▄▅▅▆▆▇▇█
val_loss,█▇▆▅▄▄▃▂▂▁

0,1
accuracy,0.16085
epoch,10.0
loss,2.25609
val_accuracy,0.17017
val_loss,2.24303


[34m[1mwandb[0m: Agent Starting Run: ntf9z574 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▄▄▆█
val_loss,█▇▅▃▁

0,1
accuracy,0.14506
epoch,5.0
loss,2.30237
val_accuracy,0.13933
val_loss,2.30257


[34m[1mwandb[0m: Agent Starting Run: 6ozd831w with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▅██
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁████
val_loss,█▆▄▃▁

0,1
accuracy,0.09937
epoch,5.0
loss,2.36002
val_accuracy,0.1055
val_loss,2.35354


[34m[1mwandb[0m: Agent Starting Run: 0p2dryce with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▃▅▇████▇▇
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▇▆▅▅▄▃▂▁
val_accuracy,▁▄▆▇███▇▇▆
val_loss,█▇▇▆▅▅▄▃▂▁

0,1
accuracy,0.19507
epoch,10.0
loss,2.27804
val_accuracy,0.19083
val_loss,2.27417


[34m[1mwandb[0m: Agent Starting Run: n48owapa with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.09939
epoch,5.0
loss,2.49225
val_accuracy,0.1055
val_loss,2.48642


[34m[1mwandb[0m: Agent Starting Run: 2m1w4u2f with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.09944
epoch,10.0
loss,2.53046
val_accuracy,0.105
val_loss,2.51899


[34m[1mwandb[0m: Agent Starting Run: 3wxn40xr with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,████▁▅▅▅▅▅
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▃▁▁▂▃▄▃▂
val_accuracy,▁▁▁█▄▄▄▄▄▄
val_loss,█▄▁▁▃▅▅▅▃▁

0,1
accuracy,0.1003
epoch,10.0
loss,2.30563
val_accuracy,0.09733
val_loss,2.30269


[34m[1mwandb[0m: Agent Starting Run: rxxnm8j4 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_accuracy,▁▁▁▁▁
val_loss,█▅▃▂▁

0,1
accuracy,0.1003
epoch,5.0
loss,2.30722
val_accuracy,0.09733
val_loss,2.30624


[34m[1mwandb[0m: Agent Starting Run: 4friwbsn with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.09944
epoch,5.0
loss,2.7269
val_accuracy,0.105
val_loss,2.72336


[34m[1mwandb[0m: Agent Starting Run: qdjpprix with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▆█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▃▅█
val_loss,█▇▅▃▁

0,1
accuracy,0.0688
epoch,5.0
loss,2.34191
val_accuracy,0.072
val_loss,2.33563


[34m[1mwandb[0m: Agent Starting Run: tqpivo6q with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁█
epoch,▁▃▅▆█
loss,█▅▂▁▂
val_accuracy,▂▁▁█▁
val_loss,█▃▁▂▄

0,1
accuracy,0.16493
epoch,5.0
loss,2.31106
val_accuracy,0.0985
val_loss,2.33691


[34m[1mwandb[0m: Agent Starting Run: ci25mtj2 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▄▆█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▃▅▇█
val_loss,█▇▅▃▁

0,1
accuracy,0.1573
epoch,5.0
loss,2.38421
val_accuracy,0.1745
val_loss,2.3445


[34m[1mwandb[0m: Agent Starting Run: o5dn89p4 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09939
epoch,10.0
loss,2.32301
val_accuracy,0.1055
val_loss,2.31517


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: m769bda4 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10083
epoch,10.0
loss,2.41884
val_accuracy,0.0925
val_loss,2.42072


[34m[1mwandb[0m: Agent Starting Run: r8xjofpm with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▄▅█
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_accuracy,▁▃▄▆█
val_loss,█▅▃▂▁

0,1
accuracy,0.21872
epoch,5.0
loss,2.22774
val_accuracy,0.28067
val_loss,2.20789


[34m[1mwandb[0m: Agent Starting Run: qhzquupq with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▄▅▆▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▅▄▄▃▂▁
val_accuracy,▁▂▃▄▅▆▆▇▇█
val_loss,█▇▇▆▅▄▄▃▂▁

0,1
accuracy,0.209
epoch,10.0
loss,2.21827
val_accuracy,0.2225
val_loss,2.20069


[34m[1mwandb[0m: Agent Starting Run: d0g1vk4v with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▂█
epoch,▁▃▅▆█
loss,█▆▄▂▁
val_accuracy,▁▁▁▂█
val_loss,█▅▃▁▁

0,1
accuracy,0.11285
epoch,5.0
loss,2.28693
val_accuracy,0.23967
val_loss,2.28029


[34m[1mwandb[0m: Agent Starting Run: 1gz875l1 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▄▅█
val_loss,█▇▅▃▁

0,1
accuracy,0.0838
epoch,5.0
loss,2.3084
val_accuracy,0.09117
val_loss,2.30726


[34m[1mwandb[0m: Agent Starting Run: 4k7ks1wa with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▃▄▅█
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,▁▂▄▅█
val_loss,█▆▅▃▁

0,1
accuracy,0.11963
epoch,5.0
loss,2.30482
val_accuracy,0.1155
val_loss,2.30531


[34m[1mwandb[0m: Agent Starting Run: sy4kp1ep with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▄▆▇█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▃▂█▂
val_loss,█▆▄▃▁

0,1
accuracy,0.11569
epoch,5.0
loss,2.31072
val_accuracy,0.1175
val_loss,2.30449


[34m[1mwandb[0m: Agent Starting Run: q8a76q0g with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▄▅▆▇▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▃▄▅▆▇▇██
val_loss,█▇▇▆▅▄▄▃▂▁

0,1
accuracy,0.49137
epoch,10.0
loss,1.74104
val_accuracy,0.52483
val_loss,1.65459


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: lmwvtb1t with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▂▂▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▂▄▄▄▅▆▇█
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09937
epoch,10.0
loss,2.35361
val_accuracy,0.10633
val_loss,2.3407


[34m[1mwandb[0m: Agent Starting Run: oy9ygte8 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▅▆█
val_loss,█▇▅▃▁

0,1
accuracy,0.14059
epoch,5.0
loss,2.30157
val_accuracy,0.14217
val_loss,2.30175


[34m[1mwandb[0m: Agent Starting Run: ews780q2 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▅▇█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,█▁▁██
val_loss,█▆▅▃▁

0,1
accuracy,0.12009
epoch,5.0
loss,2.30366
val_accuracy,0.11883
val_loss,2.3037


[34m[1mwandb[0m: Agent Starting Run: rmp9kb8o with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▄▆█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▅▇█
val_loss,█▇▅▃▁

0,1
accuracy,0.21722
epoch,5.0
loss,2.28808
val_accuracy,0.23483
val_loss,2.28107


[34m[1mwandb[0m: Agent Starting Run: il326kl5 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.09944
epoch,5.0
loss,2.39012
val_accuracy,0.105
val_loss,2.38191


[34m[1mwandb[0m: Agent Starting Run: kmqqry5o with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▂▁█▇▇▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▄▂▂▂▂▂▂▁
val_accuracy,▁▁▁▁▅▄▄▄▅█
val_loss,█▅▄▃▃▃▃▃▂▁

0,1
accuracy,0.22319
epoch,10.0
loss,2.27549
val_accuracy,0.307
val_loss,2.26303


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: du1iekzd with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁█▄
epoch,▁▃▅▆█
loss,█▆▃▁▁
val_accuracy,▁▁█▄▁
val_loss,█▄▂▁▂

0,1
accuracy,0.13561
epoch,5.0
loss,2.29475
val_accuracy,0.10083
val_loss,2.29683


[34m[1mwandb[0m: Agent Starting Run: okxtcgrs with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▃▄▆▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▅▅▄▃▂▁
val_accuracy,▁▁▂▄▅▆▆▇▇█
val_loss,█▇▇▆▅▄▃▃▂▁

0,1
accuracy,0.32994
epoch,10.0
loss,2.11417
val_accuracy,0.35067
val_loss,2.08423


[34m[1mwandb[0m: Agent Starting Run: iyixvx7h with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▄▆█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▂▁▂▅█
val_loss,█▇▅▃▁

0,1
accuracy,0.10157
epoch,5.0
loss,2.36916
val_accuracy,0.10983
val_loss,2.35885


[34m[1mwandb[0m: Agent Starting Run: 08gw702h with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.10065
epoch,10.0
loss,2.32974
val_accuracy,0.09417
val_loss,2.33331


[34m[1mwandb[0m: Agent Starting Run: wjsjqplk with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▃▂▂▁▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▅▄▃▃▂▁▁

0,1
accuracy,0.09944
epoch,10.0
loss,2.30267
val_accuracy,0.105
val_loss,2.30247


[34m[1mwandb[0m: Agent Starting Run: 0oivb06z with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▄▄▅▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▃▄▅▅▆▆▇▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.19541
epoch,10.0
loss,2.30128
val_accuracy,0.20267
val_loss,2.30114


[34m[1mwandb[0m: Agent Starting Run: g9p4lp5z with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.09991
epoch,5.0
loss,2.366
val_accuracy,0.10083
val_loss,2.367


[34m[1mwandb[0m: Agent Starting Run: l8gpywag with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▅██▆
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▇█▆▁
val_loss,█▇▅▃▁

0,1
accuracy,0.17196
epoch,5.0
loss,2.28294
val_accuracy,0.16433
val_loss,2.27417


[34m[1mwandb[0m: Agent Starting Run: 5luubclo with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▂▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▃▂▂▁▁
val_accuracy,▁▁▁▁▁▁▂▆██
val_loss,█▇▆▄▃▂▂▁▁▁

0,1
accuracy,0.19744
epoch,10.0
loss,2.29351
val_accuracy,0.19467
val_loss,2.29155


[34m[1mwandb[0m: Agent Starting Run: u04dpdar with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▄▆█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▁███
val_loss,█▆▄▃▁

0,1
accuracy,0.12554
epoch,5.0
loss,2.30201
val_accuracy,0.133
val_loss,2.30204


[34m[1mwandb[0m: Agent Starting Run: 34ytq6sz with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁█▁
epoch,▁▃▅▆█
loss,█▅▂▁▂
val_accuracy,▁▁█▂▁
val_loss,█▃▁▂▃

0,1
accuracy,0.09956
epoch,5.0
loss,2.30636
val_accuracy,0.10267
val_loss,2.30926


[34m[1mwandb[0m: Agent Starting Run: 4of5ohla with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▄▅▆▆▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▃▄▅▆▇▇██
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.14956
epoch,10.0
loss,2.28694
val_accuracy,0.157
val_loss,2.2833


[34m[1mwandb[0m: Agent Starting Run: 2nvo3ahx with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▂▃▄▅▆▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▃▃▄▅▅▆▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.14561
epoch,10.0
loss,2.30179
val_accuracy,0.14383
val_loss,2.30166


[34m[1mwandb[0m: Agent Starting Run: qihj1hbg with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▃▄▅▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▅▄▃▃▂▁
val_accuracy,▁▂▂▃▄▅▆▆▇█
val_loss,█▇▆▅▅▄▃▃▂▁

0,1
accuracy,0.3155
epoch,10.0
loss,2.13003
val_accuracy,0.35167
val_loss,2.09621


[34m[1mwandb[0m: Agent Starting Run: o21v8yih with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▅▄▄▃▂▂▁

0,1
accuracy,0.1003
epoch,10.0
loss,2.39445
val_accuracy,0.09733
val_loss,2.39334


[34m[1mwandb[0m: Agent Starting Run: zkqp1syz with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▆█▇▃▁
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▅▅▂▁█
val_loss,█▇▅▃▁

0,1
accuracy,0.11922
epoch,5.0
loss,2.24291
val_accuracy,0.1575
val_loss,2.21512


[34m[1mwandb[0m: Agent Starting Run: 0yyfou01 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▂▂▃▃▄▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▂▂▃▃▃▄▅▇█
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.08948
epoch,10.0
loss,2.30246
val_accuracy,0.09483
val_loss,2.30244


[34m[1mwandb[0m: Agent Starting Run: t6zh9uyq with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▆▆▆█▆▁███▆
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▅▅▅██▅▅▅▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.11128
epoch,10.0
loss,2.30455
val_accuracy,0.11517
val_loss,2.30427


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 2iyvjz2b with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▅▅▄▃▂▂▁

0,1
accuracy,0.09991
epoch,10.0
loss,2.31531
val_accuracy,0.10083
val_loss,2.3135


[34m[1mwandb[0m: Agent Starting Run: 4ub5i4ka with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▂▄▅▅▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▂▂▂▁▄▇▇▇█▇
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.128
epoch,10.0
loss,2.29332
val_accuracy,0.127
val_loss,2.29343


[34m[1mwandb[0m: Agent Starting Run: 8ziixwpw with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▅▃▁

0,1
accuracy,0.10065
epoch,5.0
loss,2.46885
val_accuracy,0.09417
val_loss,2.42611


[34m[1mwandb[0m: Agent Starting Run: pyjxglwt with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.1003
epoch,10.0
loss,2.36533
val_accuracy,0.09733
val_loss,2.37051


[34m[1mwandb[0m: Agent Starting Run: 090rwi49 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▅▇█
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,▁▃▅▇█
val_loss,█▆▅▃▁

0,1
accuracy,0.54583
epoch,5.0
loss,1.68857
val_accuracy,0.60017
val_loss,1.46729


[34m[1mwandb[0m: Agent Starting Run: tc0dkax5 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▃▂▃▃▄▅▆██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▃▅▆▆▅▆▅▆█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.13774
epoch,10.0
loss,2.30636
val_accuracy,0.13583
val_loss,2.30786


[34m[1mwandb[0m: Agent Starting Run: wq1l2f36 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▇▆▅▄▃▂▂▁

0,1
accuracy,0.1003
epoch,10.0
loss,2.30204
val_accuracy,0.09733
val_loss,2.30023


[34m[1mwandb[0m: Agent Starting Run: szq800mg with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▄▅▆▇███
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▂▂▃▂▅▅▆██
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.11119
epoch,10.0
loss,2.30152
val_accuracy,0.10617
val_loss,2.30137


[34m[1mwandb[0m: Agent Starting Run: zydigo8h with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,████▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10059
epoch,10.0
loss,2.30929
val_accuracy,0.09433
val_loss,2.30961


[34m[1mwandb[0m: Agent Starting Run: hvut1nrg with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▅▅▄▃▂▂▁

0,1
accuracy,0.09965
epoch,10.0
loss,2.39122
val_accuracy,0.10317
val_loss,2.38736


[34m[1mwandb[0m: Agent Starting Run: wkyiskec with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▅▄▄▃▂▂▁

0,1
accuracy,0.10017
epoch,10.0
loss,2.40202
val_accuracy,0.0985
val_loss,2.40145


[34m[1mwandb[0m: Agent Starting Run: 9q1pcvg0 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▂▃▅█
val_loss,█▇▅▃▁

0,1
accuracy,0.28941
epoch,5.0
loss,1.83572
val_accuracy,0.46617
val_loss,1.6426


[34m[1mwandb[0m: Agent Starting Run: 6f8rah6v with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▃▅▆▇▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▇▆▅▄▃▃▂▁
val_accuracy,▁▁▂▄▅▅▆▆▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.31091
epoch,10.0
loss,1.89682
val_accuracy,0.34883
val_loss,1.8381


[34m[1mwandb[0m: Agent Starting Run: 15djhcla with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▂▅▇█████
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▅▄▃▂▂▂▁▁
val_accuracy,▁▁▄▇██████
val_loss,█▆▅▄▃▃▂▂▁▁

0,1
accuracy,0.1947
epoch,10.0
loss,2.2945
val_accuracy,0.19917
val_loss,2.29371


[34m[1mwandb[0m: Agent Starting Run: qhrit0ud with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▁▁▁█
val_loss,█▆▄▂▁

0,1
accuracy,0.10065
epoch,5.0
loss,2.30106
val_accuracy,0.20567
val_loss,2.29954


[34m[1mwandb[0m: Agent Starting Run: biozhbz1 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁█▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▅▃▂▁▁▁▂▃
val_accuracy,▂▂▂▂▂█▁▁▁▁
val_loss,▆▄▂▁▁▂▄▆▇█

0,1
accuracy,0.10065
epoch,10.0
loss,2.30448
val_accuracy,0.09417
val_loss,2.30739


[34m[1mwandb[0m: Agent Starting Run: nq1yjoxd with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▁▁▁█
val_loss,█▆▄▂▁

0,1
accuracy,0.10259
epoch,5.0
loss,2.30261
val_accuracy,0.1705
val_loss,2.29999


[34m[1mwandb[0m: Agent Starting Run: 6d3s1wia with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10017
epoch,10.0
loss,2.31429
val_accuracy,0.0985
val_loss,2.31667


[34m[1mwandb[0m: Agent Starting Run: nqjo10ks with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▄▅▅▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▅▄▃▂▂▁
val_accuracy,▁▂▃▄▅▆▆▇██
val_loss,█▇▆▅▅▄▃▂▂▁

0,1
accuracy,0.11413
epoch,10.0
loss,2.27695
val_accuracy,0.11983
val_loss,2.26379


[34m[1mwandb[0m: Agent Starting Run: qhv61ra4 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▅█
epoch,▁▃▅▆█
loss,█▆▃▁▁
val_accuracy,▁▁▆█▁
val_loss,█▄▁▁▂

0,1
accuracy,0.17972
epoch,5.0
loss,2.29672
val_accuracy,0.10267
val_loss,2.30236


[34m[1mwandb[0m: Agent Starting Run: 05cdhe1g with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▄▆█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▃▅▆█
val_loss,█▇▅▃▁

0,1
accuracy,0.24361
epoch,5.0
loss,2.29023
val_accuracy,0.261
val_loss,2.28631


[34m[1mwandb[0m: Agent Starting Run: 0r8xs6z6 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▃▅█
val_loss,█▇▅▃▁

0,1
accuracy,0.07183
epoch,5.0
loss,2.29633
val_accuracy,0.07483
val_loss,2.29299


[34m[1mwandb[0m: Agent Starting Run: 0anh7d1o with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▃▃▂▁▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▅▄▃▃▂▁▁

0,1
accuracy,0.09996
epoch,10.0
loss,2.40744
val_accuracy,0.10033
val_loss,2.3868


[34m[1mwandb[0m: Agent Starting Run: pszvcp65 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,█▇▄▂▁
epoch,▁▃▅▆█
loss,█▇▆▃▁
val_accuracy,█▅▂▃▁
val_loss,█▇▅▃▁

0,1
accuracy,0.13731
epoch,5.0
loss,2.31298
val_accuracy,0.13567
val_loss,2.3005


[34m[1mwandb[0m: Agent Starting Run: dd5f3gap with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▄▆█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▂▃█
val_loss,█▇▅▃▁

0,1
accuracy,0.10748
epoch,5.0
loss,2.33518
val_accuracy,0.11117
val_loss,2.33179


[34m[1mwandb[0m: Agent Starting Run: g1xwefwi with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.09939
epoch,5.0
loss,2.30904
val_accuracy,0.1055
val_loss,2.30904


[34m[1mwandb[0m: Agent Starting Run: pqq0e5qh with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▆▇▆▆▇▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▅▄▃▃▂▂▁▁
val_accuracy,▁▅▆▅▅▇▇▇██
val_loss,█▆▅▄▄▃▂▂▁▁

0,1
accuracy,0.24078
epoch,10.0
loss,2.18791
val_accuracy,0.25217
val_loss,2.17539


[34m[1mwandb[0m: Agent Starting Run: imnn2l7w with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▅▇█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▃▆██
val_loss,█▇▅▃▁

0,1
accuracy,0.53711
epoch,5.0
loss,1.69361
val_accuracy,0.55683
val_loss,1.46211


[34m[1mwandb[0m: Agent Starting Run: 0kmh4383 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▂▅▆▇▇▄▁▁█▇
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▅▇▄▄▁▇█▇█▇
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.09276
epoch,10.0
loss,2.30629
val_accuracy,0.08817
val_loss,2.3064


[34m[1mwandb[0m: Agent Starting Run: 278m9812 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁█▆▂
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▅▄▃▂▂▁
val_accuracy,▂▂▂▂▂▂█▅▂▁
val_loss,█▇▆▅▄▄▃▂▁▁

0,1
accuracy,0.10402
epoch,10.0
loss,2.30619
val_accuracy,0.1035
val_loss,2.29389


[34m[1mwandb[0m: Agent Starting Run: 5yyhlfhw with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.0997
epoch,10.0
loss,2.31469
val_accuracy,0.10267
val_loss,2.31063


[34m[1mwandb[0m: Agent Starting Run: i7gwr3by with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▂▂▃▄▅▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▂▂▃▃▄▅▆█
val_loss,██▇▆▆▅▄▃▂▁

0,1
accuracy,0.12715
epoch,10.0
loss,2.27237
val_accuracy,0.13783
val_loss,2.26271


[34m[1mwandb[0m: Agent Starting Run: 3aoju6iv with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.09944
epoch,5.0
loss,2.33392
val_accuracy,0.105
val_loss,2.33322


[34m[1mwandb[0m: Agent Starting Run: edmhc65h with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▆█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▄▆█
val_loss,█▇▅▃▁

0,1
accuracy,0.13861
epoch,5.0
loss,2.30184
val_accuracy,0.15433
val_loss,2.30141


[34m[1mwandb[0m: Agent Starting Run: gvgh3oct with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▃▄▆█
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,▁▂▅▅█
val_loss,█▆▄▃▁

0,1
accuracy,0.08411
epoch,5.0
loss,2.30157
val_accuracy,0.08317
val_loss,2.30147


[34m[1mwandb[0m: Agent Starting Run: m8xca9rs with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▅▅▄▃▂▂▁

0,1
accuracy,0.09996
epoch,10.0
loss,2.322
val_accuracy,0.10033
val_loss,2.32327


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: ecf6mhkd with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▁▁▁█
val_loss,█▆▄▂▁

0,1
accuracy,0.09996
epoch,5.0
loss,2.30263
val_accuracy,0.18733
val_loss,2.3009


[34m[1mwandb[0m: Agent Starting Run: k9cvmx3d with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09939
epoch,10.0
loss,2.40269
val_accuracy,0.1055
val_loss,2.39509


[34m[1mwandb[0m: Agent Starting Run: q83qteq2 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▅▃▁

0,1
accuracy,0.09939
epoch,5.0
loss,2.31433
val_accuracy,0.1055
val_loss,2.31448


[34m[1mwandb[0m: Agent Starting Run: oxwkjtcs with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▃▃▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,██████▅▅▅▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09943
epoch,10.0
loss,2.3129
val_accuracy,0.10433
val_loss,2.31046


[34m[1mwandb[0m: Agent Starting Run: pg5vtl87 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁█▁
epoch,▁▃▅▆█
loss,█▄▁▁▂
val_accuracy,▁▂█▂▂
val_loss,█▂▁▃▅

0,1
accuracy,0.09944
epoch,5.0
loss,2.35062
val_accuracy,0.105
val_loss,2.37523


[34m[1mwandb[0m: Agent Starting Run: spngvw3g with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▄▅▆▆▆▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▅▅▄▄▃▂▂▁
val_accuracy,▁▃▄▄▅▅▅▆▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.42611
epoch,10.0
loss,1.74505
val_accuracy,0.47483
val_loss,1.67909


[34m[1mwandb[0m: Agent Starting Run: 9z6uxrsj with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.0997
epoch,5.0
loss,2.47275
val_accuracy,0.10267
val_loss,2.46062


[34m[1mwandb[0m: Agent Starting Run: jrhtbw8l with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.09944
epoch,5.0
loss,2.4907
val_accuracy,0.105
val_loss,2.47497


[34m[1mwandb[0m: Agent Starting Run: b25xarjf with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.09939
epoch,10.0
loss,2.4346
val_accuracy,0.1055
val_loss,2.43541


[34m[1mwandb[0m: Agent Starting Run: 24lokh6n with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▄▆█
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,▁▄▇██
val_loss,█▆▄▃▁

0,1
accuracy,0.17602
epoch,5.0
loss,2.30239
val_accuracy,0.18267
val_loss,2.30236


[34m[1mwandb[0m: Agent Starting Run: tag81cjl with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂█▅▁
epoch,▁▃▅▆█
loss,█▃▁▁▁
val_accuracy,▂█▅▁▅
val_loss,█▁▁▂▂

0,1
accuracy,0.10509
epoch,5.0
loss,2.28316
val_accuracy,0.183
val_loss,2.29116


[34m[1mwandb[0m: Agent Starting Run: x78mgoll with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▄▅▆▇▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▃▁▂▅▅▅▅▇▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10365
epoch,10.0
loss,2.29493
val_accuracy,0.10467
val_loss,2.29547


[34m[1mwandb[0m: Agent Starting Run: ronphe3a with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▄▅▅▆▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▃▃▄▅▅▇██
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.1135
epoch,10.0
loss,2.34235
val_accuracy,0.11783
val_loss,2.34444


[34m[1mwandb[0m: Agent Starting Run: 5g6h5880 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▄▆█
val_loss,█▇▅▃▁

0,1
accuracy,0.12998
epoch,5.0
loss,2.24569
val_accuracy,0.161
val_loss,2.21921


[34m[1mwandb[0m: Agent Starting Run: tdkv0jxy with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.10017
epoch,5.0
loss,2.44301
val_accuracy,0.0985
val_loss,2.45599


[34m[1mwandb[0m: Agent Starting Run: s1hjv78m with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▄▄▅▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▂▃▃▄▄▆▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.11604
epoch,10.0
loss,2.30285
val_accuracy,0.1135
val_loss,2.30363


[34m[1mwandb[0m: Agent Starting Run: mx24xflv with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▃▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▅▄▃▃▂▂▁

0,1
accuracy,0.09939
epoch,10.0
loss,2.38607
val_accuracy,0.1055
val_loss,2.36982


[34m[1mwandb[0m: Agent Starting Run: 5apus2ny with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09991
epoch,10.0
loss,2.3111
val_accuracy,0.10083
val_loss,2.31158


[34m[1mwandb[0m: Agent Starting Run: bzap3i4v with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▂▃▃▄▆███
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▂▃▃▄▆██▇█
val_loss,██▇▆▆▄▃▂▂▁

0,1
accuracy,0.59561
epoch,10.0
loss,1.11034
val_accuracy,0.6465
val_loss,0.9814


[34m[1mwandb[0m: Agent Starting Run: 7j0e07wo with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▅▆█
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,▁▁▁▁█
val_loss,█▆▄▃▁

0,1
accuracy,0.09211
epoch,5.0
loss,2.30356
val_accuracy,0.091
val_loss,2.30402


[34m[1mwandb[0m: Agent Starting Run: tmt4cybs with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▅▅▄▃▂▂▁

0,1
accuracy,0.0997
epoch,10.0
loss,2.31043
val_accuracy,0.10267
val_loss,2.31066


[34m[1mwandb[0m: Agent Starting Run: vjekeztt with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▃▃▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▂▃▃▄▅▆▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.17007
epoch,10.0
loss,2.25268
val_accuracy,0.18133
val_loss,2.24775


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: tbddnzl0 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▂▂▂▃▄▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▇▆▅▄▄▃▂▁
val_accuracy,▁▁▁▁▂▂▃▄▆█
val_loss,█▇▇▆▅▄▄▃▂▁

0,1
accuracy,0.13189
epoch,10.0
loss,2.24352
val_accuracy,0.148
val_loss,2.2349


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: ofzsm95f with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09939
epoch,10.0
loss,2.31397
val_accuracy,0.1055
val_loss,2.31533


[34m[1mwandb[0m: Agent Starting Run: cb2h4s2e with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▇▇▇▁█
epoch,▁▃▅▆█
loss,█▅▃▁▁
val_accuracy,██▇▁█
val_loss,█▃▁▂▄

0,1
accuracy,0.10083
epoch,5.0
loss,2.30474
val_accuracy,0.10033
val_loss,2.31691


[34m[1mwandb[0m: Agent Starting Run: nqwnqi2h with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▃▁▃▂▂▄█▇
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▅▅▅▄▄▃▂▁
val_accuracy,▃▃▁▃▂▂▄█▇▆
val_loss,█▆▆▆▆▅▄▂▂▁

0,1
accuracy,0.41465
epoch,10.0
loss,1.95692
val_accuracy,0.3895
val_loss,1.91651


[34m[1mwandb[0m: Agent Starting Run: eofqzan7 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▂▄█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▄▄▄█
val_loss,█▇▅▃▁

0,1
accuracy,0.10039
epoch,5.0
loss,2.29974
val_accuracy,0.09767
val_loss,2.29928


[34m[1mwandb[0m: Agent Starting Run: wnxakxjh with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▄▄▄▁█
epoch,▁▃▅▆█
loss,█▆▃▁▁
val_accuracy,▅▅█▁▆
val_loss,█▃▁▂▄

0,1
accuracy,0.10065
epoch,5.0
loss,2.30319
val_accuracy,0.10267
val_loss,2.30964


[34m[1mwandb[0m: Agent Starting Run: 9xxdsv13 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09939
epoch,10.0
loss,2.32982
val_accuracy,0.1055
val_loss,2.32933


[34m[1mwandb[0m: Agent Starting Run: 1zx34xdf with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▆▅▅▄▄▆█▆
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▂▂▁
val_accuracy,▂▂▃▁▁▂▄▄▅█
val_loss,█▇▆▆▅▄▃▂▂▁

0,1
accuracy,0.12274
epoch,10.0
loss,2.32309
val_accuracy,0.1195
val_loss,2.32805


[34m[1mwandb[0m: Agent Starting Run: jtot7r1l with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▃▄▂▂█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▅▄▃▂▂▁
val_accuracy,▁▁▁▁▂▃▂▁▅█
val_loss,█▇▆▅▄▄▃▂▁▁

0,1
accuracy,0.23344
epoch,10.0
loss,2.24092
val_accuracy,0.349
val_loss,2.22327


[34m[1mwandb[0m: Agent Starting Run: owtci831 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▃▃▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▃▃▂▂▁
val_accuracy,▁▁▂▃▃▄▆▆▇█
val_loss,█▇▆▅▄▃▃▂▂▁

0,1
accuracy,0.12078
epoch,10.0
loss,2.23776
val_accuracy,0.12317
val_loss,2.23191


[34m[1mwandb[0m: Agent Starting Run: mzxati81 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▄▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▂▄▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.08978
epoch,5.0
loss,2.33874
val_accuracy,0.10083
val_loss,2.33123


[34m[1mwandb[0m: Agent Starting Run: 9hk9a2qd with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▄▆▆▇▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▄▅▆▇▇███
val_loss,█▇▇▆▅▄▃▂▁▁

0,1
accuracy,0.62135
epoch,10.0
loss,1.09063
val_accuracy,0.61367
val_loss,1.1004


[34m[1mwandb[0m: Agent Starting Run: kmhd0b2z with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁█▇▆▇
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▅▃▂▃▄▃▃▂▁
val_accuracy,▁▁▁▁▁▄▄▃▄█
val_loss,█▄▄▅▆▆▅▃▂▁

0,1
accuracy,0.18209
epoch,10.0
loss,2.23858
val_accuracy,0.32833
val_loss,2.22308


[34m[1mwandb[0m: Agent Starting Run: cib2vhsm with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▅▇█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▃▄▅█
val_loss,█▆▄▃▁

0,1
accuracy,0.08672
epoch,5.0
loss,2.34402
val_accuracy,0.09283
val_loss,2.34298


[34m[1mwandb[0m: Agent Starting Run: r5vgi9rz with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▄▇███
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▅▄▃▃▂▂▁▁
val_accuracy,▁▁▁▁▄▇▇███
val_loss,█▆▅▄▃▃▂▂▁▁

0,1
accuracy,0.35693
epoch,10.0
loss,2.2609
val_accuracy,0.35017
val_loss,2.25568


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: gsqcy38m with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▄▆█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▃▄▆█
val_loss,█▇▅▃▁

0,1
accuracy,0.18328
epoch,5.0
loss,2.24461
val_accuracy,0.2375
val_loss,2.21352


[34m[1mwandb[0m: Agent Starting Run: ujxfsn5m with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▂█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▁▁▃█
val_loss,█▇▅▃▁

0,1
accuracy,0.11024
epoch,5.0
loss,2.4646
val_accuracy,0.1455
val_loss,2.4175


[34m[1mwandb[0m: Agent Starting Run: a4hixmid with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.09939
epoch,10.0
loss,2.3383
val_accuracy,0.1055
val_loss,2.33072


[34m[1mwandb[0m: Agent Starting Run: rnbjxi9l with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,███▇▇▆▅▄▂▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,██▇▆▅▅▄▃▂▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.08669
epoch,10.0
loss,2.33777
val_accuracy,0.08467
val_loss,2.3404


[34m[1mwandb[0m: Agent Starting Run: mhse5rg9 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▅▄▄▃▂▂▁▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▅▄▃▃▂▂▁▁

0,1
accuracy,0.10083
epoch,10.0
loss,2.30493
val_accuracy,0.0925
val_loss,2.30399


[34m[1mwandb[0m: Agent Starting Run: i8erd384 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.1003
epoch,5.0
loss,2.32612
val_accuracy,0.09733
val_loss,2.32413


[34m[1mwandb[0m: Agent Starting Run: zkz00hct with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▃▄▅▇██▇
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▅▄▄▃▂▁
val_accuracy,▁▂▃▄▆▇█▇▆▆
val_loss,█▇▇▆▅▄▃▂▂▁

0,1
accuracy,0.16828
epoch,10.0
loss,2.31478
val_accuracy,0.16067
val_loss,2.30082


[34m[1mwandb[0m: Agent Starting Run: 57tci9hw with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▄▅▅▆▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▆▅▄▃▁
val_accuracy,▁▃▄▅▅▆▆▆▇█
val_loss,██▇▇▇▆▅▄▃▁

0,1
accuracy,0.30152
epoch,10.0
loss,2.07342
val_accuracy,0.337
val_loss,1.98909


[34m[1mwandb[0m: Agent Starting Run: wo9ltlu3 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▂▃▄▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▂▃▄▅▅▆▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.16624
epoch,10.0
loss,2.28886
val_accuracy,0.17217
val_loss,2.28699


[34m[1mwandb[0m: Agent Starting Run: v3elejg5 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▂▃▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▂▃▄▆▆▇██
val_loss,██▇▆▆▅▄▃▂▁

0,1
accuracy,0.09687
epoch,10.0
loss,2.31202
val_accuracy,0.101
val_loss,2.30713


[34m[1mwandb[0m: Agent Starting Run: l70s45zg with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▆▅▆█▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▄▁▄██
val_loss,█▆▄▃▁

0,1
accuracy,0.09972
epoch,5.0
loss,2.39907
val_accuracy,0.10567
val_loss,2.39455


[34m[1mwandb[0m: Agent Starting Run: i7ohm6g8 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▂▃▄▅▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▇▆▅▄▄▃▂▁
val_accuracy,▁▁▂▃▄▅▆▇██
val_loss,█▇▇▆▅▄▄▃▂▁

0,1
accuracy,0.33485
epoch,10.0
loss,2.24337
val_accuracy,0.36
val_loss,2.2337


[34m[1mwandb[0m: Agent Starting Run: po09vndj with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▅▆█
val_loss,█▇▅▃▁

0,1
accuracy,0.0818
epoch,5.0
loss,2.3488
val_accuracy,0.07667
val_loss,2.3516


[34m[1mwandb[0m: Agent Starting Run: qb2y1zbp with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.10017
epoch,5.0
loss,2.40635
val_accuracy,0.0985
val_loss,2.40833


[34m[1mwandb[0m: Agent Starting Run: bt30raw0 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▂▇█▆▃▂▂
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▅▄▃▂▂▁
val_accuracy,▁▁▂▇█▆▃▂▂▂
val_loss,█▇▆▅▄▃▃▂▁▁

0,1
accuracy,0.10752
epoch,10.0
loss,2.28593
val_accuracy,0.11267
val_loss,2.27523


[34m[1mwandb[0m: Agent Starting Run: sy4hjjq1 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▇▆▄▃▃▂▁▁
val_accuracy,▁▁▁▁▁▁▁▁▁█
val_loss,█▇▆▅▄▃▂▂▁▁

0,1
accuracy,0.10069
epoch,10.0
loss,2.29645
val_accuracy,0.13183
val_loss,2.28694


[34m[1mwandb[0m: Agent Starting Run: o9y6f8m2 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▂▁▁▃█
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,▁▁▂▄█
val_loss,█▇▅▃▁

0,1
accuracy,0.26506
epoch,5.0
loss,1.97686
val_accuracy,0.37917
val_loss,1.8376


[34m[1mwandb[0m: Agent Starting Run: mpu4g69e with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▇█▇▄▁▇█▅▇▄
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▅▅███▅▅▅
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10237
epoch,10.0
loss,2.30251
val_accuracy,0.0965
val_loss,2.3026


[34m[1mwandb[0m: Agent Starting Run: mpkpqwbv with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▄▅▆█
epoch,▁▃▅▆█
loss,█▅▄▂▁
val_accuracy,▁▃▄▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.41783
epoch,5.0
loss,1.94066
val_accuracy,0.4655
val_loss,1.86389


[34m[1mwandb[0m: Agent Starting Run: pxfnrpdc with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▅▄▄▃▂▂▁

0,1
accuracy,0.09939
epoch,10.0
loss,2.73541
val_accuracy,0.1055
val_loss,2.69251


[34m[1mwandb[0m: Agent Starting Run: my6cs7m8 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.1003
epoch,5.0
loss,2.63296
val_accuracy,0.09733
val_loss,2.6248


[34m[1mwandb[0m: Agent Starting Run: nwn21cuf with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▁▁▁█
val_loss,█▆▄▂▁

0,1
accuracy,0.09939
epoch,5.0
loss,2.41327
val_accuracy,0.10617
val_loss,2.35043


[34m[1mwandb[0m: Agent Starting Run: kkus4pnu with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.1003
epoch,5.0
loss,2.55494
val_accuracy,0.09733
val_loss,2.56333


[34m[1mwandb[0m: Agent Starting Run: l9w57kk9 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▄▄▄▄▄▅▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▅▄▄▄▄▃▂▁
val_accuracy,▁▃▂▃▂▂▃▅▇█
val_loss,█▆▆▅▅▅▄▃▂▁

0,1
accuracy,0.45374
epoch,10.0
loss,1.90083
val_accuracy,0.4995
val_loss,1.8533


[34m[1mwandb[0m: Agent Starting Run: ojjy3fp8 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▁▁▁█
val_loss,█▆▄▂▁

0,1
accuracy,0.10065
epoch,5.0
loss,2.30402
val_accuracy,0.1505
val_loss,2.30116


[34m[1mwandb[0m: Agent Starting Run: ragiq18g with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁█▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▃▂▁▂▃▃▂▁
val_accuracy,▂▂█▁▁▁▁▁▁▁
val_loss,█▅▃▃▄▅▆▅▃▁

0,1
accuracy,0.09996
epoch,10.0
loss,2.3021
val_accuracy,0.10033
val_loss,2.30125


[34m[1mwandb[0m: Agent Starting Run: 4m5comae with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▃▄▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▃▅▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.14004
epoch,5.0
loss,2.31004
val_accuracy,0.1445
val_loss,2.30958


[34m[1mwandb[0m: Agent Starting Run: 4i407zig with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▄▅▅▅▅▆▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▅▄▃▂▂▁
val_accuracy,▁▂▂▂▃▃▄▅▆█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.25115
epoch,10.0
loss,1.95138
val_accuracy,0.28017
val_loss,1.90074


[34m[1mwandb[0m: Agent Starting Run: blxxg9in with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▂▂▂▁▁▁▁▂▅█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▂▂▂▁▁▂▂▄▇█
val_loss,██▇▆▆▅▄▃▂▁

0,1
accuracy,0.11076
epoch,10.0
loss,2.44679
val_accuracy,0.1105
val_loss,2.43228


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: pkiy9tvg with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▂▄▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▅▄▄▃▂▁
val_accuracy,▁▁▁▂▃▅▇▇▇█
val_loss,█▇▇▆▅▄▃▃▂▁

0,1
accuracy,0.33354
epoch,10.0
loss,2.15396
val_accuracy,0.35933
val_loss,2.13218


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: h0o7utao with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▄▅▆▆▆▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▄▄▃▂▂▂▁▁
val_accuracy,▁▁▂▄▄▄▄▅▇█
val_loss,█▆▅▄▄▃▂▂▁▁

0,1
accuracy,0.35794
epoch,10.0
loss,2.14825
val_accuracy,0.4025
val_loss,2.12771


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: svjnki1v with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.0997
epoch,10.0
loss,2.33429
val_accuracy,0.10267
val_loss,2.32753


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: iiwfy7g4 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▇▆▅▄▃▂▂▁

0,1
accuracy,0.10065
epoch,10.0
loss,2.3081
val_accuracy,0.09417
val_loss,2.30788


[34m[1mwandb[0m: Agent Starting Run: vzcspruj with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▂▃▄▅▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▃▃▅▅▆▆▆█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.093
epoch,10.0
loss,2.30202
val_accuracy,0.0925
val_loss,2.30209


[34m[1mwandb[0m: Agent Starting Run: spzbwtmb with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▆█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▄▆█
val_loss,█▇▅▃▁

0,1
accuracy,0.12317
epoch,5.0
loss,2.29359
val_accuracy,0.13083
val_loss,2.28658


[34m[1mwandb[0m: Agent Starting Run: 9zk68cbl with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁█▃
epoch,▁▃▅▆█
loss,█▆▄▂▁
val_accuracy,▁▁█▂▁
val_loss,█▄▂▁▁

0,1
accuracy,0.11344
epoch,5.0
loss,2.29699
val_accuracy,0.0985
val_loss,2.29797


[34m[1mwandb[0m: Agent Starting Run: eluz96bo with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▄██
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_accuracy,▁▄███
val_loss,█▅▃▂▁

0,1
accuracy,0.18407
epoch,5.0
loss,2.30688
val_accuracy,0.17617
val_loss,2.30429


[34m[1mwandb[0m: Agent Starting Run: isjca8o4 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▃▅▆█
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,▄▅▂▁█
val_loss,█▆▅▃▁

0,1
accuracy,0.11657
epoch,5.0
loss,2.30245
val_accuracy,0.11283
val_loss,2.30237


[34m[1mwandb[0m: Agent Starting Run: 8hvs7ec2 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▃▅▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▆▅▁▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.07707
epoch,5.0
loss,2.30135
val_accuracy,0.07833
val_loss,2.30121


[34m[1mwandb[0m: Agent Starting Run: 5bmcnrys with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▆▆▅▄▃▂▁

0,1
accuracy,0.0997
epoch,10.0
loss,2.34548
val_accuracy,0.10267
val_loss,2.34659


[34m[1mwandb[0m: Agent Starting Run: okqr3tsi with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▄▅▆▇▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▄▃▂▁
val_accuracy,▁▂▄▅▆▆▇▇██
val_loss,█▇▇▆▅▅▄▃▂▁

0,1
accuracy,0.44148
epoch,10.0
loss,1.87211
val_accuracy,0.47233
val_loss,1.79775


[34m[1mwandb[0m: Agent Starting Run: 9iqlebqc with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▄▄▅▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▅▄▃▂▂▁
val_accuracy,▁▂▃▄▅▆▆▇▇█
val_loss,█▇▆▅▅▄▃▂▂▁

0,1
accuracy,0.11602
epoch,10.0
loss,2.30547
val_accuracy,0.12367
val_loss,2.29319


[34m[1mwandb[0m: Agent Starting Run: o1n5fhpv with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09991
epoch,10.0
loss,2.46284
val_accuracy,0.10083
val_loss,2.45368


[34m[1mwandb[0m: Agent Starting Run: k20noxcr with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▃▂▁▃█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▁▂▅█
val_loss,█▆▅▃▁

0,1
accuracy,0.08991
epoch,5.0
loss,2.29971
val_accuracy,0.10767
val_loss,2.28154


[34m[1mwandb[0m: Agent Starting Run: psk0ski2 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▂▂▃▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▂▃▃▄▅▆▇█
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.16261
epoch,10.0
loss,2.28403
val_accuracy,0.17367
val_loss,2.27937


[34m[1mwandb[0m: Agent Starting Run: o3y62xmm with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▅▄▃▂▂▂▁▁▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▆▄▃▃▂▂▁▁▁

0,1
accuracy,0.10065
epoch,10.0
loss,2.29617
val_accuracy,0.09417
val_loss,2.29388


[34m[1mwandb[0m: Agent Starting Run: zhg97jy6 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.10017
epoch,5.0
loss,2.41703
val_accuracy,0.0985
val_loss,2.41395


[34m[1mwandb[0m: Agent Starting Run: df96cp5y with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10083
epoch,10.0
loss,2.38233
val_accuracy,0.0925
val_loss,2.38166


[34m[1mwandb[0m: Agent Starting Run: qlmbb4bz with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.09939
epoch,5.0
loss,2.32416
val_accuracy,0.1055
val_loss,2.32749


[34m[1mwandb[0m: Agent Starting Run: il5se3qp with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▄▆█
val_loss,█▇▅▃▁

0,1
accuracy,0.10044
epoch,5.0
loss,2.29715
val_accuracy,0.10433
val_loss,2.2937


[34m[1mwandb[0m: Agent Starting Run: 95nlzy91 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▅▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▄▅▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.14061
epoch,5.0
loss,2.40574
val_accuracy,0.145
val_loss,2.40065


[34m[1mwandb[0m: Agent Starting Run: z3lhd0xg with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.09944
epoch,10.0
loss,2.54604
val_accuracy,0.105
val_loss,2.53105


[34m[1mwandb[0m: Agent Starting Run: 5of8oc74 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▄▆█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▅▆█
val_loss,█▇▅▃▁

0,1
accuracy,0.11474
epoch,5.0
loss,2.30521
val_accuracy,0.102
val_loss,2.30582


[34m[1mwandb[0m: Agent Starting Run: pbojz5zt with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▄▅▆▇▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▃▂▂▂▃▅▅▅█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10804
epoch,10.0
loss,2.30275
val_accuracy,0.10967
val_loss,2.30275


[34m[1mwandb[0m: Agent Starting Run: mvtad6gs with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁█▂▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▅▃▂▁▁▁▁▁
val_accuracy,▁▁▁▁█▁▁▁▁▁
val_loss,█▆▄▂▁▁▁▁▁▁

0,1
accuracy,0.0997
epoch,10.0
loss,2.30093
val_accuracy,0.10267
val_loss,2.30028


[34m[1mwandb[0m: Agent Starting Run: gravhors with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▄▁█▂
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_accuracy,▂▁▄▂█
val_loss,█▄▃▂▁

0,1
accuracy,0.10839
epoch,5.0
loss,2.25196
val_accuracy,0.22683
val_loss,2.22828


[34m[1mwandb[0m: Agent Starting Run: y37m9wka with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_accuracy,▁▁▁▁▁
val_loss,█▅▃▂▁

0,1
accuracy,0.10065
epoch,5.0
loss,2.30338
val_accuracy,0.09417
val_loss,2.30318


[34m[1mwandb[0m: Agent Starting Run: szj5ht61 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▄▅▆▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▃▃▂▁▁
val_accuracy,▁▂▃▄▄▆▆▆▇█
val_loss,█▇▆▅▄▃▃▂▂▁

0,1
accuracy,0.11635
epoch,10.0
loss,2.24433
val_accuracy,0.11267
val_loss,2.23536


[34m[1mwandb[0m: Agent Starting Run: v7dsaaqi with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▅▆█
epoch,▁▃▅▆█
loss,█▆▄▂▁
val_accuracy,▁▄▅▇█
val_loss,█▆▄▂▁

0,1
accuracy,0.13037
epoch,5.0
loss,2.30858
val_accuracy,0.14333
val_loss,2.29279


[34m[1mwandb[0m: Agent Starting Run: 0bw5mkwm with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▄▄▅▆▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▃▄▄▅▆▆▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.1093
epoch,10.0
loss,2.30249
val_accuracy,0.11583
val_loss,2.30212


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: fgnyfvb0 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▃▃▃▁▁▁▄█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▅▄▃▄▄▃▂▁
val_accuracy,▁▃▄▃▁▁▁▄██
val_loss,█▆▅▅▆▆▆▄▃▁

0,1
accuracy,0.30969
epoch,10.0
loss,2.276
val_accuracy,0.2965
val_loss,2.26679


[34m[1mwandb[0m: Agent Starting Run: kqhs0dwc with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▅▇█
epoch,▁▃▅▆█
loss,█▅▄▂▁
val_accuracy,▁▃▅▇█
val_loss,█▆▄▃▁

0,1
accuracy,0.30133
epoch,5.0
loss,1.98442
val_accuracy,0.35517
val_loss,1.90396


[34m[1mwandb[0m: Agent Starting Run: 93jc4io3 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁█
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_accuracy,▁▁▁▁█
val_loss,█▅▃▂▁

0,1
accuracy,0.0997
epoch,5.0
loss,2.29424
val_accuracy,0.16883
val_loss,2.28351


[34m[1mwandb[0m: Agent Starting Run: 766ae2ue with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▂▃▃▄▅▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▂▃▃▃▃▅▆█
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.02774
epoch,10.0
loss,2.30447
val_accuracy,0.03033
val_loss,2.30469


[34m[1mwandb[0m: Agent Starting Run: e14ab9yt with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.09939
epoch,10.0
loss,2.33421
val_accuracy,0.1055
val_loss,2.32785


[34m[1mwandb[0m: Agent Starting Run: 7ynwhaka with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,█▇▇▆▅▅▄▃▂▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▅▄▃▂▂▁
val_accuracy,▅▅▅▄█▇▂▁▁▁
val_loss,█▇▆▅▅▄▃▂▂▁

0,1
accuracy,0.09465
epoch,10.0
loss,2.31257
val_accuracy,0.094
val_loss,2.30852


[34m[1mwandb[0m: Agent Starting Run: ze9vwjpr with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▂█▁▁▁
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_accuracy,█▁▁▁▁
val_loss,█▅▃▂▁

0,1
accuracy,0.0997
epoch,5.0
loss,2.44705
val_accuracy,0.10267
val_loss,2.40281


[34m[1mwandb[0m: Agent Starting Run: 8f8rkihw with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.09944
epoch,5.0
loss,2.32688
val_accuracy,0.105
val_loss,2.32743


[34m[1mwandb[0m: Agent Starting Run: qdso4gsj with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▃▄▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▃▄▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.17954
epoch,5.0
loss,2.29415
val_accuracy,0.19517
val_loss,2.2923


[34m[1mwandb[0m: Agent Starting Run: yo88pk56 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.09944
epoch,5.0
loss,2.31727
val_accuracy,0.105
val_loss,2.31249


[34m[1mwandb[0m: Agent Starting Run: vl5gcphh with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▄▆█
val_loss,█▇▅▃▁

0,1
accuracy,0.16798
epoch,5.0
loss,2.31904
val_accuracy,0.17383
val_loss,2.30892


[34m[1mwandb[0m: Agent Starting Run: ldmbx8hh with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▃█
epoch,▁▃▅▆█
loss,█▆▃▁▁
val_accuracy,▁▁▃█▄
val_loss,█▅▂▁▁

0,1
accuracy,0.23739
epoch,5.0
loss,2.2964
val_accuracy,0.15417
val_loss,2.29347


[34m[1mwandb[0m: Agent Starting Run: q74sxtkm with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▂▃▄▄▅▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▆▅▄▃▂▁
val_accuracy,▁▁▂▂▃▄▄▅▆█
val_loss,█▇▇▆▅▄▄▃▂▁

0,1
accuracy,0.21104
epoch,10.0
loss,2.16309
val_accuracy,0.24367
val_loss,2.13951


[34m[1mwandb[0m: Agent Starting Run: u93chonu with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▄▃▂▂▁▁▁▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▆▄▃▂▂▂▁▁▁

0,1
accuracy,0.10083
epoch,10.0
loss,2.30229
val_accuracy,0.0925
val_loss,2.30275


[34m[1mwandb[0m: Agent Starting Run: 032jdxr8 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▄▄█
epoch,▁▃▅▆█
loss,█▅▄▃▁
val_accuracy,▁▂▃▆█
val_loss,█▇▆▃▁

0,1
accuracy,0.17259
epoch,5.0
loss,2.14404
val_accuracy,0.20033
val_loss,2.06407


[34m[1mwandb[0m: Agent Starting Run: 4b32wgrc with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▆█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▂▄▆█
val_loss,█▇▅▃▁

0,1
accuracy,0.16157
epoch,5.0
loss,2.26376
val_accuracy,0.1845
val_loss,2.23678


[34m[1mwandb[0m: Agent Starting Run: m0j6qxd7 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▃▄▅▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▂▃▅▆▆▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.13237
epoch,10.0
loss,2.3705
val_accuracy,0.12467
val_loss,2.37743


[34m[1mwandb[0m: Agent Starting Run: eiatkr3t with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10083
epoch,10.0
loss,2.48154
val_accuracy,0.0925
val_loss,2.48301


[34m[1mwandb[0m: Agent Starting Run: p8e6z8e6 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▂▅▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▂▅▆▇█
val_loss,█▇▇▆▅▄▃▃▂▁

0,1
accuracy,0.32856
epoch,10.0
loss,1.91411
val_accuracy,0.362
val_loss,1.85406


[34m[1mwandb[0m: Agent Starting Run: ettvyh52 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▂▂▁

0,1
accuracy,0.10017
epoch,10.0
loss,2.47754
val_accuracy,0.0985
val_loss,2.47554


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: y60pr2h7 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.10083
epoch,5.0
loss,2.30612
val_accuracy,0.0925
val_loss,2.30702


[34m[1mwandb[0m: Agent Starting Run: cb1ihpvl with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.1003
epoch,5.0
loss,2.32948
val_accuracy,0.09733
val_loss,2.32403


[34m[1mwandb[0m: Agent Starting Run: qxp5xa09 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,█▇▄▃▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,██▆▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.10572
epoch,5.0
loss,2.30251
val_accuracy,0.10783
val_loss,2.30234


[34m[1mwandb[0m: Agent Starting Run: t067zhe2 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▅▄▃▂▂▂▁▁▁
val_accuracy,▁▁▁▁▁▁▁▁▃█
val_loss,█▆▄▃▃▂▂▁▁▁

0,1
accuracy,0.1217
epoch,10.0
loss,2.29409
val_accuracy,0.16683
val_loss,2.29115


[34m[1mwandb[0m: Agent Starting Run: ox0gcrjc with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09939
epoch,10.0
loss,2.35138
val_accuracy,0.1055
val_loss,2.33724


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: q8szdla8 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▂▃▃▄▅▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▅▄▃▂▂▁
val_accuracy,▁▁▂▂▃▃▄▅▇█
val_loss,█▇▇▆▅▄▃▂▂▁

0,1
accuracy,0.22006
epoch,10.0
loss,2.21381
val_accuracy,0.24717
val_loss,2.19561


[34m[1mwandb[0m: Agent Starting Run: 83r4yprp with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁█▂▁▁▁▃▅
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▄▃▃▄▄▃▂▁
val_accuracy,▁▁▃▁▁▁▁▂▂█
val_loss,█▆▅▅▅▆▅▄▂▁

0,1
accuracy,0.13663
epoch,10.0
loss,2.27905
val_accuracy,0.32283
val_loss,2.27006


[34m[1mwandb[0m: Agent Starting Run: mz9ilhb3 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▂▃▄▅▆▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▃▃▃▆▆▆▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.08074
epoch,10.0
loss,2.3033
val_accuracy,0.0835
val_loss,2.30329


[34m[1mwandb[0m: Agent Starting Run: y344xhgc with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▂▃▄▅▆▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▂▄▄▄▅▆▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10778
epoch,10.0
loss,2.30368
val_accuracy,0.10617
val_loss,2.30362


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: gy8rss4m with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▅▅▄▃▂▂▁

0,1
accuracy,0.0997
epoch,10.0
loss,2.31153
val_accuracy,0.10267
val_loss,2.31244


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: bjlt7b6v with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▅█▆▄▁
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,██▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.07585
epoch,5.0
loss,2.3034
val_accuracy,0.0735
val_loss,2.30357


[34m[1mwandb[0m: Agent Starting Run: 3s355wpv with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.09965
epoch,5.0
loss,2.30639
val_accuracy,0.10317
val_loss,2.30603


[34m[1mwandb[0m: Agent Starting Run: ikqyhbr9 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▃▄▅▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▃▄▄▅▆▆▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.14965
epoch,10.0
loss,2.29505
val_accuracy,0.16067
val_loss,2.29362


[34m[1mwandb[0m: Agent Starting Run: 0xj6ru7d with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.09939
epoch,10.0
loss,2.58879
val_accuracy,0.1055
val_loss,2.5843


[34m[1mwandb[0m: Agent Starting Run: bmpza593 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▅▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▅█
val_loss,█▆▄▃▁

0,1
accuracy,0.10674
epoch,5.0
loss,2.32592
val_accuracy,0.09883
val_loss,2.33012


[34m[1mwandb[0m: Agent Starting Run: 393zl7av with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▄▄▅▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▂▂▁
val_accuracy,▁▂▃▄▅▆▆▇██
val_loss,█▇▆▆▅▄▃▂▂▁

0,1
accuracy,0.14319
epoch,10.0
loss,2.2523
val_accuracy,0.14983
val_loss,2.24388


[34m[1mwandb[0m: Agent Starting Run: fhhbijxh with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▅▁▅▅█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.0955
epoch,5.0
loss,2.30938
val_accuracy,0.087
val_loss,2.31075


[34m[1mwandb[0m: Agent Starting Run: 0hz1s32q with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▅▆▆▇▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▄▃▂▂▁
val_accuracy,▁▂▄▅▆▆▇▇██
val_loss,█▇▆▅▅▄▃▂▂▁

0,1
accuracy,0.54446
epoch,10.0
loss,1.62546
val_accuracy,0.57067
val_loss,1.55366


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: vrd043te with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.0997
epoch,5.0
loss,2.30955
val_accuracy,0.10267
val_loss,2.30637


[34m[1mwandb[0m: Agent Starting Run: l769os59 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▂▃▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▂▂▃▄▅▆▇█
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.12081
epoch,10.0
loss,2.47174
val_accuracy,0.13183
val_loss,2.46091


[34m[1mwandb[0m: Agent Starting Run: 6s1xb0dm with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▂▃▅▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▆▅▄▃▁
val_accuracy,▁▁▂▃▄▆▆▇██
val_loss,██▇▇▆▆▅▄▃▁

0,1
accuracy,0.39328
epoch,10.0
loss,2.26402
val_accuracy,0.4115
val_loss,2.24975


[34m[1mwandb[0m: Agent Starting Run: uc7jvzdv with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▅▆█
epoch,▁▃▅▆█
loss,█▅▄▂▁
val_accuracy,▁▃▅▆█
val_loss,█▆▅▃▁

0,1
accuracy,0.27007
epoch,5.0
loss,2.14462
val_accuracy,0.31383
val_loss,2.09642


[34m[1mwandb[0m: Agent Starting Run: 6cexno88 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▅▄▃▃▂▂▁▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▅▄▄▃▂▂▁▁

0,1
accuracy,0.10083
epoch,10.0
loss,2.30357
val_accuracy,0.0925
val_loss,2.30429


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: kbxv0zam with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.10083
epoch,5.0
loss,2.31099
val_accuracy,0.0925
val_loss,2.31154


[34m[1mwandb[0m: Agent Starting Run: ke6n1kel with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▆█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▄▆█
val_loss,█▇▅▃▁

0,1
accuracy,0.24793
epoch,5.0
loss,2.28874
val_accuracy,0.29033
val_loss,2.2819


[34m[1mwandb[0m: Agent Starting Run: wh8no40x with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.1003
epoch,5.0
loss,2.4104
val_accuracy,0.09733
val_loss,2.40653


[34m[1mwandb[0m: Agent Starting Run: urpkah8m with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▁▁▁█
val_loss,█▆▄▂▁

0,1
accuracy,0.09965
epoch,5.0
loss,2.30201
val_accuracy,0.24517
val_loss,2.29976


[34m[1mwandb[0m: Agent Starting Run: abvyw790 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,███▆▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▆█▁▆▆
val_loss,█▇▅▃▁

0,1
accuracy,0.07196
epoch,5.0
loss,2.31997
val_accuracy,0.06883
val_loss,2.31903


[34m[1mwandb[0m: Agent Starting Run: gybtdc94 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.10065
epoch,10.0
loss,2.31285
val_accuracy,0.09417
val_loss,2.31747


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 6h8l8okk with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▃▃▃▄▄▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▅▄▄▃▂▁
val_accuracy,▁▂▂▃▃▃▄▅▆█
val_loss,█▇▇▆▅▄▃▃▂▁

0,1
accuracy,0.15085
epoch,10.0
loss,2.12772
val_accuracy,0.172
val_loss,2.09868


[34m[1mwandb[0m: Agent Starting Run: 85r11m8m with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁███
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.11106
epoch,10.0
loss,2.30257
val_accuracy,0.10417
val_loss,2.30267


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 7hsxfroy with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▂▂▁

0,1
accuracy,0.1003
epoch,10.0
loss,2.31411
val_accuracy,0.09733
val_loss,2.3144


[34m[1mwandb[0m: Agent Starting Run: yehsty4o with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▃▄▅▄▄▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▂▂▁
val_accuracy,▅▅▅▁▅█▅▁█▅
val_loss,█▇▆▆▅▄▃▂▂▁

0,1
accuracy,0.10041
epoch,10.0
loss,2.35791
val_accuracy,0.103
val_loss,2.3561


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 0dwnt5eq with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▄▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▃▅▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.15981
epoch,5.0
loss,2.26384
val_accuracy,0.16767
val_loss,2.2567


[34m[1mwandb[0m: Agent Starting Run: z40kc8c8 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▅█▅▅
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.03081
epoch,5.0
loss,2.30886
val_accuracy,0.0325
val_loss,2.30856


[34m[1mwandb[0m: Agent Starting Run: 571r9zar with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▂▂▃▃▄▄▅█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▂▂▃▃▄▄▇█
val_loss,██▇▆▅▅▄▃▂▁

0,1
accuracy,0.19115
epoch,10.0
loss,2.30015
val_accuracy,0.22217
val_loss,2.29956


[34m[1mwandb[0m: Agent Starting Run: g8xmgv5q with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▃▆▇█▇▇▆▆
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▄▂▁
val_accuracy,▁▂▆▇█▇▇▆▆▅
val_loss,██▇▇▆▅▅▄▂▁

0,1
accuracy,0.2225
epoch,10.0
loss,2.26336
val_accuracy,0.21583
val_loss,2.25086


[34m[1mwandb[0m: Agent Starting Run: te0niwmg with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▃█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▃██
val_loss,█▇▅▃▁

0,1
accuracy,0.08872
epoch,5.0
loss,2.30348
val_accuracy,0.0895
val_loss,2.30353


[34m[1mwandb[0m: Agent Starting Run: artvs15g with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁████
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.09959
epoch,10.0
loss,2.30425
val_accuracy,0.10533
val_loss,2.30318


[34m[1mwandb[0m: Agent Starting Run: qmgsk3ra with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▂▆▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▃▂▂▂▁▁▁▁▁
val_accuracy,▁▁▁▁▁▂▅▅▇█
val_loss,█▅▄▄▃▃▂▂▁▁

0,1
accuracy,0.23641
epoch,10.0
loss,2.25009
val_accuracy,0.28667
val_loss,2.24027


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: wjay78qy with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▄▃█
epoch,▁▃▅▆█
loss,█▆▃▂▁
val_accuracy,▁▄▄█▇
val_loss,█▅▂▁▁

0,1
accuracy,0.29657
epoch,5.0
loss,2.23314
val_accuracy,0.26383
val_loss,2.22385


[34m[1mwandb[0m: Agent Starting Run: 1axkbe1m with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▆▆▅▄▃▂▁

0,1
accuracy,0.10017
epoch,10.0
loss,2.3058
val_accuracy,0.0985
val_loss,2.30731


[34m[1mwandb[0m: Agent Starting Run: dyezucsf with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▄▅██
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,█▆▆▁▄
val_loss,█▆▄▃▁

0,1
accuracy,0.11296
epoch,5.0
loss,2.31591
val_accuracy,0.1095
val_loss,2.31645


[34m[1mwandb[0m: Agent Starting Run: mnktzdtn with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▆█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▅▇█
val_loss,█▇▅▃▁

0,1
accuracy,0.1523
epoch,5.0
loss,2.30246
val_accuracy,0.168
val_loss,2.30191


[34m[1mwandb[0m: Agent Starting Run: 2ulivo87 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.10083
epoch,5.0
loss,2.32944
val_accuracy,0.0925
val_loss,2.327


[34m[1mwandb[0m: Agent Starting Run: nc2b0f79 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.10083
epoch,5.0
loss,2.31981
val_accuracy,0.0925
val_loss,2.32109


[34m[1mwandb[0m: Agent Starting Run: 7qbqwyq9 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.1003
epoch,10.0
loss,2.4201
val_accuracy,0.09733
val_loss,2.41865


[34m[1mwandb[0m: Agent Starting Run: 8hkletrd with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.0997
epoch,10.0
loss,2.61982
val_accuracy,0.10267
val_loss,2.61281


[34m[1mwandb[0m: Agent Starting Run: 0xj9squ3 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▃█
val_loss,█▇▇▆▅▄▃▂▂▁

0,1
accuracy,0.11611
epoch,10.0
loss,2.33381
val_accuracy,0.15533
val_loss,2.31937


[34m[1mwandb[0m: Agent Starting Run: ej2wryaz with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▂▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▂▁

0,1
accuracy,0.09965
epoch,5.0
loss,2.30575
val_accuracy,0.10317
val_loss,2.30428


[34m[1mwandb[0m: Agent Starting Run: zl7aq4r0 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.09939
epoch,5.0
loss,2.34411
val_accuracy,0.1055
val_loss,2.34064


[34m[1mwandb[0m: Agent Starting Run: xua0ls2r with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10065
epoch,10.0
loss,2.32878
val_accuracy,0.09417
val_loss,2.32739


[34m[1mwandb[0m: Agent Starting Run: p6okw31n with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▄▄▅▆▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▇▆▅▄▄▃▂▁
val_accuracy,▁▂▃▄▄▅▆▇██
val_loss,█▇▇▆▅▅▄▃▂▁

0,1
accuracy,0.29893
epoch,10.0
loss,1.95658
val_accuracy,0.315
val_loss,1.90762


[34m[1mwandb[0m: Agent Starting Run: s19pte89 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.10065
epoch,5.0
loss,2.31576
val_accuracy,0.09417
val_loss,2.3166


[34m[1mwandb[0m: Agent Starting Run: v0nwfeil with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▅▄▄▃▂▂▁

0,1
accuracy,0.1003
epoch,10.0
loss,2.32794
val_accuracy,0.09733
val_loss,2.32452


[34m[1mwandb[0m: Agent Starting Run: vdf6mtod with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▃▅▆▆▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▄▄▄██
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10285
epoch,10.0
loss,2.29614
val_accuracy,0.10783
val_loss,2.29514


[34m[1mwandb[0m: Agent Starting Run: jv4qiant with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▅▄▃▃▂▂▁▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▆▅▄▃▂▂▂▁▁

0,1
accuracy,0.0997
epoch,10.0
loss,2.30448
val_accuracy,0.10267
val_loss,2.30328


[34m[1mwandb[0m: Agent Starting Run: lndrwdny with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁████
epoch,▁▃▅▆█
loss,█▆▄▂▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▂▁

0,1
accuracy,0.10083
epoch,5.0
loss,2.30589
val_accuracy,0.0925
val_loss,2.30471


[34m[1mwandb[0m: Agent Starting Run: jaoiwism with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▄▇█
val_loss,█▇▅▃▁

0,1
accuracy,0.07354
epoch,5.0
loss,2.30779
val_accuracy,0.06533
val_loss,2.30768


[34m[1mwandb[0m: Agent Starting Run: ub5in4ce with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▅▅▆█
epoch,▁▃▅▆█
loss,█▅▄▂▁
val_accuracy,▁▂▃▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.13878
epoch,5.0
loss,2.22548
val_accuracy,0.15583
val_loss,2.19751


[34m[1mwandb[0m: Agent Starting Run: 4sv3rki1 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.09939
epoch,5.0
loss,2.31686
val_accuracy,0.1055
val_loss,2.31274


[34m[1mwandb[0m: Agent Starting Run: mm161d0y with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.09981
epoch,5.0
loss,2.30275
val_accuracy,0.10067
val_loss,2.30276


[34m[1mwandb[0m: Agent Starting Run: cw89z4ep with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▄▆█
epoch,▁▃▅▆█
loss,█▆▄▂▁
val_accuracy,▁▃▄▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.15396
epoch,5.0
loss,2.30078
val_accuracy,0.16567
val_loss,2.28359


[34m[1mwandb[0m: Agent Starting Run: a9ou8ide with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▄▅▅▆▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▂▃▅▆▇▇██
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.09789
epoch,10.0
loss,2.35762
val_accuracy,0.101
val_loss,2.35938


[34m[1mwandb[0m: Agent Starting Run: 7dy8ijac with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.09996
epoch,5.0
loss,2.31939
val_accuracy,0.10033
val_loss,2.32157


[34m[1mwandb[0m: Agent Starting Run: l44cfwfe with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▄▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▃▁███
val_loss,█▇▅▃▁

0,1
accuracy,0.10141
epoch,5.0
loss,2.33996
val_accuracy,0.09883
val_loss,2.33487


[34m[1mwandb[0m: Agent Starting Run: 6duq0mr1 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▂▂▃▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▂▃▃▄▅▆▇█
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.1697
epoch,10.0
loss,2.29923
val_accuracy,0.183
val_loss,2.29875


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 6ssck2bg with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.1003
epoch,5.0
loss,2.44114
val_accuracy,0.09733
val_loss,2.43821


[34m[1mwandb[0m: Agent Starting Run: imzup0en with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09996
epoch,10.0
loss,2.30669
val_accuracy,0.10033
val_loss,2.30666


[34m[1mwandb[0m: Agent Starting Run: whzr994r with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▂▃▃▄▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▃▃▁▁▁▆▃▃▃█
val_loss,██▇▆▆▅▄▃▂▁

0,1
accuracy,0.09926
epoch,10.0
loss,2.30234
val_accuracy,0.09767
val_loss,2.30228


[34m[1mwandb[0m: Agent Starting Run: bpqgos1r with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.09996
epoch,10.0
loss,2.31842
val_accuracy,0.10033
val_loss,2.3175


[34m[1mwandb[0m: Agent Starting Run: be8y2vlp with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,███▁▆▃▄▄▄▄
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▆▃▂▁▁▂▂▂▁
val_accuracy,▁▁▂▂▄▃▃▃▃█
val_loss,█▅▂▁▂▂▂▂▂▁

0,1
accuracy,0.0997
epoch,10.0
loss,2.30833
val_accuracy,0.12083
val_loss,2.28835


[34m[1mwandb[0m: Agent Starting Run: 0yfqqh1e with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▂▃▄▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▄▃▂▂▁
val_accuracy,▁▂▃▃▄▅▅▆▇█
val_loss,█▇▆▅▄▄▃▂▂▁

0,1
accuracy,0.18413
epoch,10.0
loss,2.23571
val_accuracy,0.18417
val_loss,2.22632


[34m[1mwandb[0m: Agent Starting Run: qvbu9cty with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09991
epoch,10.0
loss,2.33388
val_accuracy,0.10083
val_loss,2.32921


[34m[1mwandb[0m: Agent Starting Run: 9u0vrvrt with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,▁▂▃▆█
val_loss,█▇▆▄▁

0,1
accuracy,0.35746
epoch,5.0
loss,2.13703
val_accuracy,0.42533
val_loss,2.04592


[34m[1mwandb[0m: Agent Starting Run: vqlhylil with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▄▅▆▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▃▄▅▅▇▇▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.14356
epoch,10.0
loss,2.29938
val_accuracy,0.15167
val_loss,2.29931


[34m[1mwandb[0m: Agent Starting Run: 1405ymwd with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▂▃▅█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▂▂▂▃▅█
val_loss,██▇▆▅▅▄▃▂▁

0,1
accuracy,0.10496
epoch,10.0
loss,2.3088
val_accuracy,0.11683
val_loss,2.27856


[34m[1mwandb[0m: Agent Starting Run: 7hbtadj5 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.10017
epoch,5.0
loss,2.57139
val_accuracy,0.0985
val_loss,2.58034


[34m[1mwandb[0m: Agent Starting Run: bgxv5esg with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▄▆█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▃▅▇█
val_loss,█▇▅▃▁

0,1
accuracy,0.22896
epoch,5.0
loss,2.23868
val_accuracy,0.2475
val_loss,2.2202


[34m[1mwandb[0m: Agent Starting Run: e9lb1pxo with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▂▂▃▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▂▃▄▄▅▆▇█
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.15239
epoch,10.0
loss,2.29228
val_accuracy,0.15
val_loss,2.29254


[34m[1mwandb[0m: Agent Starting Run: cw06allp with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.10083
epoch,5.0
loss,2.31596
val_accuracy,0.0925
val_loss,2.31509


[34m[1mwandb[0m: Agent Starting Run: 2lhrd9el with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▃▄▅▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▄▃▂▂▁
val_accuracy,▁▂▃▃▄▅▆▇▇█
val_loss,█▇▆▅▄▄▃▂▂▁

0,1
accuracy,0.16672
epoch,10.0
loss,2.29295
val_accuracy,0.1765
val_loss,2.28335


[34m[1mwandb[0m: Agent Starting Run: 3uz47zvo with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09944
epoch,10.0
loss,2.3204
val_accuracy,0.105
val_loss,2.31851


[34m[1mwandb[0m: Agent Starting Run: 1ev9eelt with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▅▇█
epoch,▁▃▅▆█
loss,█▆▄▂▁
val_accuracy,▁▃▅▆█
val_loss,█▆▄▂▁

0,1
accuracy,0.12161
epoch,5.0
loss,2.29118
val_accuracy,0.12283
val_loss,2.28712


[34m[1mwandb[0m: Agent Starting Run: 16vyg81d with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▂▂▆▃▅▆▅█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▅▄▃▃▂▂▂▁
val_accuracy,▃▁▁▅▃▄▅▄▇█
val_loss,█▆▅▄▄▃▃▂▂▁

0,1
accuracy,0.29169
epoch,10.0
loss,2.12143
val_accuracy,0.29483
val_loss,2.09849


[34m[1mwandb[0m: Agent Starting Run: 65hpi12v with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁█▅
epoch,▁▃▅▆█
loss,█▆▃▂▁
val_accuracy,▁▁█▆▇
val_loss,█▅▃▂▁

0,1
accuracy,0.19935
epoch,5.0
loss,2.21816
val_accuracy,0.2285
val_loss,2.19427


[34m[1mwandb[0m: Agent Starting Run: zeverckk with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.1003
epoch,5.0
loss,2.31399
val_accuracy,0.09733
val_loss,2.31422


[34m[1mwandb[0m: Agent Starting Run: j9hd08lp with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▃▆▇█
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,▁▃▃▃█
val_loss,█▆▅▃▁

0,1
accuracy,0.13385
epoch,5.0
loss,2.30208
val_accuracy,0.13283
val_loss,2.302


[34m[1mwandb[0m: Agent Starting Run: gvybjyuj with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▂▂▃▄▅▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▂▃▃▄▅▆█
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.11954
epoch,10.0
loss,2.29928
val_accuracy,0.12867
val_loss,2.29829


[34m[1mwandb[0m: Agent Starting Run: ilbugmdo with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▅▅▄▃▂▂▁

0,1
accuracy,0.1003
epoch,10.0
loss,2.31195
val_accuracy,0.09733
val_loss,2.31092


[34m[1mwandb[0m: Agent Starting Run: 71po79cn with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▅▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▃▄▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.13319
epoch,5.0
loss,2.32052
val_accuracy,0.14083
val_loss,2.31787


[34m[1mwandb[0m: Agent Starting Run: 3dethekt with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▅▇█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▆▄█▁▆
val_loss,█▆▄▃▁

0,1
accuracy,0.14402
epoch,5.0
loss,2.31036
val_accuracy,0.146
val_loss,2.30696


[34m[1mwandb[0m: Agent Starting Run: qnt616bk with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▆█▂
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▅▄▃▂▁▁
val_accuracy,▁▁▁▁▁▁▆█▂▁
val_loss,█▇▆▅▄▃▂▂▁▁

0,1
accuracy,0.1045
epoch,10.0
loss,2.27419
val_accuracy,0.10017
val_loss,2.26576


[34m[1mwandb[0m: Agent Starting Run: kbfoondc with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,█▇▅▄▃▂▃▄▂▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,█▆▆▆▆▃▃▃▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10694
epoch,10.0
loss,2.29976
val_accuracy,0.11217
val_loss,2.29931


[34m[1mwandb[0m: Agent Starting Run: 4lv0wbkk with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▄▄▅▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▅▄▃▂▂▁
val_accuracy,▁▂▃▄▅▅▆▇██
val_loss,█▇▆▅▅▄▃▂▂▁

0,1
accuracy,0.11541
epoch,10.0
loss,2.29064
val_accuracy,0.122
val_loss,2.28565


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: pucjqq9i with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▂▂▁

0,1
accuracy,0.0997
epoch,10.0
loss,2.30989
val_accuracy,0.10267
val_loss,2.30826


[34m[1mwandb[0m: Agent Starting Run: 0z12ltp1 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▆██
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▄▆▇█
val_loss,█▇▅▄▁

0,1
accuracy,0.33033
epoch,5.0
loss,2.06017
val_accuracy,0.37183
val_loss,1.92344


[34m[1mwandb[0m: Agent Starting Run: fdtv4sjt with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▂▂▃▄▄▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▃▄▅▆▆█
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09061
epoch,10.0
loss,2.30147
val_accuracy,0.08867
val_loss,2.30172


[34m[1mwandb[0m: Agent Starting Run: zeyl19c7 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▂▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▂▂▁

0,1
accuracy,0.09996
epoch,10.0
loss,2.30998
val_accuracy,0.10033
val_loss,2.30974


[34m[1mwandb[0m: Agent Starting Run: 2zg1yx3t with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▃▄▅▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▆▆▅▄▃▂▁
val_accuracy,▁▂▃▄▅▆▆▇▇█
val_loss,██▇▆▅▅▄▃▂▁

0,1
accuracy,0.38667
epoch,10.0
loss,1.98297
val_accuracy,0.41533
val_loss,1.93729


[34m[1mwandb[0m: Agent Starting Run: 5120lg40 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▆█▅▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▃▂▂▁▁
val_accuracy,▁▁▁▁▁▆█▅▁▁
val_loss,█▇▅▄▃▂▂▁▁▁

0,1
accuracy,0.10646
epoch,10.0
loss,2.25958
val_accuracy,0.10067
val_loss,2.25721


[34m[1mwandb[0m: Agent Starting Run: xrknmd49 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▄▆█
val_loss,█▇▅▃▁

0,1
accuracy,0.19513
epoch,5.0
loss,2.28424
val_accuracy,0.22617
val_loss,2.27738


[34m[1mwandb[0m: Agent Starting Run: b6hnpfe0 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▅▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▃▅▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.11004
epoch,5.0
loss,2.36065
val_accuracy,0.105
val_loss,2.35867


[34m[1mwandb[0m: Agent Starting Run: 2jwpzvmm with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.09939
epoch,5.0
loss,2.31693
val_accuracy,0.1055
val_loss,2.31788


[34m[1mwandb[0m: Agent Starting Run: zmhtsztc with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▂▂▃▄▅▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▂▂▂▃▃▄▆█
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.13722
epoch,10.0
loss,2.29735
val_accuracy,0.154
val_loss,2.29643


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: hwhrtum2 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▅█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▃██
val_loss,█▆▄▃▁

0,1
accuracy,0.08102
epoch,5.0
loss,2.41417
val_accuracy,0.08217
val_loss,2.41099


[34m[1mwandb[0m: Agent Starting Run: wuwzyegv with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▆▅▄▄▃▂▁

0,1
accuracy,0.09939
epoch,10.0
loss,2.31057
val_accuracy,0.1055
val_loss,2.30675


[34m[1mwandb[0m: Agent Starting Run: dsdqqq99 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,███▇▆▅▄▃▂▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,██▇▇▆▄▃▂▂▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.1053
epoch,10.0
loss,2.29649
val_accuracy,0.11
val_loss,2.29539


[34m[1mwandb[0m: Agent Starting Run: 3gynzrqc with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▂▃▄▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▇▆▅▄▄▃▂▁
val_accuracy,▁▂▂▃▄▅▅▆▇█
val_loss,█▇▇▆▅▄▄▃▂▁

0,1
accuracy,0.19404
epoch,10.0
loss,2.29079
val_accuracy,0.20417
val_loss,2.28981


[34m[1mwandb[0m: Agent Starting Run: e0y7xvnu with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▄▄▅▆▇▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▂▁▁▂▃▆█▇▆▇
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.10898
epoch,10.0
loss,2.3021
val_accuracy,0.10567
val_loss,2.30217


[34m[1mwandb[0m: Agent Starting Run: 8dxmee0h with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▃▄▅▆▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▂▃▄▄▅▆▆█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.1115
epoch,10.0
loss,2.29958
val_accuracy,0.11167
val_loss,2.29955


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: uubao91y with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▆▇█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▄▆▇█
val_loss,█▆▅▃▁

0,1
accuracy,0.31694
epoch,5.0
loss,2.14443
val_accuracy,0.3505
val_loss,2.09411


[34m[1mwandb[0m: Agent Starting Run: o8otlnhy with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.0997
epoch,5.0
loss,2.333
val_accuracy,0.10267
val_loss,2.33166


[34m[1mwandb[0m: Agent Starting Run: zep03hcw with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09939
epoch,10.0
loss,2.31324
val_accuracy,0.1055
val_loss,2.31082


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: uu3yflj6 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▄█
epoch,▁▃▅▆█
loss,█▅▂▁▁
val_accuracy,▁▁▄██
val_loss,█▃▁▂▂

0,1
accuracy,0.19009
epoch,5.0
loss,2.28623
val_accuracy,0.194
val_loss,2.29051


[34m[1mwandb[0m: Agent Starting Run: x0sufej0 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▄▆▇█
epoch,▁▃▅▆█
loss,█▆▅▃▁
val_accuracy,▁▄▆▇█
val_loss,█▆▅▃▁

0,1
accuracy,0.10409
epoch,5.0
loss,2.29407
val_accuracy,0.10667
val_loss,2.29116


[34m[1mwandb[0m: Agent Starting Run: fsrr1pn8 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.10017
epoch,5.0
loss,2.43911
val_accuracy,0.0985
val_loss,2.44872


[34m[1mwandb[0m: Agent Starting Run: kmyxiykq with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.10065
epoch,5.0
loss,2.43024
val_accuracy,0.09417
val_loss,2.42974


[34m[1mwandb[0m: Agent Starting Run: kt1q56yr with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▄▆█
epoch,▁▃▅▆█
loss,█▆▄▂▁
val_accuracy,▁▃▄▆█
val_loss,█▆▄▂▁

0,1
accuracy,0.13076
epoch,5.0
loss,2.3285
val_accuracy,0.12733
val_loss,2.32117


[34m[1mwandb[0m: Agent Starting Run: nqnenrz9 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09996
epoch,10.0
loss,2.48173
val_accuracy,0.10033
val_loss,2.49459


[34m[1mwandb[0m: Agent Starting Run: 1ti4b636 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,██████▆▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▅▃▂▁▁▂▂▃
val_accuracy,▁▁▁▁▁▃████
val_loss,█▆▄▂▁▁▂▂▃▃

0,1
accuracy,0.10017
epoch,10.0
loss,2.30399
val_accuracy,0.0985
val_loss,2.30419


[34m[1mwandb[0m: Agent Starting Run: 3g2z9y6p with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▁▁▁
val_loss,█▇▅▃▁

0,1
accuracy,0.09965
epoch,5.0
loss,2.31607
val_accuracy,0.10317
val_loss,2.31442


[34m[1mwandb[0m: Agent Starting Run: yhgjlash with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▅▇▇▅▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▂▂▁
val_accuracy,▄█▅▂▄█▂▁▁▄
val_loss,█▇▆▆▅▄▃▂▂▁

0,1
accuracy,0.10846
epoch,10.0
loss,2.30622
val_accuracy,0.10117
val_loss,2.30794


[34m[1mwandb[0m: Agent Starting Run: zwkc6stl with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▇▆▅▄▃▂▁

0,1
accuracy,0.09944
epoch,10.0
loss,2.31937
val_accuracy,0.105
val_loss,2.31752


[34m[1mwandb[0m: Agent Starting Run: q74zjy0n with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▅▅█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁█▆▆▃
val_loss,█▆▄▃▁

0,1
accuracy,0.10226
epoch,5.0
loss,2.44146
val_accuracy,0.10283
val_loss,2.44292


[34m[1mwandb[0m: Agent Starting Run: 5ksgfpht with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▄▆▆▆▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▆▅▄▃▁
val_accuracy,▁▄▅▅▅▅▅▇██
val_loss,██▇▇▆▆▅▄▃▁

0,1
accuracy,0.34635
epoch,10.0
loss,2.00336
val_accuracy,0.3585
val_loss,1.89638


[34m[1mwandb[0m: Agent Starting Run: uaqmx234 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▆▆█▆
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▅▃▁

0,1
accuracy,0.03085
epoch,5.0
loss,2.30291
val_accuracy,0.03117
val_loss,2.30304


[34m[1mwandb[0m: Agent Starting Run: b9cflmfd with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▃▅█
val_loss,█▇▅▃▁

0,1
accuracy,0.11065
epoch,5.0
loss,2.47025
val_accuracy,0.10067
val_loss,2.47387


[34m[1mwandb[0m: Agent Starting Run: gxfzdrwu with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▄▅▆▆▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▃▃▅▅▇▇██
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.15672
epoch,10.0
loss,2.37027
val_accuracy,0.1485
val_loss,2.37702


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: nmk4x2e0 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▄▄▄▄██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.0995
epoch,10.0
loss,2.57527
val_accuracy,0.1055
val_loss,2.56195


[34m[1mwandb[0m: Agent Starting Run: qtpjs18i with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▇█▇▅▃▂▁▁▁▂
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▅▄▃▃▂▂▁▁
val_accuracy,█▇▄▃▁▂▂▂▂▆
val_loss,█▇▅▄▄▃▂▂▁▁

0,1
accuracy,0.06306
epoch,10.0
loss,2.32335
val_accuracy,0.06767
val_loss,2.31362


[34m[1mwandb[0m: Agent Starting Run: yr89ygrz with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▄▄▆▆▇▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▃▆▆▆▆▆▆██
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.11352
epoch,10.0
loss,2.30404
val_accuracy,0.11017
val_loss,2.30385


[34m[1mwandb[0m: Agent Starting Run: hw97xtyz with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▃▅▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▅▄▃▂▂▂▁▁▁
val_accuracy,▁▁▁▃▅▅▅▆▇█
val_loss,█▆▄▃▃▂▂▂▁▁

0,1
accuracy,0.25561
epoch,10.0
loss,2.26325
val_accuracy,0.26567
val_loss,2.25855


[34m[1mwandb[0m: Agent Starting Run: 9jlu3lei with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▃▄▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▃▅▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.11604
epoch,5.0
loss,2.31602
val_accuracy,0.119
val_loss,2.31951


[34m[1mwandb[0m: Agent Starting Run: gea7605g with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▃▁▃▆█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▁▂▇█
val_loss,█▇▅▃▁

0,1
accuracy,0.10817
epoch,5.0
loss,2.3029
val_accuracy,0.10217
val_loss,2.30326


[34m[1mwandb[0m: Agent Starting Run: yrngtqp3 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▃█▆▃▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▅███
val_loss,█▆▅▃▁

0,1
accuracy,0.11463
epoch,5.0
loss,2.30208
val_accuracy,0.12183
val_loss,2.3019


[34m[1mwandb[0m: Agent Starting Run: fqqtoxdp with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▄▅▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▃▄▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.12674
epoch,5.0
loss,2.2787
val_accuracy,0.14183
val_loss,2.27068


[34m[1mwandb[0m: Agent Starting Run: 3vzkf1z5 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▃▅█
epoch,▁▃▅▆█
loss,█▇▆▄▁
val_accuracy,▁▂▄▆█
val_loss,█▇▆▄▁

0,1
accuracy,0.25402
epoch,5.0
loss,2.23974
val_accuracy,0.3055
val_loss,2.20789


[34m[1mwandb[0m: Agent Starting Run: lkcdbor8 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▂▃▅██▇
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▆▅▄▃▁
val_accuracy,▁▁▁▂▃▅██▇▆
val_loss,██▇▇▆▆▅▄▃▁

0,1
accuracy,0.19602
epoch,10.0
loss,2.265
val_accuracy,0.1905
val_loss,2.25332


[34m[1mwandb[0m: Agent Starting Run: k4c0qx8r with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▂▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▂▁

0,1
accuracy,0.09939
epoch,5.0
loss,2.30421
val_accuracy,0.1055
val_loss,2.3027


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: aff2ag2o with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▄▄█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▃▃▅█
val_loss,█▆▅▃▁

0,1
accuracy,0.29487
epoch,5.0
loss,1.93614
val_accuracy,0.444
val_loss,1.76435


[34m[1mwandb[0m: Agent Starting Run: 3kbpto7z with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▃▄▅▆▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▆▅▄▃▃▂▁
val_accuracy,▁▂▂▄▄▄▅▆▇█
val_loss,█▇▆▆▅▄▃▃▂▁

0,1
accuracy,0.13741
epoch,10.0
loss,2.31671
val_accuracy,0.13833
val_loss,2.31787


[34m[1mwandb[0m: Agent Starting Run: g99zd016 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▅▃▂▁
val_accuracy,▁▁▁▁█
val_loss,█▅▄▂▁

0,1
accuracy,0.09939
epoch,5.0
loss,2.33303
val_accuracy,0.10683
val_loss,2.31205


[34m[1mwandb[0m: Agent Starting Run: nppa98cs with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▃▄▄▄▅▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▇▆▅▄▃▂▂▁
val_accuracy,▁▃▃▃▅▅▆▆▆█
val_loss,█▇▇▆▅▄▃▂▂▁

0,1
accuracy,0.07752
epoch,10.0
loss,2.30228
val_accuracy,0.07783
val_loss,2.30228


[34m[1mwandb[0m: Agent Starting Run: 1ih7hqjw with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▂▃▅▅▇▇█▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▆▅▄▄▃▂▂▁
val_accuracy,▁▁▄▄▆▆█▇██
val_loss,█▇▆▅▅▄▃▂▂▁

0,1
accuracy,0.4855
epoch,10.0
loss,1.69046
val_accuracy,0.49467
val_loss,1.62035


[34m[1mwandb[0m: Agent Starting Run: e2zsk0u0 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▄▆█
epoch,▁▃▅▆█
loss,█▇▅▃▁
val_accuracy,▁▂▄▆█
val_loss,█▇▅▃▁

0,1
accuracy,0.10607
epoch,5.0
loss,2.30239
val_accuracy,0.11917
val_loss,2.302


[34m[1mwandb[0m: Agent Starting Run: bige7nc8 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.10083
epoch,5.0
loss,2.35075
val_accuracy,0.0925
val_loss,2.35806


[34m[1mwandb[0m: Agent Starting Run: fnpjhewk with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▅▆▆▆▆▇█
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▅▄▃▂▂▂▁▁▁
val_accuracy,▁▂▃▄▄▄▄▄▅█
val_loss,█▆▄▃▃▂▂▂▁▁

0,1
accuracy,0.21554
epoch,10.0
loss,2.26617
val_accuracy,0.29567
val_loss,2.25991


[34m[1mwandb[0m: Agent Starting Run: nnnopkny with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▃▄▄▆▇▇██
epoch,▁▂▃▃▄▅▆▆▇█
loss,█▇▇▆▆▅▄▃▂▁
val_accuracy,▁▃▃▄▆▆▆▇▇█
val_loss,██▇▆▅▅▄▃▂▁

0,1
accuracy,0.5322
epoch,10.0
loss,1.28368
val_accuracy,0.59717
val_loss,1.12044


[34m[1mwandb[0m: Agent Starting Run: c0e5xli9 with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▆▇█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▄▅▆█
val_loss,█▆▅▃▁

0,1
accuracy,0.18902
epoch,5.0
loss,2.13967
val_accuracy,0.22167
val_loss,2.09581


[34m[1mwandb[0m: Agent Starting Run: x604emy7 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 32
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▁▁▁▁▁▁▁▁
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▁▁▁▁▁▁▁▁▁
val_loss,██▇▆▆▅▄▃▂▁

0,1
accuracy,0.10017
epoch,10.0
loss,2.50254
val_accuracy,0.0985
val_loss,2.48078


[34m[1mwandb[0m: Agent Starting Run: 0d3mdxnl with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▁▁▁▁
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▁▁▁▁
val_loss,█▆▄▃▁

0,1
accuracy,0.09965
epoch,5.0
loss,2.31565
val_accuracy,0.10317
val_loss,2.31419


[34m[1mwandb[0m: Agent Starting Run: 42g9g82m with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.01
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▃▆██
epoch,▁▃▅▆█
loss,█▇▄▂▁
val_accuracy,▁▅▇▇█
val_loss,█▆▄▂▁

0,1
accuracy,0.18352
epoch,5.0
loss,2.23819
val_accuracy,0.201
val_loss,2.21434


[34m[1mwandb[0m: Agent Starting Run: q6rlomra with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


0,1
accuracy,▁▂▄▆█
epoch,▁▃▅▆█
loss,█▆▄▃▁
val_accuracy,▁▂▄▆█
val_loss,█▆▄▃▁

0,1
accuracy,0.11041
epoch,5.0
loss,2.29875
val_accuracy,0.117
val_loss,2.29787


[34m[1mwandb[0m: Agent Starting Run: 9yr6m7fp with config:
[34m[1mwandb[0m: 	activation: relu
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 3
[34m[1mwandb[0m: 	hidden_size: 64
[34m[1mwandb[0m: 	learning_rate: 0.1
[34m[1mwandb[0m: 	optimizer: momentum
[34m[1mwandb[0m: 	weight_init: xavier


0,1
accuracy,▁▁▂▄▅▅▆▆▆█
epoch,▁▂▃▃▄▅▆▆▇█
loss,██▇▇▆▅▄▃▂▁
val_accuracy,▁▂▃▄▅▅▅▅▇█
val_loss,██▇▆▆▅▃▃▁▁

0,1
accuracy,0.55793
epoch,10.0
loss,1.19563
val_accuracy,0.61333
val_loss,1.08867


[34m[1mwandb[0m: Agent Starting Run: aznflo78 with config:
[34m[1mwandb[0m: 	activation: sigmoid
[34m[1mwandb[0m: 	batch_size: 64
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	hidden_layers: 2
[34m[1mwandb[0m: 	hidden_size: 32
[34m[1mwandb[0m: 	learning_rate: 0.001
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	weight_init: random


: 