# In [None]:  (Jupyter notebook cell marker left over from export)
# --- Imports ---
import tensorflow as tf
from tensorflow.keras.layers import Layer, Dense, Input, Dropout # Conv2D etc. removed as not needed for NLP
from tensorflow.keras.models import Model # Sequential might not be needed
from tensorflow.keras.optimizers import AdamW # Standard optimizer for BERT
from tensorflow.keras.callbacks import EarlyStopping, ReduceLROnPlateau
from tensorflow.keras.utils import to_categorical
from transformers import BertTokenizer, TFBertModel, BertConfig # Key imports for BERT
import datasets as hf_datasets # Hugging Face datasets library for easy loading
import numpy as np
import pandas as pd
import random
import time
import os
import gc

# --- Configuration (general and NLP-specific) ---
# These module-level defaults are presumably passed into run_nlp_experiment by
# driver code outside this section -- TODO confirm against the caller.
RAND_SEED = 42 # Base seed; run_nlp_experiment uses RAND_SEED + run index for each run
NUM_RUNS = 1 # Number of repeated runs. Start with 1, BERT training takes longer
EPOCHS_NLP = 3 # Maximum training epochs. Fine-tuning BERT usually requires fewer epochs
PATIENCE_NLP = 2 # Patience (in epochs) for EarlyStopping
BATCH_SIZE_NLP = 16 # May need to be reduced (e.g., 8 or 4) depending on GPU/TPU memory
MAX_LENGTH = 128  # Maximum sequence length for tokenizer (inputs are truncated/padded to this)
BERT_MODEL_NAME = 'bert-base-uncased' # Pre-trained checkpoint name; a popular BERT model choice
LEARNING_RATE_BERT = 2e-5 # Typical learning rate for fine-tuning BERT

# --- Custom Activation Layers (OptimA and OptimALinear) ---
class OptimA(Layer):
    """Trainable activation layer.

    Computes, element-wise::

        alpha * tanh(beta * x) + gamma * softplus(delta * x) * sigmoid(lambda * x)

    ``alpha``, ``beta``, ``gamma``, ``delta`` and ``lambda`` are scalar
    trainable weights created in :meth:`build`.
    """

    def __init__(self, **kwargs):
        super().__init__(**kwargs)

    def build(self, input_shape):
        """Create the five scalar coefficients (1, 0.5, 1, 0.5, 1 initially)."""
        # (attribute name, weight name, initializer) -- creation order is kept
        # as alpha, beta, gamma, delta, lambda so the weight list is unchanged.
        scalar_specs = (
            ('alpha', 'alpha', 'ones'),
            ('beta', 'beta', tf.keras.initializers.Constant(0.5)),
            ('gamma', 'gamma', 'ones'),
            ('delta', 'delta', tf.keras.initializers.Constant(0.5)),
            ('lambda_', 'lambda', 'ones'),
        )
        for attr_name, weight_name, init in scalar_specs:
            weight = self.add_weight(name=weight_name, shape=(), initializer=init, trainable=True)
            setattr(self, attr_name, weight)
        super().build(input_shape)

    def call(self, x):
        """Apply the activation to ``x`` element-wise."""
        bounded = tf.math.tanh(self.beta * x)
        smooth_ramp = tf.math.softplus(self.delta * x)
        gate = tf.math.sigmoid(self.lambda_ * x)
        return self.alpha * bounded + self.gamma * smooth_ramp * gate

    def get_config(self):
        """Return the base layer config; this layer adds no constructor arguments."""
        return super().get_config()

class OptimALinear(Layer):
    """Piecewise-linear counterpart of the OptimA activation.

    Computes, element-wise::

        alpha * clip(beta * x, -1, 1)
        + gamma * (max(0, delta * x) + epsilon) * (0.5 + 0.25 * lambda * x)

    The five coefficients are scalar trainable weights; ``epsilon`` is a fixed
    constructor argument. Note that the last factor is not clipped.
    """

    def __init__(self, epsilon=1e-5, **kwargs):
        super().__init__(**kwargs)
        # Constant offset added to the rectified term in call().
        self.epsilon = epsilon

    def build(self, input_shape):
        """Create the five scalar coefficients (1, 0.5, 1, 0.5, 1 initially)."""
        # (attribute name, weight name, initializer) -- creation order is kept
        # as alpha, beta, gamma, delta, lambda so the weight list is unchanged.
        scalar_specs = (
            ('alpha', 'alpha', 'ones'),
            ('beta', 'beta', tf.keras.initializers.Constant(0.5)),
            ('gamma', 'gamma', 'ones'),
            ('delta', 'delta', tf.keras.initializers.Constant(0.5)),
            ('lambda_', 'lambda', 'ones'),
        )
        for attr_name, weight_name, init in scalar_specs:
            weight = self.add_weight(name=weight_name, shape=(), initializer=init, trainable=True)
            setattr(self, attr_name, weight)
        super().build(input_shape)

    def call(self, x):
        """Apply the activation to ``x`` element-wise."""
        clipped = tf.clip_by_value(self.beta * x, -1, 1)
        ramp = tf.maximum(0.0, self.delta * x) + self.epsilon
        gate = 0.5 + 0.25 * self.lambda_ * x
        return self.alpha * clipped + self.gamma * ramp * gate

    def get_config(self):
        """Return the base layer config extended with ``epsilon``."""
        return {**super().get_config(), 'epsilon': self.epsilon}

def set_seed(seed=42):
    """Seed Python's ``random``, NumPy and TensorFlow with ``seed``.

    Also writes ``seed`` to the ``PYTHONHASHSEED`` environment variable.
    """
    # NOTE(review): hash randomization is normally fixed when the interpreter
    # starts, so this likely only influences child processes -- confirm.
    os.environ['PYTHONHASHSEED'] = str(seed)
    for seed_fn in (random.seed, np.random.seed, tf.random.set_seed):
        seed_fn(seed)
    # Stricter determinism is possible by limiting TensorFlow to a single
    # inter-op and intra-op thread (tf.config.threading.set_*_parallelism_threads(1)),
    # but that can slow down execution, so it is not enabled here.

# Seed the RNGs once at module load; run_nlp_experiment re-seeds for each run.
set_seed(RAND_SEED)

# --- Helper to get activation layer ---
def get_activation(act_config):
    """Turn an activation specification into a Keras layer ready to be called.

    Args:
        act_config: One of
            * a string -- wrapped in ``tf.keras.layers.Activation``;
            * an ``OptimA`` / ``OptimALinear`` instance -- a fresh layer of the
              same type is returned so trainable coefficients are not shared
              with the instance that was passed in (``OptimALinear`` keeps the
              instance's ``epsilon``);
            * any other ``Layer`` instance -- returned as-is;
            * a ``Layer`` subclass -- instantiated with no arguments.

    Returns:
        A Keras ``Layer``.

    Raises:
        ValueError: If ``act_config`` is none of the supported kinds.
    """
    if isinstance(act_config, str):
        return tf.keras.layers.Activation(act_config)

    if isinstance(act_config, Layer):
        # Exact type match on purpose: subclasses are handed back unchanged
        # rather than being replaced by an instance of the base class.
        if type(act_config) is OptimA:
            return OptimA()
        if type(act_config) is OptimALinear:
            # Carry the configured epsilon over; a bare OptimALinear() would
            # silently reset it to the default.
            return OptimALinear(epsilon=act_config.epsilon)
        return act_config  # Already a usable layer instance

    if isinstance(act_config, type) and issubclass(act_config, Layer):
        return act_config()

    raise ValueError(f"Unsupported activation: {act_config}")

# --- Data Loading and Preprocessing (NLP) ---
def load_and_prepare_nlp_data(dataset_name, tokenizer, max_length, batch_size, seed):
    """Load a Hugging Face text-classification dataset as batched ``tf.data`` pipelines.

    Args:
        dataset_name: ``"imdb"`` or ``"ag_news"``.
        tokenizer: Tokenizer called as
            ``tokenizer(texts, truncation=True, padding='max_length', max_length=max_length)``.
            Its output must contain ``input_ids``, ``attention_mask`` and
            ``token_type_ids`` columns.
        max_length: Length every sequence is truncated/padded to.
        batch_size: Batch size of the returned datasets.
        seed: Seed for shuffling the training split.

    Returns:
        ``(train_ds, eval_ds, test_ds, num_classes)``. Each dataset yields
        ``({'input_ids': ..., 'attention_mask': ...}, one_hot_labels)`` batches.
        When only one of the ``validation``/``test`` splits exists, ``eval_ds``
        and ``test_ds`` are the same object built from that split.

    Raises:
        ValueError: If ``dataset_name`` is unsupported, or the dataset has
            neither a ``test`` nor a ``validation`` split.
    """
    print(f"Loading dataset: {dataset_name}")
    # Both supported datasets use the same "text"/"label" schema, so a single
    # code path covers them.
    if dataset_name not in ("imdb", "ag_news"):
        raise ValueError(f"Unsupported NLP dataset: {dataset_name}")
    # NOTE(review): trust_remote_code=True allows hub-hosted loader code to run;
    # confirm it is still required for these datasets with the installed
    # `datasets` version.
    raw_ds = hf_datasets.load_dataset(dataset_name, trust_remote_code=True)
    text_field = "text"
    label_field = "label"
    num_classes = raw_ds["train"].features[label_field].num_classes

    def tokenize_function(examples):
        return tokenizer(examples[text_field], truncation=True, padding='max_length', max_length=max_length)

    print("Tokenizing dataset...")
    tokenized_ds = raw_ds.map(tokenize_function, batched=True)
    tokenized_ds = tokenized_ds.remove_columns([text_field])
    tokenized_ds = tokenized_ds.rename_column(label_field, "labels")

    # 'token_type_ids' is formatted along with the other columns because the
    # tokenizer generates it, even though it is not forwarded to the model below.
    columns_to_format = ["input_ids", "attention_mask", "token_type_ids", "labels"]
    tokenized_ds.set_format("tensorflow", columns=columns_to_format)

    # Fail before building any pipeline if there is nothing to evaluate on.
    has_validation = "validation" in tokenized_ds
    has_test = "test" in tokenized_ds
    if not (has_validation or has_test):
        raise ValueError("Dataset must have a 'test' or 'validation' split.")

    def restructure_and_one_hot(batch_element):
        # Keep only the inputs the model consumes and one-hot encode the labels
        # (the training loss is categorical cross-entropy).
        model_inputs = {
            'input_ids': batch_element['input_ids'],
            'attention_mask': batch_element['attention_mask'],
        }
        one_hot_labels = tf.one_hot(batch_element['labels'], depth=num_classes)
        return model_inputs, one_hot_labels

    def as_tf_dataset(split, shuffle=False):
        split_ds = tokenized_ds[split]
        data_for_slicing = {col: split_ds[col] for col in columns_to_format}
        ds = tf.data.Dataset.from_tensor_slices(data_for_slicing)
        if shuffle:
            # Buffer covers the whole split, so every epoch sees a full reshuffle.
            ds = ds.shuffle(buffer_size=len(split_ds), seed=seed, reshuffle_each_iteration=True)
        ds = ds.batch(batch_size)
        ds = ds.map(restructure_and_one_hot, num_parallel_calls=tf.data.AUTOTUNE)
        return ds.prefetch(tf.data.AUTOTUNE)

    tf_train_dataset = as_tf_dataset("train", shuffle=True)

    if has_validation and has_test:
        tf_eval_dataset = as_tf_dataset("validation")  # Validation during training
        tf_test_dataset = as_tf_dataset("test")        # Final evaluation
    elif has_test:
        print("Warning: No 'validation' split found. Using 'test' split for evaluation during training and final testing.")
        # For rigorous research, separate validation and test splits are recommended.
        tf_eval_dataset = as_tf_dataset("test")
        tf_test_dataset = tf_eval_dataset
    else:
        # Validation exists but test does not: reuse validation for both roles
        # instead of failing with a KeyError on the missing "test" split.
        print("Warning: No 'test' split found. Using 'validation' split for evaluation during training and final testing.")
        tf_eval_dataset = as_tf_dataset("validation")
        tf_test_dataset = tf_eval_dataset

    print(f"Number of classes for {dataset_name}: {num_classes}")
    return tf_train_dataset, tf_eval_dataset, tf_test_dataset, num_classes

# --- Model Building (NLP with BERT) ---
def build_bert_classifier_model(bert_model_name_local, num_classes_local, activation_func_config, max_length_local, strategy=None):
    """Build a BERT encoder with a small dense classification head.

    The head is: dropout(0.2) -> Dense(256) -> configured activation ->
    dropout(0.2) -> Dense(num_classes, softmax), applied to BERT's pooled output.
    The model is returned uncompiled.

    Args:
        bert_model_name_local: Name passed to ``TFBertModel.from_pretrained``.
        num_classes_local: Number of units in the softmax output layer.
        activation_func_config: Activation spec accepted by ``get_activation``
            (string, layer instance, or layer class).
        max_length_local: Sequence length of the ``input_ids`` and
            ``attention_mask`` inputs.
        strategy: Optional ``tf.distribute`` strategy whose scope the model is
            created in. When ``None``, the strategy that is current at call
            time is used (the default strategy outside any scope).

    Returns:
        A Keras ``Model`` named ``BERT_<activation>_Classifier`` taking a dict
        with ``input_ids`` and ``attention_mask``.
    """
    # Derive a readable activation label for the model name.
    if isinstance(activation_func_config, str):
        activation_name = activation_func_config
    elif hasattr(activation_func_config, '__name__'):
        activation_name = activation_func_config.__name__
    else:
        activation_name = activation_func_config.__class__.__name__

    # Without an explicit strategy, defer to the current/default strategy
    # rather than pinning the whole model to the CPU, so normal device
    # placement still applies when an accelerator is available.
    if strategy is None:
        strategy = tf.distribute.get_strategy()

    with strategy.scope():
        # 1. Load pre-trained BERT and fine-tune all of its layers.
        bert_model_layer = TFBertModel.from_pretrained(bert_model_name_local)
        bert_model_layer.trainable = True

        # Input layers
        input_ids = Input(shape=(max_length_local,), dtype=tf.int32, name='input_ids')
        attention_mask = Input(shape=(max_length_local,), dtype=tf.int32, name='attention_mask')

        # 2. Pass inputs through BERT and take the pooled output.
        bert_outputs = bert_model_layer(input_ids=input_ids, attention_mask=attention_mask)
        pooled_output = bert_outputs.pooler_output

        # 3. Custom classifier head with the activation under test.
        x = Dropout(0.2, name='dropout_bert_out')(pooled_output)
        x = Dense(256, name='dense_pre_activation')(x)
        x = get_activation(activation_func_config)(x)
        x = Dropout(0.2, name='dropout_post_activation')(x)
        output_tensor = Dense(num_classes_local, activation='softmax', name='classifier_output')(x)

        model_inputs = {'input_ids': input_ids, 'attention_mask': attention_mask}
        model = Model(inputs=model_inputs, outputs=output_tensor, name=f"BERT_{activation_name}_Classifier")

    return model

# --- Experiment Execution (adapted for NLP) ---
def _select_distribution_strategy():
    """Pick a ``tf.distribute`` strategy: TPU if reachable, else mirrored GPUs, else the default."""
    try:
        tpu = tf.distribute.cluster_resolver.TPUClusterResolver.connect()
        strategy = tf.distribute.TPUStrategy(tpu)
        # master() is a method of the resolver itself.
        print('Running on TPU:', tpu.master())
    except ValueError:
        print("TPU not found. Using default strategy (CPU/GPU).")
        gpus = tf.config.list_physical_devices('GPU')
        if gpus:
            # Single-host synchronous training across the local GPU(s).
            strategy = tf.distribute.MirroredStrategy()
            print(f"Running on {len(gpus)} GPU(s).")
        else:
            strategy = tf.distribute.get_strategy()  # Default strategy (CPU)
            print("Running on CPU.")
    print(f"Number of accelerators: {strategy.num_replicas_in_sync}")
    return strategy


def run_nlp_experiment(nlp_datasets_config, activations_config, nlp_optimizers_config,
                       num_runs, epochs_nlp_local, batch_size_nlp_local, patience_nlp_local,
                       max_len, bert_model_n_local):
    """Train and evaluate a BERT classifier for every dataset/optimizer/activation combination.

    Args:
        nlp_datasets_config: Mapping of dataset name to a config dict; the
            ``'task'`` entry is read for logging.
        activations_config: Mapping of display name to an activation spec
            accepted by ``build_bert_classifier_model``.
        nlp_optimizers_config: Mapping of display name to a zero-argument
            callable returning a fresh optimizer.
        num_runs: Number of repetitions; run ``i`` is seeded with ``RAND_SEED + i``.
        epochs_nlp_local: Maximum epochs per training.
        batch_size_nlp_local: Batch size for all datasets.
        patience_nlp_local: EarlyStopping patience; ReduceLROnPlateau uses
            ``patience // 2 + 1``.
        max_len: Tokenizer/model sequence length.
        bert_model_n_local: Pre-trained BERT checkpoint name.

    Returns:
        ``(results, histories)``. Both are nested dicts keyed by dataset,
        optimizer and activation name. ``results`` leaves hold per-run lists
        under ``'loss'``, ``'accuracy'``, ``'time'`` and ``'params'``;
        ``histories`` leaves hold the per-run Keras ``history`` dicts.
    """
    results = {}
    histories = {}

    tokenizer = BertTokenizer.from_pretrained(bert_model_n_local)
    strategy = _select_distribution_strategy()

    for run_idx in range(num_runs):
        print(f"\n--- Starting NLP Run {run_idx + 1}/{num_runs} ---")
        current_seed = RAND_SEED + run_idx
        set_seed(current_seed)  # Distinct but reproducible seed per run

        for dataset_name, dataset_cfg in nlp_datasets_config.items():
            print(f"\nNLP Dataset: {dataset_name} (Task: {dataset_cfg['task']})")
            results.setdefault(dataset_name, {})
            histories.setdefault(dataset_name, {})

            print(f"Loading and tokenizing {dataset_name} for run {run_idx + 1}...")
            # current_seed also drives the training-set shuffle.
            train_ds, val_ds, test_ds, num_classes_ds = load_and_prepare_nlp_data(
                dataset_name, tokenizer, max_len, batch_size_nlp_local, current_seed
            )

            loss_f = 'categorical_crossentropy'
            eval_m = ['accuracy']
            primary_m_name = 'accuracy'
            # Position of the primary metric in model.evaluate()'s list output
            # (index 0 is the loss).
            primary_m_idx = 1

            for opt_name, opt_creator in nlp_optimizers_config.items():
                print(f"  Optimizer: {opt_name} (Run {run_idx + 1})")
                results[dataset_name].setdefault(opt_name, {})
                histories[dataset_name].setdefault(opt_name, {})

                for act_name, act_cfg_val in activations_config.items():
                    print(f"    Activation: {act_name}")
                    if act_name not in results[dataset_name][opt_name]:
                        results[dataset_name][opt_name][act_name] = {'loss': [], primary_m_name: [], 'time': [], 'params': []}
                        histories[dataset_name][opt_name][act_name] = []

                    # Start every configuration from a clean Keras state and the
                    # same seed so activations are compared on equal footing.
                    tf.keras.backend.clear_session()
                    gc.collect()
                    set_seed(current_seed)

                    # Model and optimizer variables must be created under the strategy.
                    with strategy.scope():
                        model = build_bert_classifier_model(bert_model_n_local, num_classes_ds, act_cfg_val, max_len, strategy)
                        opt_instance = opt_creator()
                        model.compile(optimizer=opt_instance, loss=loss_f, metrics=eval_m)

                    mon_metric = 'val_accuracy'  # Monitored by both callbacks
                    cbs = [
                        EarlyStopping(monitor=mon_metric, patience=patience_nlp_local, restore_best_weights=True, verbose=1),
                        ReduceLROnPlateau(monitor=mon_metric, factor=0.2, patience=patience_nlp_local // 2 + 1, min_lr=1e-7, verbose=1)
                    ]

                    start_t = time.time()
                    print(f"Starting training: {dataset_name}/{opt_name}/{act_name}...")
                    hist = model.fit(
                        train_ds,
                        epochs=epochs_nlp_local,
                        validation_data=val_ds,
                        callbacks=cbs,
                        verbose=1
                    )
                    train_time = time.time() - start_t

                    print(f"Evaluating model on test set: {dataset_name}/{opt_name}/{act_name}...")
                    # return_dict=False yields a list: [loss, accuracy].
                    eval_res = model.evaluate(test_ds, verbose=0, return_dict=False)

                    eval_l, eval_pm = eval_res[0], eval_res[primary_m_idx]
                    n_params = model.count_params()

                    res_dict = results[dataset_name][opt_name][act_name]
                    res_dict['loss'].append(eval_l)
                    res_dict[primary_m_name].append(eval_pm)
                    res_dict['time'].append(train_time)
                    res_dict['params'].append(n_params)
                    histories[dataset_name][opt_name][act_name].append(hist.history)
                    print(f"      Test Loss: {eval_l:.4f}, Test {primary_m_name.capitalize()}: {eval_pm:.4f}, Time: {train_time:.2f}s, Params: {n_params}")

                    # Drop references before the next (large) model is built.
                    del model, opt_instance, hist
                    gc.collect()

            # Release the dataset pipelines before loading the next dataset.
            del train_ds, val_ds, test_ds
            gc.collect()
    return results, histories

# --- Aggregate and Display Results ---
def aggregate_and_display_results(final_results, datasets_cfg_local, all_histories_local, num_runs_executed):
    """Aggregate per-run benchmark results and print a summary table.

    Args:
        final_results: Nested dict ``{dataset: {optimizer: {activation: metrics}}}``.
            ``metrics`` maps ``'loss'``, ``'time'``, ``'params'`` and the primary
            metric key (``'accuracy'`` or ``'mae'``) to lists holding one value per run.
        datasets_cfg_local: Dict mapping each dataset name to a config dict whose
            ``'task'`` entry is ``'classification'`` (primary metric: accuracy,
            higher is better) or anything else (primary metric: MAE, lower is better).
        all_histories_local: Not used by this function; kept for call-site compatibility.
        num_runs_executed: Not used by this function; kept for call-site compatibility.

    Returns:
        None. The per-dataset winners and the aggregated table are printed to stdout.

    Side effects:
        Sets the global pandas option ``display.float_format`` to four decimals.
    """
    aggregated = {}
    best_metric_overall = {}  # Best average primary metric found for each dataset

    # First pass: aggregate every combination and track the best one per dataset
    for ds_name, opt_data in final_results.items():
        task = datasets_cfg_local[ds_name]['task']  # 'classification' or 'regression'
        higher_is_better = task == 'classification'
        primary_metric_key = 'accuracy' if higher_is_better else 'mae'  # Adapt if using other metrics
        metric_cap = primary_metric_key.capitalize()

        # Start from the worst possible value so that any real measurement
        # (including an accuracy of exactly 0.0) can be selected as the best.
        best = {
            'value': float('-inf') if higher_is_better else float('inf'),
            'optimizer': None,
            'activation': None,
            'is_higher_better': higher_is_better,
            'metric_cap': metric_cap,
        }
        best_metric_overall[ds_name] = best
        aggregated[ds_name] = {}

        for opt_n, act_data in opt_data.items():
            aggregated[ds_name][opt_n] = {}
            for act_n, metrics_vals in act_data.items():
                if not metrics_vals['loss']:
                    # No completed run for this combination: keep the row, filled with NaN
                    agg_data = dict.fromkeys(
                        ['Avg Loss', 'Std Loss',
                         f'Avg {metric_cap}', f'Std {metric_cap}',
                         'Avg Time', 'Std Time', 'Avg Params'],
                        np.nan,
                    )
                else:
                    avg_primary_metric = np.mean(metrics_vals[primary_metric_key])
                    agg_data = {
                        'Avg Loss': np.mean(metrics_vals['loss']),
                        'Std Loss': np.std(metrics_vals['loss']),
                        f'Avg {metric_cap}': avg_primary_metric,
                        f'Std {metric_cap}': np.std(metrics_vals[primary_metric_key]),
                        'Avg Time': np.mean(metrics_vals['time']),
                        'Std Time': np.std(metrics_vals['time']),
                        'Avg Params': int(np.mean(metrics_vals['params'])) if metrics_vals['params'] else np.nan,
                    }

                    # NaN compares False in both directions, so a NaN average never wins
                    if higher_is_better:
                        is_better = avg_primary_metric > best['value']
                    else:
                        is_better = avg_primary_metric < best['value']
                    if is_better:
                        best.update(value=avg_primary_metric, optimizer=opt_n, activation=act_n)

                aggregated[ds_name][opt_n][act_n] = agg_data

    # Second pass: flatten into one row per (dataset, optimizer, activation)
    all_rows = []
    for ds, o_data in aggregated.items():
        best = best_metric_overall[ds]
        best_col = f"Best {best['metric_cap']}"
        for o, a_data in o_data.items():
            for a, m_vals in a_data.items():
                is_best_current_combo = best['optimizer'] == o and best['activation'] == a
                row = {'Dataset': ds, 'Optimizer': o, 'Activation': a}
                row.update(m_vals)
                # Mark the best combination for this dataset
                row[best_col] = '★' if is_best_current_combo else ''
                all_rows.append(row)

    df_res = pd.DataFrame(all_rows)
    if not df_res.empty:
        df_res = df_res.set_index(['Dataset', 'Optimizer', 'Activation'])
        # Preferred order: Best/Avg/Std of the primary metric(s), then loss, time, params
        cols_order = [f'{prefix} {m_cap}'
                      for prefix in ('Best', 'Avg', 'Std')
                      for m_cap in ('Accuracy', 'Mae')]  # Add other primary metrics if used
        cols_order += ['Avg Loss', 'Std Loss', 'Avg Time', 'Std Time', 'Avg Params']
        cols_order = [col for col in cols_order if col in df_res.columns]  # Only existing columns
        df_res = df_res.reindex(columns=cols_order).sort_index()

    print("\n--- Aggregated NLP Benchmark Results ---")
    if best_metric_overall:
        print("\nBest Performing Combinations per Dataset:")
        for ds, info in best_metric_overall.items():
            if info['optimizer'] is None:
                # Every combination failed or produced NaN; do not report a fake winner
                print(f"  {ds}: no valid results")
                continue
            metric_name = 'Accuracy' if info['is_higher_better'] else 'MAE'  # Or other relevant metric name
            print(f"  {ds}: {info['optimizer']} with {info['activation']} ({metric_name}: {info['value']:.4f})")

    pd.options.display.float_format = '{:.4f}'.format
    print(df_res.dropna(axis=1, how='all') if not df_res.empty else "No NLP results to display.")

# --- Main Execution (NLP) ---
if __name__ == "__main__":
    # Script entry point: configure the benchmark, run it, and print the aggregated results.
    # Ensure internet access for downloading Hugging Face models and datasets.

    # Ask the Hugging Face hub client to hide its download progress bars.
    # NOTE(review): huggingface_hub appears to read this variable when it is first
    # imported; transformers/datasets are imported at the top of this file, so this
    # assignment may come too late to take effect — confirm.
    os.environ["HF_HUB_DISABLE_PROGRESS_BARS"] = "1"

    # NLP datasets for the benchmark, keyed by dataset name
    nlp_datasets_run_cfg = {
        "imdb": {"task": "classification"},  # Using 'classification' as the task type
        # "ag_news": {"task": "classification"}, # More datasets can be added if time/resources permit
    }
    if not nlp_datasets_run_cfg:
        print("No NLP datasets configured. Exiting.")
        # `exit()` is a helper injected by the `site` module for interactive sessions;
        # raising SystemExit is the form that works in every execution environment.
        raise SystemExit(0)

    # Activation functions to compare: custom layer classes or a Keras activation name
    activations_run_cfg = {
        'OptimA': OptimA,
        'OptimALinear': OptimALinear,
        'GeLU': 'gelu',  # GeLU is a standard activation in BERT
    }

    # Optimizers for BERT fine-tuning. Each value is a zero-argument factory.
    nlp_optimizers_run_cfg = {
        # AdamW is standard for BERT. Epsilon is often 1e-8 for Transformers.
        # NOTE(review): beta_1=0.95 and amsgrad=True differ from the Keras AdamW
        # defaults (beta_1=0.9, amsgrad=False) — confirm this is intentional.
        'AdamW_BERT': lambda: AdamW(learning_rate=LEARNING_RATE_BERT, epsilon=1e-8, beta_1=0.95, beta_2=0.999, amsgrad=True),
        # Other AdamW variations or optimizers can be added for comparison if desired
    }

    print("--- NLP BENCHMARK ---")
    print(f"BERT Model: {BERT_MODEL_NAME}, Max Sequence Length: {MAX_LENGTH}")
    print(f"Effective Batch Size: {BATCH_SIZE_NLP}, Epochs: {EPOCHS_NLP}, Number of Runs: {NUM_RUNS}")

    # Run NLP experiments
    final_nlp_data, all_nlp_hists = run_nlp_experiment(
        nlp_datasets_run_cfg, activations_run_cfg, nlp_optimizers_run_cfg,
        num_runs=NUM_RUNS, epochs_nlp_local=EPOCHS_NLP, batch_size_nlp_local=BATCH_SIZE_NLP,
        patience_nlp_local=PATIENCE_NLP, max_len=MAX_LENGTH, bert_model_n_local=BERT_MODEL_NAME
    )

    # Display aggregated NLP results
    aggregate_and_display_results(final_nlp_data, nlp_datasets_run_cfg, all_nlp_hists, NUM_RUNS)

2025-05-10 16:10:12.658963: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
2025-05-10 16:10:12.658993: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
2025-05-10 16:10:12.659955: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered
2025-05-10 16:10:12.665139: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


--- NLP BENCHMARK ---
BERT Model: bert-base-uncased, Max Sequence Length: 128
Effective Batch Size: 16, Epochs: 3, Number of Runs: 1




TPU not found. Using default strategy (CPU/GPU).


2025-05-10 16:10:15.881493: I external/local_xla/xla/stream_executor/cuda/cuda_executor.cc:901] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero. See more at https://github.com/torvalds/linux/blob/v6.0/Documentation/ABI/testing/sysfs-bus-pci#L344-L355
2025-05-10 16:10:15.889849: I external/local_xla/xla/stream_executor/cuda/cuda_executor.cc:901] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero. See more at https://github.com/torvalds/linux/blob/v6.0/Documentation/ABI/testing/sysfs-bus-pci#L344-L355
2025-05-10 16:10:15.923143: I external/local_xla/xla/stream_executor/cuda/cuda_executor.cc:901] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero. See more at https://github.com/torvalds/linux/blob/v6.0/Documentation/ABI/testing/sysfs-bus-pci#L344-

INFO:tensorflow:Using MirroredStrategy with devices ('/device:GPU:0', '/device:GPU:1')


2025-05-10 16:10:16.179147: I external/local_xla/xla/stream_executor/cuda/cuda_executor.cc:901] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero. See more at https://github.com/torvalds/linux/blob/v6.0/Documentation/ABI/testing/sysfs-bus-pci#L344-L355
2025-05-10 16:10:16.180493: I external/local_xla/xla/stream_executor/cuda/cuda_executor.cc:901] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero. See more at https://github.com/torvalds/linux/blob/v6.0/Documentation/ABI/testing/sysfs-bus-pci#L344-L355
2025-05-10 16:10:16.181713: I external/local_xla/xla/stream_executor/cuda/cuda_executor.cc:901] successful NUMA node read from SysFS had negative value (-1), but there must be at least one NUMA node, so returning NUMA node zero. See more at https://github.com/torvalds/linux/blob/v6.0/Documentation/ABI/testing/sysfs-bus-pci#L344-

INFO:tensorflow:Single-worker MultiWorkerMirroredStrategy with local_devices = ('/device:GPU:0', '/device:GPU:1'), communication = CommunicationImplementation.AUTO
Running on 2 GPU(s).
Number of accelerators: 2

--- Starting NLP Run 1/1 ---

NLP Dataset: imdb (Task: classification)
Loading and tokenizing imdb for run 1...
Loading dataset: imdb
Tokenizing dataset...


2025-05-10 16:10:26.196940: I external/local_tsl/tsl/platform/default/subprocess.cc:304] Start cannot spawn child process: No such file or directory


Number of classes for imdb: 2
  Optimizer: AdamW_BERT (Run 1)
    Activation: OptimA


Some weights of the PyTorch model were not used when initializing the TF 2.0 model TFBertModel: ['cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.transform.dense.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias']
- This IS expected if you are initializing TFBertModel from a PyTorch model trained on another task or with another architecture (e.g. initializing a TFBertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing TFBertModel from a PyTorch model that you expect to be exactly identical (e.g. initializing a TFBertForSequenceClassification model from a BertForSequenceClassification model).
All the weights of TFBertModel were initialized from the PyTorch model.
If your task is similar to the task the model of the checkpoint was trained on, you can already use TFBertModel for predictions w

Starting training: imdb/AdamW_BERT/OptimA...
Epoch 1/3
INFO:tensorflow:Collective all_reduce tensors: 205 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, num_packs = 1
INFO:tensorflow:Collective all_reduce IndexedSlices: 3 all_reduces, num_devices =2, group_size = 2, implementation = CommunicationImplementation.AUTO
INFO:tensorflow:Collective all_reduce tensors: 1 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, num_packs = 1
INFO:tensorflow:Collective all_reduce tensors: 1 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, num_packs = 1
INFO:tensorflow:Collective all_reduce tensors: 1 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, num_packs = 1
INFO:tensorflow:Collective all_reduce tensors: 1 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, num_pac

2025-05-10 16:11:04.342518: I external/local_xla/xla/service/service.cc:168] XLA service 0x7b41521d6170 initialized for platform CUDA (this does not guarantee that XLA will be used). Devices:
2025-05-10 16:11:04.342541: I external/local_xla/xla/service/service.cc:176]   StreamExecutor device (0): NVIDIA RTX A4500, Compute Capability 8.6
2025-05-10 16:11:04.342547: I external/local_xla/xla/service/service.cc:176]   StreamExecutor device (1): NVIDIA RTX A4500, Compute Capability 8.6
2025-05-10 16:11:04.347475: I tensorflow/compiler/mlir/tensorflow/utils/dump_mlir_util.cc:269] disabling MLIR crash reproducer, set env var `MLIR_CRASH_REPRODUCER_DIRECTORY` to enable.
2025-05-10 16:11:04.366691: I external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:454] Loaded cuDNN version 8904
2025-05-10 16:11:04.368464: I external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:454] Loaded cuDNN version 8904
I0000 00:00:1746882664.434822   31920 device_compiler.h:186] Compiled cluster using XLA!  This 

INFO:tensorflow:Collective all_reduce tensors: 1 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, num_packs = 1
INFO:tensorflow:Collective all_reduce tensors: 1 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, num_packs = 1
INFO:tensorflow:Collective all_reduce tensors: 1 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, num_packs = 1
Epoch 2/3
Epoch 3/3
Evaluating model on test set: imdb/AdamW_BERT/OptimA...
      Test Loss: 0.3316, Test Accuracy: 0.8874, Time: 816.37s, Params: 109679623
    Activation: OptimALinear


Some weights of the PyTorch model were not used when initializing the TF 2.0 model TFBertModel: ['cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.transform.dense.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias']
- This IS expected if you are initializing TFBertModel from a PyTorch model trained on another task or with another architecture (e.g. initializing a TFBertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing TFBertModel from a PyTorch model that you expect to be exactly identical (e.g. initializing a TFBertForSequenceClassification model from a BertForSequenceClassification model).
All the weights of TFBertModel were initialized from the PyTorch model.
If your task is similar to the task the model of the checkpoint was trained on, you can already use TFBertModel for predictions w

Starting training: imdb/AdamW_BERT/OptimALinear...
Epoch 1/3
INFO:tensorflow:Collective all_reduce tensors: 205 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, num_packs = 1
INFO:tensorflow:Collective all_reduce IndexedSlices: 3 all_reduces, num_devices =2, group_size = 2, implementation = CommunicationImplementation.AUTO
INFO:tensorflow:Collective all_reduce tensors: 1 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, num_packs = 1
INFO:tensorflow:Collective all_reduce tensors: 1 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, num_packs = 1
INFO:tensorflow:Collective all_reduce tensors: 1 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, num_packs = 1
INFO:tensorflow:Collective all_reduce tensors: 1 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, n

Some weights of the PyTorch model were not used when initializing the TF 2.0 model TFBertModel: ['cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.transform.dense.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias']
- This IS expected if you are initializing TFBertModel from a PyTorch model trained on another task or with another architecture (e.g. initializing a TFBertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing TFBertModel from a PyTorch model that you expect to be exactly identical (e.g. initializing a TFBertForSequenceClassification model from a BertForSequenceClassification model).
All the weights of TFBertModel were initialized from the PyTorch model.
If your task is similar to the task the model of the checkpoint was trained on, you can already use TFBertModel for predictions w

Starting training: imdb/AdamW_BERT/GeLU...
Epoch 1/3
INFO:tensorflow:Collective all_reduce tensors: 200 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, num_packs = 1
INFO:tensorflow:Collective all_reduce IndexedSlices: 3 all_reduces, num_devices =2, group_size = 2, implementation = CommunicationImplementation.AUTO
INFO:tensorflow:Collective all_reduce tensors: 1 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, num_packs = 1
INFO:tensorflow:Collective all_reduce tensors: 1 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, num_packs = 1
INFO:tensorflow:Collective all_reduce tensors: 1 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, num_packs = 1
INFO:tensorflow:Collective all_reduce tensors: 1 all_reduces, num_devices = 2, group_size = 2, implementation = CommunicationImplementation.AUTO, num_packs

  13/1563 [..............................] - ETA: 2:51:35 - loss: 0.7680 - accuracy: 0.5481

  14/1563 [..............................] - ETA: 2:50:59 - loss: 0.7485 - accuracy: 0.5670

  15/1563 [..............................] - ETA: 2:51:08 - loss: 0.7497 - accuracy: 0.5625

  16/1563 [..............................] - ETA: 2:51:19 - loss: 0.7482 - accuracy: 0.5586

  17/1563 [..............................] - ETA: 2:51:48 - loss: 0.7619 - accuracy: 0.5515

  18/1563 [..............................] - ETA: 2:53:47 - loss: 0.7609 - accuracy: 0.5521

  19/1563 [..............................] - ETA: 2:54:15 - loss: 0.7614 - accuracy: 0.5559

  20/1563 [..............................] - ETA: 2:53:48 - loss: 0.7657 - accuracy: 0.5469

  21/1563 [..............................] - ETA: 2:53:26 - loss: 0.7687 - accuracy: 0.5417

  22/1563 [..............................] - ETA: 2:53:00 - loss: 0.7754 - accuracy: 0.5398

  23/1563 [..............................] - ETA: 2:53:04 - loss: 0.7709 - accuracy: 0.5462

  24/1563 [..............................] - ETA: 2:52:33 - loss: 0.7664 - accuracy: 0.5469

  25/1563 [..............................] - ETA: 2:52:08 - loss: 0.7626 - accuracy: 0.5525

  26/1563 [..............................] - ETA: 2:51:52 - loss: 0.7641 - accuracy: 0.5505

  27/1563 [..............................] - ETA: 2:51:39 - loss: 0.7613 - accuracy: 0.5509

  28/1563 [..............................] - ETA: 2:51:59 - loss: 0.7631 - accuracy: 0.5491

  29/1563 [..............................] - ETA: 2:51:43 - loss: 0.7563 - accuracy: 0.5517

  30/1563 [..............................] - ETA: 2:51:30 - loss: 0.7519 - accuracy: 0.5604

  31/1563 [..............................] - ETA: 2:51:13 - loss: 0.7504 - accuracy: 0.5625

  32/1563 [..............................] - ETA: 2:51:01 - loss: 0.7538 - accuracy: 0.5586

  33/1563 [..............................] - ETA: 2:51:07 - loss: 0.7544 - accuracy: 0.5587

  34/1563 [..............................] - ETA: 2:50:46 - loss: 0.7556 - accuracy: 0.5570

  35/1563 [..............................] - ETA: 2:50:34 - loss: 0.7566 - accuracy: 0.5500

  36/1563 [..............................] - ETA: 2:50:20 - loss: 0.7509 - accuracy: 0.5556

  37/1563 [..............................] - ETA: 2:50:11 - loss: 0.7472 - accuracy: 0.5574

  38/1563 [..............................] - ETA: 2:50:24 - loss: 0.7499 - accuracy: 0.5559

  39/1563 [..............................] - ETA: 2:50:13 - loss: 0.7541 - accuracy: 0.5497

  40/1563 [..............................] - ETA: 2:50:06 - loss: 0.7506 - accuracy: 0.5531

  41/1563 [..............................] - ETA: 2:49:59 - loss: 0.7499 - accuracy: 0.5564

  42/1563 [..............................] - ETA: 2:50:06 - loss: 0.7468 - accuracy: 0.5580

  43/1563 [..............................] - ETA: 2:50:07 - loss: 0.7444 - accuracy: 0.5596

  44/1563 [..............................] - ETA: 2:50:02 - loss: 0.7387 - accuracy: 0.5653

  45/1563 [..............................] - ETA: 2:49:52 - loss: 0.7381 - accuracy: 0.5681

  46/1563 [..............................] - ETA: 2:49:44 - loss: 0.7353 - accuracy: 0.5666

  47/1563 [..............................] - ETA: 2:49:57 - loss: 0.7351 - accuracy: 0.5678

  48/1563 [..............................] - ETA: 2:49:47 - loss: 0.7331 - accuracy: 0.5664

  49/1563 [..............................] - ETA: 2:49:42 - loss: 0.7345 - accuracy: 0.5663

  50/1563 [..............................] - ETA: 2:49:35 - loss: 0.7344 - accuracy: 0.5675

  51/1563 [..............................] - ETA: 2:49:26 - loss: 0.7282 - accuracy: 0.5723

  52/1563 [..............................] - ETA: 2:49:35 - loss: 0.7252 - accuracy: 0.5745

  53/1563 [>.............................] - ETA: 2:49:28 - loss: 0.7256 - accuracy: 0.5743

  54/1563 [>.............................] - ETA: 2:49:22 - loss: 0.7210 - accuracy: 0.5799

  55/1563 [>.............................] - ETA: 2:49:15 - loss: 0.7190 - accuracy: 0.5807

  56/1563 [>.............................] - ETA: 2:49:08 - loss: 0.7132 - accuracy: 0.5848

  57/1563 [>.............................] - ETA: 2:49:17 - loss: 0.7126 - accuracy: 0.5844

  58/1563 [>.............................] - ETA: 2:49:09 - loss: 0.7063 - accuracy: 0.5894

  59/1563 [>.............................] - ETA: 2:49:03 - loss: 0.7058 - accuracy: 0.5911

  60/1563 [>.............................] - ETA: 2:48:55 - loss: 0.7085 - accuracy: 0.5875

  61/1563 [>.............................] - ETA: 2:48:46 - loss: 0.7044 - accuracy: 0.5891

  62/1563 [>.............................] - ETA: 2:48:53 - loss: 0.7048 - accuracy: 0.5887

  63/1563 [>.............................] - ETA: 2:48:45 - loss: 0.7025 - accuracy: 0.5903

  64/1563 [>.............................] - ETA: 2:48:35 - loss: 0.7006 - accuracy: 0.5938

  65/1563 [>.............................] - ETA: 2:48:26 - loss: 0.6977 - accuracy: 0.5962

  66/1563 [>.............................] - ETA: 2:48:17 - loss: 0.6957 - accuracy: 0.5985

  67/1563 [>.............................] - ETA: 2:48:19 - loss: 0.6936 - accuracy: 0.5998

  68/1563 [>.............................] - ETA: 2:48:12 - loss: 0.6873 - accuracy: 0.6048

  69/1563 [>.............................] - ETA: 2:48:03 - loss: 0.6829 - accuracy: 0.6060

  70/1563 [>.............................] - ETA: 2:47:53 - loss: 0.6808 - accuracy: 0.6071

  71/1563 [>.............................] - ETA: 2:47:47 - loss: 0.6849 - accuracy: 0.6048

  72/1563 [>.............................] - ETA: 2:47:48 - loss: 0.6879 - accuracy: 0.6050

  73/1563 [>.............................] - ETA: 2:47:39 - loss: 0.6901 - accuracy: 0.6045

  74/1563 [>.............................] - ETA: 2:47:30 - loss: 0.6886 - accuracy: 0.6056

  75/1563 [>.............................] - ETA: 2:47:20 - loss: 0.6855 - accuracy: 0.6075

  76/1563 [>.............................] - ETA: 2:47:17 - loss: 0.6911 - accuracy: 0.6061

  77/1563 [>.............................] - ETA: 2:47:11 - loss: 0.6860 - accuracy: 0.6088

  78/1563 [>.............................] - ETA: 2:47:02 - loss: 0.6882 - accuracy: 0.6090

  79/1563 [>.............................] - ETA: 2:46:53 - loss: 0.6867 - accuracy: 0.6100

  80/1563 [>.............................] - ETA: 2:46:45 - loss: 0.6842 - accuracy: 0.6125

  81/1563 [>.............................] - ETA: 2:46:46 - loss: 0.6786 - accuracy: 0.6165

  82/1563 [>.............................] - ETA: 2:46:38 - loss: 0.6744 - accuracy: 0.6189

  83/1563 [>.............................] - ETA: 2:46:29 - loss: 0.6725 - accuracy: 0.6205

  84/1563 [>.............................] - ETA: 2:46:21 - loss: 0.6703 - accuracy: 0.6220

  85/1563 [>.............................] - ETA: 2:46:13 - loss: 0.6677 - accuracy: 0.6243

  86/1563 [>.............................] - ETA: 2:46:15 - loss: 0.6656 - accuracy: 0.6272

  87/1563 [>.............................] - ETA: 2:46:07 - loss: 0.6596 - accuracy: 0.6315

  88/1563 [>.............................] - ETA: 2:45:59 - loss: 0.6574 - accuracy: 0.6335

  89/1563 [>.............................] - ETA: 2:45:50 - loss: 0.6547 - accuracy: 0.6362

  90/1563 [>.............................] - ETA: 2:45:42 - loss: 0.6521 - accuracy: 0.6382

  91/1563 [>.............................] - ETA: 2:45:44 - loss: 0.6507 - accuracy: 0.6401

  92/1563 [>.............................] - ETA: 2:45:35 - loss: 0.6504 - accuracy: 0.6399

  93/1563 [>.............................] - ETA: 2:45:27 - loss: 0.6496 - accuracy: 0.6398

  94/1563 [>.............................] - ETA: 2:45:20 - loss: 0.6497 - accuracy: 0.6403

  95/1563 [>.............................] - ETA: 2:45:11 - loss: 0.6470 - accuracy: 0.6428

  96/1563 [>.............................] - ETA: 2:45:12 - loss: 0.6439 - accuracy: 0.6445

  97/1563 [>.............................] - ETA: 2:45:05 - loss: 0.6425 - accuracy: 0.6450

  98/1563 [>.............................] - ETA: 2:44:55 - loss: 0.6415 - accuracy: 0.6460

  99/1563 [>.............................] - ETA: 2:44:46 - loss: 0.6409 - accuracy: 0.6465

 100/1563 [>.............................] - ETA: 2:44:38 - loss: 0.6363 - accuracy: 0.6494

 101/1563 [>.............................] - ETA: 2:44:37 - loss: 0.6343 - accuracy: 0.6510

 102/1563 [>.............................] - ETA: 2:44:28 - loss: 0.6300 - accuracy: 0.6538

 103/1563 [>.............................] - ETA: 2:44:21 - loss: 0.6273 - accuracy: 0.6559

 104/1563 [>.............................] - ETA: 2:44:12 - loss: 0.6245 - accuracy: 0.6569

 105/1563 [=>............................] - ETA: 2:44:05 - loss: 0.6233 - accuracy: 0.6583

 106/1563 [=>............................] - ETA: 2:44:06 - loss: 0.6237 - accuracy: 0.6598

 107/1563 [=>............................] - ETA: 2:43:57 - loss: 0.6203 - accuracy: 0.6618

 108/1563 [=>............................] - ETA: 2:43:49 - loss: 0.6198 - accuracy: 0.6632

 109/1563 [=>............................] - ETA: 2:43:42 - loss: 0.6196 - accuracy: 0.6623

 110/1563 [=>............................] - ETA: 2:43:36 - loss: 0.6176 - accuracy: 0.6642

 111/1563 [=>............................] - ETA: 2:43:32 - loss: 0.6178 - accuracy: 0.6644

 112/1563 [=>............................] - ETA: 2:43:24 - loss: 0.6180 - accuracy: 0.6652

 113/1563 [=>............................] - ETA: 2:43:15 - loss: 0.6145 - accuracy: 0.6670

 114/1563 [=>............................] - ETA: 2:43:08 - loss: 0.6144 - accuracy: 0.6678

 115/1563 [=>............................] - ETA: 2:43:07 - loss: 0.6113 - accuracy: 0.6701

 116/1563 [=>............................] - ETA: 2:42:59 - loss: 0.6093 - accuracy: 0.6713

 117/1563 [=>............................] - ETA: 2:42:51 - loss: 0.6078 - accuracy: 0.6725

 118/1563 [=>............................] - ETA: 2:42:42 - loss: 0.6065 - accuracy: 0.6743

 119/1563 [=>............................] - ETA: 2:42:35 - loss: 0.6047 - accuracy: 0.6754

 120/1563 [=>............................] - ETA: 2:42:34 - loss: 0.6033 - accuracy: 0.6771

 121/1563 [=>............................] - ETA: 2:42:27 - loss: 0.6039 - accuracy: 0.6777

 122/1563 [=>............................] - ETA: 2:42:19 - loss: 0.6031 - accuracy: 0.6788

 123/1563 [=>............................] - ETA: 2:42:09 - loss: 0.6033 - accuracy: 0.6794

 124/1563 [=>............................] - ETA: 2:42:02 - loss: 0.6047 - accuracy: 0.6789

 125/1563 [=>............................] - ETA: 2:42:00 - loss: 0.6024 - accuracy: 0.6810

 126/1563 [=>............................] - ETA: 2:41:51 - loss: 0.6000 - accuracy: 0.6825

 127/1563 [=>............................] - ETA: 2:41:43 - loss: 0.5980 - accuracy: 0.6841

 128/1563 [=>............................] - ETA: 2:41:34 - loss: 0.5982 - accuracy: 0.6846

 129/1563 [=>............................] - ETA: 2:41:25 - loss: 0.5984 - accuracy: 0.6846

 130/1563 [=>............................] - ETA: 2:41:24 - loss: 0.5957 - accuracy: 0.6865

 131/1563 [=>............................] - ETA: 2:41:15 - loss: 0.5923 - accuracy: 0.6889

 132/1563 [=>............................] - ETA: 2:41:06 - loss: 0.5919 - accuracy: 0.6899

 133/1563 [=>............................] - ETA: 2:41:00 - loss: 0.5912 - accuracy: 0.6898

 134/1563 [=>............................] - ETA: 2:40:53 - loss: 0.5893 - accuracy: 0.6917

 135/1563 [=>............................] - ETA: 2:40:49 - loss: 0.5892 - accuracy: 0.6926

 136/1563 [=>............................] - ETA: 2:40:40 - loss: 0.5882 - accuracy: 0.6939

 137/1563 [=>............................] - ETA: 2:40:31 - loss: 0.5864 - accuracy: 0.6953

 138/1563 [=>............................] - ETA: 2:40:22 - loss: 0.5834 - accuracy: 0.6970

 139/1563 [=>............................] - ETA: 2:40:14 - loss: 0.5824 - accuracy: 0.6978

 140/1563 [=>............................] - ETA: 2:40:11 - loss: 0.5809 - accuracy: 0.6987

 141/1563 [=>............................] - ETA: 2:40:03 - loss: 0.5800 - accuracy: 0.6995

 142/1563 [=>............................] - ETA: 2:39:55 - loss: 0.5777 - accuracy: 0.7007

 143/1563 [=>............................] - ETA: 2:39:47 - loss: 0.5769 - accuracy: 0.7019

 144/1563 [=>............................] - ETA: 2:39:39 - loss: 0.5752 - accuracy: 0.7031

 145/1563 [=>............................] - ETA: 2:39:35 - loss: 0.5735 - accuracy: 0.7043

 146/1563 [=>............................] - ETA: 2:39:25 - loss: 0.5731 - accuracy: 0.7046

 147/1563 [=>............................] - ETA: 2:39:17 - loss: 0.5731 - accuracy: 0.7049

 148/1563 [=>............................] - ETA: 2:39:09 - loss: 0.5722 - accuracy: 0.7057

 149/1563 [=>............................] - ETA: 2:39:01 - loss: 0.5705 - accuracy: 0.7068

 150/1563 [=>............................] - ETA: 2:38:57 - loss: 0.5703 - accuracy: 0.7071

 151/1563 [=>............................] - ETA: 2:38:48 - loss: 0.5688 - accuracy: 0.7078

 152/1563 [=>............................] - ETA: 2:38:38 - loss: 0.5676 - accuracy: 0.7085

 153/1563 [=>............................] - ETA: 2:38:27 - loss: 0.5662 - accuracy: 0.7092

 154/1563 [=>............................] - ETA: 2:38:18 - loss: 0.5650 - accuracy: 0.7098

 155/1563 [=>............................] - ETA: 2:38:14 - loss: 0.5626 - accuracy: 0.7117

 156/1563 [=>............................] - ETA: 2:38:04 - loss: 0.5633 - accuracy: 0.7115

 157/1563 [==>...........................] - ETA: 2:37:56 - loss: 0.5623 - accuracy: 0.7122

 158/1563 [==>...........................] - ETA: 2:37:48 - loss: 0.5609 - accuracy: 0.7128

 159/1563 [==>...........................] - ETA: 2:37:40 - loss: 0.5592 - accuracy: 0.7138

 160/1563 [==>...........................] - ETA: 2:37:36 - loss: 0.5570 - accuracy: 0.7152

 161/1563 [==>...........................] - ETA: 2:37:28 - loss: 0.5554 - accuracy: 0.7166

 162/1563 [==>...........................] - ETA: 2:37:20 - loss: 0.5534 - accuracy: 0.7176

 163/1563 [==>...........................] - ETA: 2:37:11 - loss: 0.5516 - accuracy: 0.7186

 164/1563 [==>...........................] - ETA: 2:37:04 - loss: 0.5505 - accuracy: 0.7191

 165/1563 [==>...........................] - ETA: 2:37:00 - loss: 0.5497 - accuracy: 0.7189

 166/1563 [==>...........................] - ETA: 2:36:52 - loss: 0.5519 - accuracy: 0.7184

 167/1563 [==>...........................] - ETA: 2:36:46 - loss: 0.5515 - accuracy: 0.7186

 168/1563 [==>...........................] - ETA: 2:36:37 - loss: 0.5489 - accuracy: 0.7202

 169/1563 [==>...........................] - ETA: 2:36:30 - loss: 0.5491 - accuracy: 0.7212

 170/1563 [==>...........................] - ETA: 2:36:24 - loss: 0.5485 - accuracy: 0.7217

 171/1563 [==>...........................] - ETA: 2:36:16 - loss: 0.5467 - accuracy: 0.7226

 172/1563 [==>...........................] - ETA: 2:36:08 - loss: 0.5463 - accuracy: 0.7227

 173/1563 [==>...........................] - ETA: 2:36:00 - loss: 0.5453 - accuracy: 0.7236

 174/1563 [==>...........................] - ETA: 2:35:53 - loss: 0.5457 - accuracy: 0.7231

 175/1563 [==>...........................] - ETA: 2:35:47 - loss: 0.5446 - accuracy: 0.7239

 176/1563 [==>...........................] - ETA: 2:35:40 - loss: 0.5446 - accuracy: 0.7241

 177/1563 [==>...........................] - ETA: 2:35:32 - loss: 0.5430 - accuracy: 0.7253

 178/1563 [==>...........................] - ETA: 2:35:24 - loss: 0.5417 - accuracy: 0.7261

 179/1563 [==>...........................] - ETA: 2:35:19 - loss: 0.5400 - accuracy: 0.7273

 180/1563 [==>...........................] - ETA: 2:35:11 - loss: 0.5391 - accuracy: 0.7278

 181/1563 [==>...........................] - ETA: 2:35:04 - loss: 0.5405 - accuracy: 0.7269

 182/1563 [==>...........................] - ETA: 2:34:56 - loss: 0.5385 - accuracy: 0.7280

 183/1563 [==>...........................] - ETA: 2:34:48 - loss: 0.5373 - accuracy: 0.7285

 184/1563 [==>...........................] - ETA: 2:34:43 - loss: 0.5366 - accuracy: 0.7289

 185/1563 [==>...........................] - ETA: 2:34:36 - loss: 0.5361 - accuracy: 0.7287

 186/1563 [==>...........................] - ETA: 2:34:28 - loss: 0.5343 - accuracy: 0.7298

 187/1563 [==>...........................] - ETA: 2:34:20 - loss: 0.5330 - accuracy: 0.7306

 188/1563 [==>...........................] - ETA: 2:34:13 - loss: 0.5331 - accuracy: 0.7311

 189/1563 [==>...........................] - ETA: 2:34:09 - loss: 0.5341 - accuracy: 0.7308

 190/1563 [==>...........................] - ETA: 2:34:01 - loss: 0.5334 - accuracy: 0.7312

 191/1563 [==>...........................] - ETA: 2:33:53 - loss: 0.5333 - accuracy: 0.7313

 192/1563 [==>...........................] - ETA: 2:33:44 - loss: 0.5344 - accuracy: 0.7311

 193/1563 [==>...........................] - ETA: 2:33:37 - loss: 0.5350 - accuracy: 0.7312

 194/1563 [==>...........................] - ETA: 2:33:32 - loss: 0.5335 - accuracy: 0.7323

 195/1563 [==>...........................] - ETA: 2:33:24 - loss: 0.5327 - accuracy: 0.7324

 196/1563 [==>...........................] - ETA: 2:33:16 - loss: 0.5324 - accuracy: 0.7331

 197/1563 [==>...........................] - ETA: 2:33:09 - loss: 0.5324 - accuracy: 0.7329

 198/1563 [==>...........................] - ETA: 2:33:00 - loss: 0.5324 - accuracy: 0.7330

 199/1563 [==>...........................] - ETA: 2:32:56 - loss: 0.5329 - accuracy: 0.7327

 200/1563 [==>...........................] - ETA: 2:32:48 - loss: 0.5327 - accuracy: 0.7331

 201/1563 [==>...........................] - ETA: 2:32:40 - loss: 0.5312 - accuracy: 0.7341

 202/1563 [==>...........................] - ETA: 2:32:32 - loss: 0.5306 - accuracy: 0.7348

 203/1563 [==>...........................] - ETA: 2:32:24 - loss: 0.5298 - accuracy: 0.7352

 204/1563 [==>...........................] - ETA: 2:32:20 - loss: 0.5292 - accuracy: 0.7359

 205/1563 [==>...........................] - ETA: 2:32:13 - loss: 0.5292 - accuracy: 0.7363

 206/1563 [==>...........................] - ETA: 2:32:05 - loss: 0.5292 - accuracy: 0.7367

 207/1563 [==>...........................] - ETA: 2:31:57 - loss: 0.5280 - accuracy: 0.7373

 208/1563 [==>...........................] - ETA: 2:31:49 - loss: 0.5266 - accuracy: 0.7383

 209/1563 [===>..........................] - ETA: 2:31:45 - loss: 0.5254 - accuracy: 0.7386

 210/1563 [===>..........................] - ETA: 2:31:37 - loss: 0.5257 - accuracy: 0.7384

 211/1563 [===>..........................] - ETA: 2:31:29 - loss: 0.5248 - accuracy: 0.7390

 212/1563 [===>..........................] - ETA: 2:31:22 - loss: 0.5234 - accuracy: 0.7400

 213/1563 [===>..........................] - ETA: 2:31:14 - loss: 0.5234 - accuracy: 0.7400

 214/1563 [===>..........................] - ETA: 2:31:09 - loss: 0.5220 - accuracy: 0.7407

 215/1563 [===>..........................] - ETA: 2:31:02 - loss: 0.5207 - accuracy: 0.7416

 216/1563 [===>..........................] - ETA: 2:30:54 - loss: 0.5226 - accuracy: 0.7407

 217/1563 [===>..........................] - ETA: 2:30:46 - loss: 0.5238 - accuracy: 0.7402

 218/1563 [===>..........................] - ETA: 2:30:38 - loss: 0.5236 - accuracy: 0.7403

 219/1563 [===>..........................] - ETA: 2:30:33 - loss: 0.5228 - accuracy: 0.7403

 220/1563 [===>..........................] - ETA: 2:30:25 - loss: 0.5218 - accuracy: 0.7409

 221/1563 [===>..........................] - ETA: 2:30:18 - loss: 0.5203 - accuracy: 0.7421

 222/1563 [===>..........................] - ETA: 2:30:10 - loss: 0.5189 - accuracy: 0.7427

 223/1563 [===>..........................] - ETA: 2:30:03 - loss: 0.5179 - accuracy: 0.7430

 224/1563 [===>..........................] - ETA: 2:29:58 - loss: 0.5167 - accuracy: 0.7439

 225/1563 [===>..........................] - ETA: 2:29:50 - loss: 0.5156 - accuracy: 0.7442

 226/1563 [===>..........................] - ETA: 2:29:43 - loss: 0.5147 - accuracy: 0.7445

 227/1563 [===>..........................] - ETA: 2:29:36 - loss: 0.5130 - accuracy: 0.7456

 228/1563 [===>..........................] - ETA: 2:29:29 - loss: 0.5123 - accuracy: 0.7462

 229/1563 [===>..........................] - ETA: 2:29:24 - loss: 0.5107 - accuracy: 0.7470

 230/1563 [===>..........................] - ETA: 2:29:17 - loss: 0.5116 - accuracy: 0.7470

 231/1563 [===>..........................] - ETA: 2:29:09 - loss: 0.5104 - accuracy: 0.7476

 232/1563 [===>..........................] - ETA: 2:29:02 - loss: 0.5092 - accuracy: 0.7484

 233/1563 [===>..........................] - ETA: 2:28:55 - loss: 0.5095 - accuracy: 0.7487

 234/1563 [===>..........................] - ETA: 2:28:49 - loss: 0.5085 - accuracy: 0.7492

 235/1563 [===>..........................] - ETA: 2:28:41 - loss: 0.5072 - accuracy: 0.7500

 236/1563 [===>..........................] - ETA: 2:28:35 - loss: 0.5057 - accuracy: 0.7508

 237/1563 [===>..........................] - ETA: 2:28:28 - loss: 0.5047 - accuracy: 0.7513

 238/1563 [===>..........................] - ETA: 2:28:23 - loss: 0.5053 - accuracy: 0.7513

 239/1563 [===>..........................] - ETA: 2:28:19 - loss: 0.5040 - accuracy: 0.7521

 240/1563 [===>..........................] - ETA: 2:28:13 - loss: 0.5031 - accuracy: 0.7529

 241/1563 [===>..........................] - ETA: 2:28:06 - loss: 0.5023 - accuracy: 0.7531

 242/1563 [===>..........................] - ETA: 2:28:00 - loss: 0.5013 - accuracy: 0.7536

 243/1563 [===>..........................] - ETA: 2:27:54 - loss: 0.5007 - accuracy: 0.7541

 244/1563 [===>..........................] - ETA: 2:27:48 - loss: 0.5008 - accuracy: 0.7536

 245/1563 [===>..........................] - ETA: 2:27:41 - loss: 0.4996 - accuracy: 0.7543

 246/1563 [===>..........................] - ETA: 2:27:34 - loss: 0.5000 - accuracy: 0.7543

 247/1563 [===>..........................] - ETA: 2:27:27 - loss: 0.4984 - accuracy: 0.7551

 248/1563 [===>..........................] - ETA: 2:27:23 - loss: 0.4980 - accuracy: 0.7555

 249/1563 [===>..........................] - ETA: 2:27:18 - loss: 0.4969 - accuracy: 0.7563

 250/1563 [===>..........................] - ETA: 2:27:11 - loss: 0.4958 - accuracy: 0.7570

 251/1563 [===>..........................] - ETA: 2:27:05 - loss: 0.4944 - accuracy: 0.7575

 252/1563 [===>..........................] - ETA: 2:26:58 - loss: 0.4938 - accuracy: 0.7579

 253/1563 [===>..........................] - ETA: 2:26:55 - loss: 0.4943 - accuracy: 0.7579

 254/1563 [===>..........................] - ETA: 2:26:48 - loss: 0.4930 - accuracy: 0.7586

 255/1563 [===>..........................] - ETA: 2:26:42 - loss: 0.4924 - accuracy: 0.7593

 256/1563 [===>..........................] - ETA: 2:26:35 - loss: 0.4922 - accuracy: 0.7593

 257/1563 [===>..........................] - ETA: 2:26:28 - loss: 0.4921 - accuracy: 0.7590

 258/1563 [===>..........................] - ETA: 2:26:24 - loss: 0.4911 - accuracy: 0.7594

 259/1563 [===>..........................] - ETA: 2:26:16 - loss: 0.4913 - accuracy: 0.7592

 260/1563 [===>..........................] - ETA: 2:26:08 - loss: 0.4906 - accuracy: 0.7594

 261/1563 [====>.........................] - ETA: 2:26:01 - loss: 0.4902 - accuracy: 0.7593

 262/1563 [====>.........................] - ETA: 2:25:53 - loss: 0.4892 - accuracy: 0.7595

 263/1563 [====>.........................] - ETA: 2:25:47 - loss: 0.4893 - accuracy: 0.7593

 264/1563 [====>.........................] - ETA: 2:25:40 - loss: 0.4890 - accuracy: 0.7592

 265/1563 [====>.........................] - ETA: 2:25:32 - loss: 0.4890 - accuracy: 0.7594

 266/1563 [====>.........................] - ETA: 2:25:24 - loss: 0.4889 - accuracy: 0.7594

 267/1563 [====>.........................] - ETA: 2:25:17 - loss: 0.4883 - accuracy: 0.7598

 268/1563 [====>.........................] - ETA: 2:25:11 - loss: 0.4872 - accuracy: 0.7603

 269/1563 [====>.........................] - ETA: 2:25:03 - loss: 0.4873 - accuracy: 0.7602

 270/1563 [====>.........................] - ETA: 2:24:55 - loss: 0.4871 - accuracy: 0.7600

 271/1563 [====>.........................] - ETA: 2:24:47 - loss: 0.4868 - accuracy: 0.7599

 272/1563 [====>.........................] - ETA: 2:24:39 - loss: 0.4873 - accuracy: 0.7601

 273/1563 [====>.........................] - ETA: 2:24:34 - loss: 0.4866 - accuracy: 0.7603

 274/1563 [====>.........................] - ETA: 2:24:25 - loss: 0.4862 - accuracy: 0.7607

 275/1563 [====>.........................] - ETA: 2:24:17 - loss: 0.4858 - accuracy: 0.7609

 276/1563 [====>.........................] - ETA: 2:24:09 - loss: 0.4857 - accuracy: 0.7611

 277/1563 [====>.........................] - ETA: 2:24:01 - loss: 0.4846 - accuracy: 0.7620

 278/1563 [====>.........................] - ETA: 2:23:55 - loss: 0.4836 - accuracy: 0.7626

 279/1563 [====>.........................] - ETA: 2:23:46 - loss: 0.4828 - accuracy: 0.7632

 280/1563 [====>.........................] - ETA: 2:23:38 - loss: 0.4825 - accuracy: 0.7634

 281/1563 [====>.........................] - ETA: 2:23:29 - loss: 0.4821 - accuracy: 0.7638

 282/1563 [====>.........................] - ETA: 2:23:21 - loss: 0.4813 - accuracy: 0.7642

 283/1563 [====>.........................] - ETA: 2:23:15 - loss: 0.4808 - accuracy: 0.7646

 284/1563 [====>.........................] - ETA: 2:23:06 - loss: 0.4809 - accuracy: 0.7645

 285/1563 [====>.........................] - ETA: 2:22:58 - loss: 0.4805 - accuracy: 0.7649

 286/1563 [====>.........................] - ETA: 2:22:50 - loss: 0.4811 - accuracy: 0.7644

 287/1563 [====>.........................] - ETA: 2:22:42 - loss: 0.4812 - accuracy: 0.7648

 288/1563 [====>.........................] - ETA: 2:22:36 - loss: 0.4811 - accuracy: 0.7645

 289/1563 [====>.........................] - ETA: 2:22:28 - loss: 0.4807 - accuracy: 0.7647

 290/1563 [====>.........................] - ETA: 2:22:20 - loss: 0.4811 - accuracy: 0.7647

 291/1563 [====>.........................] - ETA: 2:22:12 - loss: 0.4801 - accuracy: 0.7652

 292/1563 [====>.........................] - ETA: 2:22:03 - loss: 0.4798 - accuracy: 0.7654

 293/1563 [====>.........................] - ETA: 2:21:57 - loss: 0.4791 - accuracy: 0.7658

 294/1563 [====>.........................] - ETA: 2:21:49 - loss: 0.4788 - accuracy: 0.7662

 295/1563 [====>.........................] - ETA: 2:21:41 - loss: 0.4775 - accuracy: 0.7669

 296/1563 [====>.........................] - ETA: 2:21:33 - loss: 0.4770 - accuracy: 0.7671

 297/1563 [====>.........................] - ETA: 2:21:25 - loss: 0.4774 - accuracy: 0.7668

 298/1563 [====>.........................] - ETA: 2:21:19 - loss: 0.4771 - accuracy: 0.7670

 299/1563 [====>.........................] - ETA: 2:21:11 - loss: 0.4775 - accuracy: 0.7669

 300/1563 [====>.........................] - ETA: 2:21:03 - loss: 0.4769 - accuracy: 0.7673

 301/1563 [====>.........................] - ETA: 2:20:55 - loss: 0.4765 - accuracy: 0.7676

 302/1563 [====>.........................] - ETA: 2:20:47 - loss: 0.4751 - accuracy: 0.7684

 303/1563 [====>.........................] - ETA: 2:20:41 - loss: 0.4748 - accuracy: 0.7684

 304/1563 [====>.........................] - ETA: 2:20:33 - loss: 0.4741 - accuracy: 0.7685

 305/1563 [====>.........................] - ETA: 2:20:24 - loss: 0.4741 - accuracy: 0.7684

 306/1563 [====>.........................] - ETA: 2:20:17 - loss: 0.4736 - accuracy: 0.7686

 307/1563 [====>.........................] - ETA: 2:20:08 - loss: 0.4737 - accuracy: 0.7687

 308/1563 [====>.........................] - ETA: 2:20:02 - loss: 0.4737 - accuracy: 0.7691

 309/1563 [====>.........................] - ETA: 2:19:54 - loss: 0.4733 - accuracy: 0.7694

 310/1563 [====>.........................] - ETA: 2:19:46 - loss: 0.4738 - accuracy: 0.7688

 311/1563 [====>.........................] - ETA: 2:19:38 - loss: 0.4737 - accuracy: 0.7687

 312/1563 [====>.........................] - ETA: 2:19:30 - loss: 0.4728 - accuracy: 0.7692

 313/1563 [=====>........................] - ETA: 2:19:24 - loss: 0.4729 - accuracy: 0.7694

 314/1563 [=====>........................] - ETA: 2:19:17 - loss: 0.4727 - accuracy: 0.7695

 315/1563 [=====>........................] - ETA: 2:19:09 - loss: 0.4726 - accuracy: 0.7694

 316/1563 [=====>........................] - ETA: 2:19:01 - loss: 0.4722 - accuracy: 0.7698

 317/1563 [=====>........................] - ETA: 2:18:53 - loss: 0.4710 - accuracy: 0.7705

 318/1563 [=====>........................] - ETA: 2:18:46 - loss: 0.4709 - accuracy: 0.7706

 319/1563 [=====>........................] - ETA: 2:18:39 - loss: 0.4707 - accuracy: 0.7710

 320/1563 [=====>........................] - ETA: 2:18:31 - loss: 0.4710 - accuracy: 0.7711

 321/1563 [=====>........................] - ETA: 2:18:24 - loss: 0.4713 - accuracy: 0.7712

 322/1563 [=====>........................] - ETA: 2:18:16 - loss: 0.4707 - accuracy: 0.7712

 323/1563 [=====>........................] - ETA: 2:18:10 - loss: 0.4710 - accuracy: 0.7707

 324/1563 [=====>........................] - ETA: 2:18:03 - loss: 0.4704 - accuracy: 0.7710

 325/1563 [=====>........................] - ETA: 2:17:55 - loss: 0.4707 - accuracy: 0.7708

 326/1563 [=====>........................] - ETA: 2:17:47 - loss: 0.4700 - accuracy: 0.7713

 327/1563 [=====>........................] - ETA: 2:17:40 - loss: 0.4695 - accuracy: 0.7716

 328/1563 [=====>........................] - ETA: 2:17:32 - loss: 0.4688 - accuracy: 0.7721

 329/1563 [=====>........................] - ETA: 2:17:25 - loss: 0.4688 - accuracy: 0.7720

 330/1563 [=====>........................] - ETA: 2:17:18 - loss: 0.4685 - accuracy: 0.7720

 331/1563 [=====>........................] - ETA: 2:17:09 - loss: 0.4681 - accuracy: 0.7723

 332/1563 [=====>........................] - ETA: 2:17:02 - loss: 0.4672 - accuracy: 0.7728

 333/1563 [=====>........................] - ETA: 2:16:54 - loss: 0.4665 - accuracy: 0.7731

 334/1563 [=====>........................] - ETA: 2:16:48 - loss: 0.4661 - accuracy: 0.7734

 335/1563 [=====>........................] - ETA: 2:16:40 - loss: 0.4660 - accuracy: 0.7733

 336/1563 [=====>........................] - ETA: 2:16:32 - loss: 0.4657 - accuracy: 0.7733

 337/1563 [=====>........................] - ETA: 2:16:24 - loss: 0.4656 - accuracy: 0.7732

 338/1563 [=====>........................] - ETA: 2:16:17 - loss: 0.4649 - accuracy: 0.7737

 339/1563 [=====>........................] - ETA: 2:16:10 - loss: 0.4640 - accuracy: 0.7743

 340/1563 [=====>........................] - ETA: 2:16:03 - loss: 0.4640 - accuracy: 0.7741

 341/1563 [=====>........................] - ETA: 2:15:55 - loss: 0.4634 - accuracy: 0.7746

 342/1563 [=====>........................] - ETA: 2:15:48 - loss: 0.4630 - accuracy: 0.7749

 343/1563 [=====>........................] - ETA: 2:15:40 - loss: 0.4628 - accuracy: 0.7748

 344/1563 [=====>........................] - ETA: 2:15:34 - loss: 0.4622 - accuracy: 0.7751

 345/1563 [=====>........................] - ETA: 2:15:26 - loss: 0.4612 - accuracy: 0.7757

 346/1563 [=====>........................] - ETA: 2:15:18 - loss: 0.4612 - accuracy: 0.7760

 347/1563 [=====>........................] - ETA: 2:15:11 - loss: 0.4609 - accuracy: 0.7763

 348/1563 [=====>........................] - ETA: 2:15:03 - loss: 0.4598 - accuracy: 0.7769

 349/1563 [=====>........................] - ETA: 2:14:57 - loss: 0.4593 - accuracy: 0.7769

 350/1563 [=====>........................] - ETA: 2:14:50 - loss: 0.4590 - accuracy: 0.7770

 351/1563 [=====>........................] - ETA: 2:14:42 - loss: 0.4592 - accuracy: 0.7767

 352/1563 [=====>........................] - ETA: 2:14:34 - loss: 0.4585 - accuracy: 0.7770

 353/1563 [=====>........................] - ETA: 2:14:26 - loss: 0.4581 - accuracy: 0.7771

 354/1563 [=====>........................] - ETA: 2:14:21 - loss: 0.4573 - accuracy: 0.7775

 355/1563 [=====>........................] - ETA: 2:14:13 - loss: 0.4566 - accuracy: 0.7778

 356/1563 [=====>........................] - ETA: 2:14:05 - loss: 0.4570 - accuracy: 0.7776

 357/1563 [=====>........................] - ETA: 2:13:58 - loss: 0.4572 - accuracy: 0.7775

 358/1563 [=====>........................] - ETA: 2:13:50 - loss: 0.4571 - accuracy: 0.7776

 359/1563 [=====>........................] - ETA: 2:13:44 - loss: 0.4564 - accuracy: 0.7777

 360/1563 [=====>........................] - ETA: 2:13:37 - loss: 0.4565 - accuracy: 0.7778

 361/1563 [=====>........................] - ETA: 2:13:29 - loss: 0.4560 - accuracy: 0.7782

 362/1563 [=====>........................] - ETA: 2:13:21 - loss: 0.4557 - accuracy: 0.7783

 363/1563 [=====>........................] - ETA: 2:13:14 - loss: 0.4558 - accuracy: 0.7784

 364/1563 [=====>........................] - ETA: 2:13:08 - loss: 0.4551 - accuracy: 0.7787

































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































Epoch 2/3


   1/1563 [..............................] - ETA: 3:06:27 - loss: 0.0853 - accuracy: 0.9375

   2/1563 [..............................] - ETA: 2:50:55 - loss: 0.1032 - accuracy: 0.9688

   3/1563 [..............................] - ETA: 2:52:41 - loss: 0.2177 - accuracy: 0.9167

   4/1563 [..............................] - ETA: 2:52:12 - loss: 0.2515 - accuracy: 0.9062

   5/1563 [..............................] - ETA: 2:52:48 - loss: 0.2275 - accuracy: 0.9125

   6/1563 [..............................] - ETA: 2:54:29 - loss: 0.2170 - accuracy: 0.9167

   7/1563 [..............................] - ETA: 2:53:57 - loss: 0.2015 - accuracy: 0.9286

   8/1563 [..............................] - ETA: 2:53:16 - loss: 0.1924 - accuracy: 0.9375

   9/1563 [..............................] - ETA: 2:53:17 - loss: 0.1755 - accuracy: 0.9444

  10/1563 [..............................] - ETA: 2:53:59 - loss: 0.1658 - accuracy: 0.9500

  11/1563 [..............................] - ETA: 2:53:49 - loss: 0.1603 - accuracy: 0.9545

  12/1563 [..............................] - ETA: 2:53:33 - loss: 0.1736 - accuracy: 0.9531

  13/1563 [..............................] - ETA: 2:53:17 - loss: 0.1773 - accuracy: 0.9423

  14/1563 [..............................] - ETA: 2:52:51 - loss: 0.1937 - accuracy: 0.9420

  15/1563 [..............................] - ETA: 2:53:36 - loss: 0.1897 - accuracy: 0.9417

  16/1563 [..............................] - ETA: 2:53:29 - loss: 0.2024 - accuracy: 0.9336

  17/1563 [..............................] - ETA: 2:53:17 - loss: 0.2007 - accuracy: 0.9338

  18/1563 [..............................] - ETA: 2:52:56 - loss: 0.1931 - accuracy: 0.9375

  19/1563 [..............................] - ETA: 2:52:39 - loss: 0.1872 - accuracy: 0.9408

  20/1563 [..............................] - ETA: 2:53:04 - loss: 0.1997 - accuracy: 0.9344

  21/1563 [..............................] - ETA: 2:52:46 - loss: 0.1987 - accuracy: 0.9345

  22/1563 [..............................] - ETA: 2:52:33 - loss: 0.1917 - accuracy: 0.9375

  23/1563 [..............................] - ETA: 2:52:19 - loss: 0.1933 - accuracy: 0.9348

  24/1563 [..............................] - ETA: 2:52:03 - loss: 0.1887 - accuracy: 0.9375

  25/1563 [..............................] - ETA: 2:52:29 - loss: 0.1878 - accuracy: 0.9375

  26/1563 [..............................] - ETA: 2:52:19 - loss: 0.1912 - accuracy: 0.9351

  27/1563 [..............................] - ETA: 2:52:03 - loss: 0.1873 - accuracy: 0.9352

  28/1563 [..............................] - ETA: 2:51:58 - loss: 0.1918 - accuracy: 0.9330

  29/1563 [..............................] - ETA: 2:51:49 - loss: 0.1865 - accuracy: 0.9353

  30/1563 [..............................] - ETA: 2:52:04 - loss: 0.1838 - accuracy: 0.9375

  31/1563 [..............................] - ETA: 2:51:56 - loss: 0.1804 - accuracy: 0.9395

  32/1563 [..............................] - ETA: 2:51:49 - loss: 0.1848 - accuracy: 0.9375

  33/1563 [..............................] - ETA: 2:51:38 - loss: 0.1864 - accuracy: 0.9375

  34/1563 [..............................] - ETA: 2:51:27 - loss: 0.1881 - accuracy: 0.9357

  35/1563 [..............................] - ETA: 2:51:44 - loss: 0.1880 - accuracy: 0.9357

  36/1563 [..............................] - ETA: 2:51:31 - loss: 0.1917 - accuracy: 0.9340

  37/1563 [..............................] - ETA: 2:51:21 - loss: 0.1886 - accuracy: 0.9341

  38/1563 [..............................] - ETA: 2:51:09 - loss: 0.1884 - accuracy: 0.9342

  39/1563 [..............................] - ETA: 2:51:00 - loss: 0.1889 - accuracy: 0.9343

  40/1563 [..............................] - ETA: 2:51:03 - loss: 0.1893 - accuracy: 0.9344

  41/1563 [..............................] - ETA: 2:50:56 - loss: 0.1866 - accuracy: 0.9360

  42/1563 [..............................] - ETA: 2:50:44 - loss: 0.1831 - accuracy: 0.9375

  43/1563 [..............................] - ETA: 2:50:33 - loss: 0.1802 - accuracy: 0.9390

  44/1563 [..............................] - ETA: 2:50:37 - loss: 0.1771 - accuracy: 0.9403

  45/1563 [..............................] - ETA: 2:50:28 - loss: 0.1809 - accuracy: 0.9389

  46/1563 [..............................] - ETA: 2:50:18 - loss: 0.1835 - accuracy: 0.9389

  47/1563 [..............................] - ETA: 2:50:10 - loss: 0.1815 - accuracy: 0.9388

  48/1563 [..............................] - ETA: 2:49:59 - loss: 0.1803 - accuracy: 0.9388

  49/1563 [..............................] - ETA: 2:50:08 - loss: 0.1847 - accuracy: 0.9375

  50/1563 [..............................] - ETA: 2:49:59 - loss: 0.1816 - accuracy: 0.9388

  51/1563 [..............................] - ETA: 2:49:49 - loss: 0.1804 - accuracy: 0.9387

  52/1563 [..............................] - ETA: 2:49:39 - loss: 0.1797 - accuracy: 0.9387

  53/1563 [>.............................] - ETA: 2:49:27 - loss: 0.1798 - accuracy: 0.9387

  54/1563 [>.............................] - ETA: 2:49:31 - loss: 0.1837 - accuracy: 0.9387

  55/1563 [>.............................] - ETA: 2:49:19 - loss: 0.1837 - accuracy: 0.9375

  56/1563 [>.............................] - ETA: 2:49:09 - loss: 0.1871 - accuracy: 0.9364

  57/1563 [>.............................] - ETA: 2:49:00 - loss: 0.1849 - accuracy: 0.9375

  58/1563 [>.............................] - ETA: 2:48:49 - loss: 0.1831 - accuracy: 0.9386

  59/1563 [>.............................] - ETA: 2:48:52 - loss: 0.1846 - accuracy: 0.9375

  60/1563 [>.............................] - ETA: 2:48:39 - loss: 0.1857 - accuracy: 0.9375

  61/1563 [>.............................] - ETA: 2:48:30 - loss: 0.1828 - accuracy: 0.9385

  62/1563 [>.............................] - ETA: 2:48:20 - loss: 0.1890 - accuracy: 0.9365

  63/1563 [>.............................] - ETA: 2:48:09 - loss: 0.1912 - accuracy: 0.9355

  64/1563 [>.............................] - ETA: 2:48:12 - loss: 0.1940 - accuracy: 0.9336

  65/1563 [>.............................] - ETA: 2:48:03 - loss: 0.1953 - accuracy: 0.9317

  66/1563 [>.............................] - ETA: 2:47:56 - loss: 0.1942 - accuracy: 0.9318

  67/1563 [>.............................] - ETA: 2:47:45 - loss: 0.1925 - accuracy: 0.9319

  68/1563 [>.............................] - ETA: 2:47:35 - loss: 0.1915 - accuracy: 0.9320

  69/1563 [>.............................] - ETA: 2:47:37 - loss: 0.1907 - accuracy: 0.9330

  70/1563 [>.............................] - ETA: 2:47:26 - loss: 0.1925 - accuracy: 0.9321

  71/1563 [>.............................] - ETA: 2:47:18 - loss: 0.1956 - accuracy: 0.9305

  72/1563 [>.............................] - ETA: 2:47:07 - loss: 0.1972 - accuracy: 0.9297

  73/1563 [>.............................] - ETA: 2:46:58 - loss: 0.1969 - accuracy: 0.9298

  74/1563 [>.............................] - ETA: 2:46:58 - loss: 0.1961 - accuracy: 0.9299

  75/1563 [>.............................] - ETA: 2:46:49 - loss: 0.1952 - accuracy: 0.9300

  76/1563 [>.............................] - ETA: 2:46:39 - loss: 0.1945 - accuracy: 0.9293

  77/1563 [>.............................] - ETA: 2:46:29 - loss: 0.1950 - accuracy: 0.9286

  78/1563 [>.............................] - ETA: 2:46:22 - loss: 0.1947 - accuracy: 0.9279

  79/1563 [>.............................] - ETA: 2:46:22 - loss: 0.1940 - accuracy: 0.9272

  80/1563 [>.............................] - ETA: 2:46:13 - loss: 0.1933 - accuracy: 0.9273

  81/1563 [>.............................] - ETA: 2:46:07 - loss: 0.1927 - accuracy: 0.9267

  82/1563 [>.............................] - ETA: 2:45:57 - loss: 0.1930 - accuracy: 0.9268

  83/1563 [>.............................] - ETA: 2:45:54 - loss: 0.1934 - accuracy: 0.9270

  84/1563 [>.............................] - ETA: 2:45:48 - loss: 0.1919 - accuracy: 0.9278

  85/1563 [>.............................] - ETA: 2:45:39 - loss: 0.1902 - accuracy: 0.9287

  86/1563 [>.............................] - ETA: 2:45:31 - loss: 0.1911 - accuracy: 0.9281

  87/1563 [>.............................] - ETA: 2:45:23 - loss: 0.1898 - accuracy: 0.9289

  88/1563 [>.............................] - ETA: 2:45:22 - loss: 0.1890 - accuracy: 0.9297

  89/1563 [>.............................] - ETA: 2:45:13 - loss: 0.1874 - accuracy: 0.9305

  90/1563 [>.............................] - ETA: 2:45:04 - loss: 0.1874 - accuracy: 0.9299

  91/1563 [>.............................] - ETA: 2:44:55 - loss: 0.1863 - accuracy: 0.9306

  92/1563 [>.............................] - ETA: 2:44:47 - loss: 0.1859 - accuracy: 0.9307

  93/1563 [>.............................] - ETA: 2:44:47 - loss: 0.1863 - accuracy: 0.9301

  94/1563 [>.............................] - ETA: 2:44:37 - loss: 0.1863 - accuracy: 0.9295

  95/1563 [>.............................] - ETA: 2:44:28 - loss: 0.1861 - accuracy: 0.9289

  96/1563 [>.............................] - ETA: 2:44:22 - loss: 0.1850 - accuracy: 0.9297

  97/1563 [>.............................] - ETA: 2:44:14 - loss: 0.1832 - accuracy: 0.9304

  98/1563 [>.............................] - ETA: 2:44:14 - loss: 0.1827 - accuracy: 0.9305

  99/1563 [>.............................] - ETA: 2:44:05 - loss: 0.1838 - accuracy: 0.9299

 100/1563 [>.............................] - ETA: 2:43:55 - loss: 0.1835 - accuracy: 0.9300

 101/1563 [>.............................] - ETA: 2:43:47 - loss: 0.1830 - accuracy: 0.9301

 102/1563 [>.............................] - ETA: 2:43:39 - loss: 0.1829 - accuracy: 0.9295

 103/1563 [>.............................] - ETA: 2:43:37 - loss: 0.1836 - accuracy: 0.9284

 104/1563 [>.............................] - ETA: 2:43:28 - loss: 0.1834 - accuracy: 0.9285

 105/1563 [=>............................] - ETA: 2:43:20 - loss: 0.1843 - accuracy: 0.9280

 106/1563 [=>............................] - ETA: 2:43:12 - loss: 0.1849 - accuracy: 0.9275

 107/1563 [=>............................] - ETA: 2:43:03 - loss: 0.1841 - accuracy: 0.9276

 108/1563 [=>............................] - ETA: 2:43:01 - loss: 0.1841 - accuracy: 0.9277

 109/1563 [=>............................] - ETA: 2:42:52 - loss: 0.1828 - accuracy: 0.9283

 110/1563 [=>............................] - ETA: 2:42:43 - loss: 0.1865 - accuracy: 0.9278

 111/1563 [=>............................] - ETA: 2:42:35 - loss: 0.1868 - accuracy: 0.9274

 112/1563 [=>............................] - ETA: 2:42:27 - loss: 0.1858 - accuracy: 0.9275

 113/1563 [=>............................] - ETA: 2:42:25 - loss: 0.1849 - accuracy: 0.9281

 114/1563 [=>............................] - ETA: 2:42:17 - loss: 0.1875 - accuracy: 0.9276

 115/1563 [=>............................] - ETA: 2:42:08 - loss: 0.1872 - accuracy: 0.9277

 116/1563 [=>............................] - ETA: 2:42:01 - loss: 0.1864 - accuracy: 0.9278

 117/1563 [=>............................] - ETA: 2:41:52 - loss: 0.1868 - accuracy: 0.9268

 118/1563 [=>............................] - ETA: 2:41:51 - loss: 0.1890 - accuracy: 0.9258

 119/1563 [=>............................] - ETA: 2:41:44 - loss: 0.1925 - accuracy: 0.9249

 120/1563 [=>............................] - ETA: 2:41:36 - loss: 0.1937 - accuracy: 0.9240

 121/1563 [=>............................] - ETA: 2:41:28 - loss: 0.1928 - accuracy: 0.9246

 122/1563 [=>............................] - ETA: 2:41:20 - loss: 0.1924 - accuracy: 0.9247

 123/1563 [=>............................] - ETA: 2:41:18 - loss: 0.1921 - accuracy: 0.9248

 124/1563 [=>............................] - ETA: 2:41:11 - loss: 0.1921 - accuracy: 0.9249

 125/1563 [=>............................] - ETA: 2:41:03 - loss: 0.1912 - accuracy: 0.9255

 126/1563 [=>............................] - ETA: 2:40:54 - loss: 0.1910 - accuracy: 0.9256

 127/1563 [=>............................] - ETA: 2:40:48 - loss: 0.1903 - accuracy: 0.9262

 128/1563 [=>............................] - ETA: 2:40:43 - loss: 0.1892 - accuracy: 0.9268

 129/1563 [=>............................] - ETA: 2:40:36 - loss: 0.1912 - accuracy: 0.9264

 130/1563 [=>............................] - ETA: 2:40:28 - loss: 0.1904 - accuracy: 0.9269

 131/1563 [=>............................] - ETA: 2:40:20 - loss: 0.1933 - accuracy: 0.9251

 132/1563 [=>............................] - ETA: 2:40:17 - loss: 0.1930 - accuracy: 0.9247

 133/1563 [=>............................] - ETA: 2:40:08 - loss: 0.1922 - accuracy: 0.9253

 134/1563 [=>............................] - ETA: 2:40:01 - loss: 0.1914 - accuracy: 0.9258

 135/1563 [=>............................] - ETA: 2:39:56 - loss: 0.1912 - accuracy: 0.9259

 136/1563 [=>............................] - ETA: 2:39:49 - loss: 0.1913 - accuracy: 0.9260

 137/1563 [=>............................] - ETA: 2:39:49 - loss: 0.1916 - accuracy: 0.9261

 138/1563 [=>............................] - ETA: 2:39:44 - loss: 0.1914 - accuracy: 0.9262

 139/1563 [=>............................] - ETA: 2:39:37 - loss: 0.1916 - accuracy: 0.9263

 140/1563 [=>............................] - ETA: 2:39:30 - loss: 0.1905 - accuracy: 0.9268

 141/1563 [=>............................] - ETA: 2:39:23 - loss: 0.1897 - accuracy: 0.9273

 142/1563 [=>............................] - ETA: 2:39:23 - loss: 0.1929 - accuracy: 0.9269

 143/1563 [=>............................] - ETA: 2:39:17 - loss: 0.1929 - accuracy: 0.9270

 144/1563 [=>............................] - ETA: 2:39:11 - loss: 0.1930 - accuracy: 0.9271

 145/1563 [=>............................] - ETA: 2:39:05 - loss: 0.1921 - accuracy: 0.9276

 146/1563 [=>............................] - ETA: 2:38:59 - loss: 0.1916 - accuracy: 0.9277

 147/1563 [=>............................] - ETA: 2:38:58 - loss: 0.1907 - accuracy: 0.9281

 148/1563 [=>............................] - ETA: 2:38:52 - loss: 0.1896 - accuracy: 0.9286

 149/1563 [=>............................] - ETA: 2:38:44 - loss: 0.1896 - accuracy: 0.9283

 150/1563 [=>............................] - ETA: 2:38:37 - loss: 0.1903 - accuracy: 0.9279

 151/1563 [=>............................] - ETA: 2:38:33 - loss: 0.1897 - accuracy: 0.9284

 152/1563 [=>............................] - ETA: 2:38:27 - loss: 0.1892 - accuracy: 0.9289

 153/1563 [=>............................] - ETA: 2:38:19 - loss: 0.1882 - accuracy: 0.9293

 154/1563 [=>............................] - ETA: 2:38:11 - loss: 0.1918 - accuracy: 0.9286

 155/1563 [=>............................] - ETA: 2:38:03 - loss: 0.1930 - accuracy: 0.9278

 156/1563 [=>............................] - ETA: 2:38:00 - loss: 0.1945 - accuracy: 0.9275

 157/1563 [==>...........................] - ETA: 2:37:53 - loss: 0.1963 - accuracy: 0.9268

 158/1563 [==>...........................] - ETA: 2:37:45 - loss: 0.1968 - accuracy: 0.9264

 159/1563 [==>...........................] - ETA: 2:37:37 - loss: 0.1976 - accuracy: 0.9265

 160/1563 [==>...........................] - ETA: 2:37:30 - loss: 0.1989 - accuracy: 0.9258

 161/1563 [==>...........................] - ETA: 2:37:27 - loss: 0.1982 - accuracy: 0.9259

 162/1563 [==>...........................] - ETA: 2:37:19 - loss: 0.1983 - accuracy: 0.9259

 163/1563 [==>...........................] - ETA: 2:37:11 - loss: 0.1986 - accuracy: 0.9256

 164/1563 [==>...........................] - ETA: 2:37:03 - loss: 0.1986 - accuracy: 0.9257

 165/1563 [==>...........................] - ETA: 2:36:55 - loss: 0.1980 - accuracy: 0.9261

 166/1563 [==>...........................] - ETA: 2:36:52 - loss: 0.1978 - accuracy: 0.9262

 167/1563 [==>...........................] - ETA: 2:36:44 - loss: 0.1977 - accuracy: 0.9263

 168/1563 [==>...........................] - ETA: 2:36:37 - loss: 0.1976 - accuracy: 0.9263

 169/1563 [==>...........................] - ETA: 2:36:30 - loss: 0.1988 - accuracy: 0.9257

 170/1563 [==>...........................] - ETA: 2:36:23 - loss: 0.1981 - accuracy: 0.9261

 171/1563 [==>...........................] - ETA: 2:36:19 - loss: 0.1976 - accuracy: 0.9262

 172/1563 [==>...........................] - ETA: 2:36:12 - loss: 0.1986 - accuracy: 0.9251

 173/1563 [==>...........................] - ETA: 2:36:04 - loss: 0.1980 - accuracy: 0.9256

 174/1563 [==>...........................] - ETA: 2:35:56 - loss: 0.1973 - accuracy: 0.9260

 175/1563 [==>...........................] - ETA: 2:35:49 - loss: 0.1990 - accuracy: 0.9257

 176/1563 [==>...........................] - ETA: 2:35:46 - loss: 0.1983 - accuracy: 0.9261

 177/1563 [==>...........................] - ETA: 2:35:38 - loss: 0.1990 - accuracy: 0.9258

 178/1563 [==>...........................] - ETA: 2:35:30 - loss: 0.1986 - accuracy: 0.9263

 179/1563 [==>...........................] - ETA: 2:35:23 - loss: 0.1979 - accuracy: 0.9267

 180/1563 [==>...........................] - ETA: 2:35:15 - loss: 0.1986 - accuracy: 0.9264

 181/1563 [==>...........................] - ETA: 2:35:11 - loss: 0.1994 - accuracy: 0.9265

 182/1563 [==>...........................] - ETA: 2:35:03 - loss: 0.2012 - accuracy: 0.9258

 183/1563 [==>...........................] - ETA: 2:34:56 - loss: 0.2003 - accuracy: 0.9262

 184/1563 [==>...........................] - ETA: 2:34:51 - loss: 0.1999 - accuracy: 0.9266

 185/1563 [==>...........................] - ETA: 2:34:49 - loss: 0.1996 - accuracy: 0.9267

 186/1563 [==>...........................] - ETA: 2:34:50 - loss: 0.1994 - accuracy: 0.9264

 187/1563 [==>...........................] - ETA: 2:34:49 - loss: 0.1992 - accuracy: 0.9265

 188/1563 [==>...........................] - ETA: 2:34:45 - loss: 0.1993 - accuracy: 0.9262

 189/1563 [==>...........................] - ETA: 2:34:38 - loss: 0.2012 - accuracy: 0.9253

 190/1563 [==>...........................] - ETA: 2:34:34 - loss: 0.2009 - accuracy: 0.9253

 191/1563 [==>...........................] - ETA: 2:34:27 - loss: 0.2015 - accuracy: 0.9247

 192/1563 [==>...........................] - ETA: 2:34:19 - loss: 0.2007 - accuracy: 0.9251

 193/1563 [==>...........................] - ETA: 2:34:11 - loss: 0.2001 - accuracy: 0.9255

 194/1563 [==>...........................] - ETA: 2:34:04 - loss: 0.1992 - accuracy: 0.9259

 195/1563 [==>...........................] - ETA: 2:34:00 - loss: 0.1985 - accuracy: 0.9263

 196/1563 [==>...........................] - ETA: 2:33:53 - loss: 0.1979 - accuracy: 0.9267

 197/1563 [==>...........................] - ETA: 2:33:46 - loss: 0.1983 - accuracy: 0.9264

 198/1563 [==>...........................] - ETA: 2:33:38 - loss: 0.1996 - accuracy: 0.9261

 199/1563 [==>...........................] - ETA: 2:33:30 - loss: 0.1994 - accuracy: 0.9262

 200/1563 [==>...........................] - ETA: 2:33:26 - loss: 0.1987 - accuracy: 0.9266

 201/1563 [==>...........................] - ETA: 2:33:19 - loss: 0.1991 - accuracy: 0.9263

 202/1563 [==>...........................] - ETA: 2:33:11 - loss: 0.2010 - accuracy: 0.9251

 203/1563 [==>...........................] - ETA: 2:33:03 - loss: 0.2000 - accuracy: 0.9255

 204/1563 [==>...........................] - ETA: 2:32:56 - loss: 0.2003 - accuracy: 0.9256

 205/1563 [==>...........................] - ETA: 2:32:50 - loss: 0.1998 - accuracy: 0.9256

 206/1563 [==>...........................] - ETA: 2:32:43 - loss: 0.1995 - accuracy: 0.9257

 207/1563 [==>...........................] - ETA: 2:32:36 - loss: 0.1995 - accuracy: 0.9257

 208/1563 [==>...........................] - ETA: 2:32:28 - loss: 0.2000 - accuracy: 0.9258

 209/1563 [===>..........................] - ETA: 2:32:23 - loss: 0.1991 - accuracy: 0.9261

 210/1563 [===>..........................] - ETA: 2:32:16 - loss: 0.2000 - accuracy: 0.9262

 211/1563 [===>..........................] - ETA: 2:32:09 - loss: 0.1997 - accuracy: 0.9262

 212/1563 [===>..........................] - ETA: 2:32:02 - loss: 0.2000 - accuracy: 0.9257

 213/1563 [===>..........................] - ETA: 2:31:54 - loss: 0.2001 - accuracy: 0.9255

 214/1563 [===>..........................] - ETA: 2:31:50 - loss: 0.1995 - accuracy: 0.9258

 215/1563 [===>..........................] - ETA: 2:31:42 - loss: 0.1992 - accuracy: 0.9259

 216/1563 [===>..........................] - ETA: 2:31:35 - loss: 0.1985 - accuracy: 0.9262

 217/1563 [===>..........................] - ETA: 2:31:28 - loss: 0.1990 - accuracy: 0.9263

 218/1563 [===>..........................] - ETA: 2:31:20 - loss: 0.2005 - accuracy: 0.9257

 219/1563 [===>..........................] - ETA: 2:31:15 - loss: 0.2010 - accuracy: 0.9252

 220/1563 [===>..........................] - ETA: 2:31:08 - loss: 0.2033 - accuracy: 0.9247

 221/1563 [===>..........................] - ETA: 2:31:00 - loss: 0.2033 - accuracy: 0.9242

 222/1563 [===>..........................] - ETA: 2:30:53 - loss: 0.2026 - accuracy: 0.9245

 223/1563 [===>..........................] - ETA: 2:30:46 - loss: 0.2023 - accuracy: 0.9246

 224/1563 [===>..........................] - ETA: 2:30:41 - loss: 0.2020 - accuracy: 0.9247

 225/1563 [===>..........................] - ETA: 2:30:34 - loss: 0.2020 - accuracy: 0.9244

 226/1563 [===>..........................] - ETA: 2:30:26 - loss: 0.2024 - accuracy: 0.9242

 227/1563 [===>..........................] - ETA: 2:30:18 - loss: 0.2016 - accuracy: 0.9246

 228/1563 [===>..........................] - ETA: 2:30:11 - loss: 0.2019 - accuracy: 0.9243

 229/1563 [===>..........................] - ETA: 2:30:06 - loss: 0.2016 - accuracy: 0.9244

 230/1563 [===>..........................] - ETA: 2:29:59 - loss: 0.2011 - accuracy: 0.9247

 231/1563 [===>..........................] - ETA: 2:29:51 - loss: 0.2014 - accuracy: 0.9245

 232/1563 [===>..........................] - ETA: 2:29:44 - loss: 0.2012 - accuracy: 0.9243

 233/1563 [===>..........................] - ETA: 2:29:36 - loss: 0.2014 - accuracy: 0.9244

 234/1563 [===>..........................] - ETA: 2:29:32 - loss: 0.2019 - accuracy: 0.9239

 235/1563 [===>..........................] - ETA: 2:29:24 - loss: 0.2019 - accuracy: 0.9239

 236/1563 [===>..........................] - ETA: 2:29:17 - loss: 0.2018 - accuracy: 0.9240

 237/1563 [===>..........................] - ETA: 2:29:10 - loss: 0.2016 - accuracy: 0.9241

 238/1563 [===>..........................] - ETA: 2:29:03 - loss: 0.2013 - accuracy: 0.9241

 239/1563 [===>..........................] - ETA: 2:28:57 - loss: 0.2011 - accuracy: 0.9242

 240/1563 [===>..........................] - ETA: 2:28:50 - loss: 0.2009 - accuracy: 0.9240

 241/1563 [===>..........................] - ETA: 2:28:42 - loss: 0.2004 - accuracy: 0.9243

 242/1563 [===>..........................] - ETA: 2:28:35 - loss: 0.2000 - accuracy: 0.9246

 243/1563 [===>..........................] - ETA: 2:28:29 - loss: 0.1996 - accuracy: 0.9249

 244/1563 [===>..........................] - ETA: 2:28:22 - loss: 0.2001 - accuracy: 0.9249

 245/1563 [===>..........................] - ETA: 2:28:14 - loss: 0.2007 - accuracy: 0.9247

 246/1563 [===>..........................] - ETA: 2:28:07 - loss: 0.2009 - accuracy: 0.9248

 247/1563 [===>..........................] - ETA: 2:28:00 - loss: 0.2010 - accuracy: 0.9248

 248/1563 [===>..........................] - ETA: 2:27:55 - loss: 0.2011 - accuracy: 0.9246

 249/1563 [===>..........................] - ETA: 2:27:48 - loss: 0.2008 - accuracy: 0.9247

 250/1563 [===>..........................] - ETA: 2:27:42 - loss: 0.2013 - accuracy: 0.9247

 251/1563 [===>..........................] - ETA: 2:27:35 - loss: 0.2013 - accuracy: 0.9248

 252/1563 [===>..........................] - ETA: 2:27:27 - loss: 0.2009 - accuracy: 0.9251

 253/1563 [===>..........................] - ETA: 2:27:23 - loss: 0.2015 - accuracy: 0.9251

 254/1563 [===>..........................] - ETA: 2:27:16 - loss: 0.2017 - accuracy: 0.9250

 255/1563 [===>..........................] - ETA: 2:27:09 - loss: 0.2012 - accuracy: 0.9252

 256/1563 [===>..........................] - ETA: 2:27:02 - loss: 0.2007 - accuracy: 0.9255

 257/1563 [===>..........................] - ETA: 2:26:55 - loss: 0.2022 - accuracy: 0.9253

 258/1563 [===>..........................] - ETA: 2:26:51 - loss: 0.2027 - accuracy: 0.9254

 259/1563 [===>..........................] - ETA: 2:26:44 - loss: 0.2027 - accuracy: 0.9254

 260/1563 [===>..........................] - ETA: 2:26:37 - loss: 0.2023 - accuracy: 0.9255

 261/1563 [====>.........................] - ETA: 2:26:30 - loss: 0.2019 - accuracy: 0.9258

 262/1563 [====>.........................] - ETA: 2:26:24 - loss: 0.2021 - accuracy: 0.9258

 263/1563 [====>.........................] - ETA: 2:26:19 - loss: 0.2030 - accuracy: 0.9254

 264/1563 [====>.........................] - ETA: 2:26:11 - loss: 0.2027 - accuracy: 0.9254

 265/1563 [====>.........................] - ETA: 2:26:04 - loss: 0.2024 - accuracy: 0.9255

 266/1563 [====>.........................] - ETA: 2:25:57 - loss: 0.2028 - accuracy: 0.9253

 267/1563 [====>.........................] - ETA: 2:25:49 - loss: 0.2028 - accuracy: 0.9253

 268/1563 [====>.........................] - ETA: 2:25:45 - loss: 0.2021 - accuracy: 0.9256

 269/1563 [====>.........................] - ETA: 2:25:38 - loss: 0.2023 - accuracy: 0.9254

 270/1563 [====>.........................] - ETA: 2:25:30 - loss: 0.2020 - accuracy: 0.9255

 271/1563 [====>.........................] - ETA: 2:25:23 - loss: 0.2018 - accuracy: 0.9255

 272/1563 [====>.........................] - ETA: 2:25:17 - loss: 0.2013 - accuracy: 0.9258

 273/1563 [====>.........................] - ETA: 2:25:10 - loss: 0.2011 - accuracy: 0.9258

 274/1563 [====>.........................] - ETA: 2:25:03 - loss: 0.2009 - accuracy: 0.9261

 275/1563 [====>.........................] - ETA: 2:24:56 - loss: 0.2008 - accuracy: 0.9261

 276/1563 [====>.........................] - ETA: 2:24:49 - loss: 0.2002 - accuracy: 0.9264

 277/1563 [====>.........................] - ETA: 2:24:44 - loss: 0.2004 - accuracy: 0.9260

 278/1563 [====>.........................] - ETA: 2:24:37 - loss: 0.2004 - accuracy: 0.9260

 279/1563 [====>.........................] - ETA: 2:24:30 - loss: 0.2001 - accuracy: 0.9261

 280/1563 [====>.........................] - ETA: 2:24:23 - loss: 0.1996 - accuracy: 0.9263

 281/1563 [====>.........................] - ETA: 2:24:17 - loss: 0.1995 - accuracy: 0.9262

 282/1563 [====>.........................] - ETA: 2:24:12 - loss: 0.1996 - accuracy: 0.9262

 283/1563 [====>.........................] - ETA: 2:24:05 - loss: 0.2002 - accuracy: 0.9260

 284/1563 [====>.........................] - ETA: 2:23:58 - loss: 0.1998 - accuracy: 0.9263

 285/1563 [====>.........................] - ETA: 2:23:51 - loss: 0.1995 - accuracy: 0.9263

 286/1563 [====>.........................] - ETA: 2:23:44 - loss: 0.1993 - accuracy: 0.9264

 287/1563 [====>.........................] - ETA: 2:23:39 - loss: 0.1989 - accuracy: 0.9266

 288/1563 [====>.........................] - ETA: 2:23:32 - loss: 0.1999 - accuracy: 0.9266

 289/1563 [====>.........................] - ETA: 2:23:25 - loss: 0.2006 - accuracy: 0.9265

 290/1563 [====>.........................] - ETA: 2:23:18 - loss: 0.2013 - accuracy: 0.9263

 291/1563 [====>.........................] - ETA: 2:23:11 - loss: 0.2015 - accuracy: 0.9259

 292/1563 [====>.........................] - ETA: 2:23:06 - loss: 0.2011 - accuracy: 0.9262

 293/1563 [====>.........................] - ETA: 2:23:00 - loss: 0.2007 - accuracy: 0.9264

 294/1563 [====>.........................] - ETA: 2:22:53 - loss: 0.2003 - accuracy: 0.9267

 295/1563 [====>.........................] - ETA: 2:22:45 - loss: 0.2002 - accuracy: 0.9267

 296/1563 [====>.........................] - ETA: 2:22:39 - loss: 0.2001 - accuracy: 0.9267

 297/1563 [====>.........................] - ETA: 2:22:34 - loss: 0.1999 - accuracy: 0.9268

 298/1563 [====>.........................] - ETA: 2:22:26 - loss: 0.1996 - accuracy: 0.9268

 299/1563 [====>.........................] - ETA: 2:22:19 - loss: 0.1993 - accuracy: 0.9270

 300/1563 [====>.........................] - ETA: 2:22:12 - loss: 0.1992 - accuracy: 0.9271

 301/1563 [====>.........................] - ETA: 2:22:06 - loss: 0.1987 - accuracy: 0.9273

 302/1563 [====>.........................] - ETA: 2:21:59 - loss: 0.1989 - accuracy: 0.9274

 303/1563 [====>.........................] - ETA: 2:21:52 - loss: 0.1986 - accuracy: 0.9276

 304/1563 [====>.........................] - ETA: 2:21:44 - loss: 0.1984 - accuracy: 0.9276

 305/1563 [====>.........................] - ETA: 2:21:37 - loss: 0.1982 - accuracy: 0.9277

 306/1563 [====>.........................] - ETA: 2:21:32 - loss: 0.1980 - accuracy: 0.9277

 307/1563 [====>.........................] - ETA: 2:21:25 - loss: 0.1976 - accuracy: 0.9277

 308/1563 [====>.........................] - ETA: 2:21:17 - loss: 0.1971 - accuracy: 0.9280

 309/1563 [====>.........................] - ETA: 2:21:11 - loss: 0.1972 - accuracy: 0.9278

 310/1563 [====>.........................] - ETA: 2:21:03 - loss: 0.1966 - accuracy: 0.9280

 311/1563 [====>.........................] - ETA: 2:20:58 - loss: 0.1968 - accuracy: 0.9281

 312/1563 [====>.........................] - ETA: 2:20:51 - loss: 0.1965 - accuracy: 0.9283

 313/1563 [=====>........................] - ETA: 2:20:44 - loss: 0.1960 - accuracy: 0.9285

 314/1563 [=====>........................] - ETA: 2:20:37 - loss: 0.1954 - accuracy: 0.9287

 315/1563 [=====>........................] - ETA: 2:20:30 - loss: 0.1957 - accuracy: 0.9288

 316/1563 [=====>........................] - ETA: 2:20:25 - loss: 0.1951 - accuracy: 0.9290

 317/1563 [=====>........................] - ETA: 2:20:17 - loss: 0.1951 - accuracy: 0.9288

 318/1563 [=====>........................] - ETA: 2:20:10 - loss: 0.1953 - accuracy: 0.9289

 319/1563 [=====>........................] - ETA: 2:20:03 - loss: 0.1951 - accuracy: 0.9289

 320/1563 [=====>........................] - ETA: 2:19:56 - loss: 0.1946 - accuracy: 0.9291

 321/1563 [=====>........................] - ETA: 2:19:51 - loss: 0.1950 - accuracy: 0.9287

 322/1563 [=====>........................] - ETA: 2:19:45 - loss: 0.1949 - accuracy: 0.9288

 323/1563 [=====>........................] - ETA: 2:19:37 - loss: 0.1946 - accuracy: 0.9288

 324/1563 [=====>........................] - ETA: 2:19:30 - loss: 0.1946 - accuracy: 0.9286

 325/1563 [=====>........................] - ETA: 2:19:23 - loss: 0.1942 - accuracy: 0.9288

 326/1563 [=====>........................] - ETA: 2:19:18 - loss: 0.1944 - accuracy: 0.9287

 327/1563 [=====>........................] - ETA: 2:19:11 - loss: 0.1942 - accuracy: 0.9285

 328/1563 [=====>........................] - ETA: 2:19:04 - loss: 0.1943 - accuracy: 0.9285

 329/1563 [=====>........................] - ETA: 2:18:57 - loss: 0.1941 - accuracy: 0.9286

 330/1563 [=====>........................] - ETA: 2:18:51 - loss: 0.1935 - accuracy: 0.9288

 331/1563 [=====>........................] - ETA: 2:18:45 - loss: 0.1934 - accuracy: 0.9288

 332/1563 [=====>........................] - ETA: 2:18:37 - loss: 0.1934 - accuracy: 0.9287

 333/1563 [=====>........................] - ETA: 2:18:30 - loss: 0.1930 - accuracy: 0.9289

 334/1563 [=====>........................] - ETA: 2:18:23 - loss: 0.1927 - accuracy: 0.9289

 335/1563 [=====>........................] - ETA: 2:18:18 - loss: 0.1926 - accuracy: 0.9289

 336/1563 [=====>........................] - ETA: 2:18:11 - loss: 0.1928 - accuracy: 0.9289

 337/1563 [=====>........................] - ETA: 2:18:04 - loss: 0.1924 - accuracy: 0.9290

 338/1563 [=====>........................] - ETA: 2:17:56 - loss: 0.1919 - accuracy: 0.9292

 339/1563 [=====>........................] - ETA: 2:17:49 - loss: 0.1922 - accuracy: 0.9290

 340/1563 [=====>........................] - ETA: 2:17:44 - loss: 0.1933 - accuracy: 0.9287

 341/1563 [=====>........................] - ETA: 2:17:37 - loss: 0.1942 - accuracy: 0.9285

 342/1563 [=====>........................] - ETA: 2:17:31 - loss: 0.1940 - accuracy: 0.9285

 343/1563 [=====>........................] - ETA: 2:17:24 - loss: 0.1950 - accuracy: 0.9282

 344/1563 [=====>........................] - ETA: 2:17:17 - loss: 0.1946 - accuracy: 0.9284

 345/1563 [=====>........................] - ETA: 2:17:12 - loss: 0.1949 - accuracy: 0.9283

 346/1563 [=====>........................] - ETA: 2:17:05 - loss: 0.1946 - accuracy: 0.9283

 347/1563 [=====>........................] - ETA: 2:16:58 - loss: 0.1944 - accuracy: 0.9283

 348/1563 [=====>........................] - ETA: 2:16:51 - loss: 0.1945 - accuracy: 0.9283

 349/1563 [=====>........................] - ETA: 2:16:44 - loss: 0.1942 - accuracy: 0.9284

 350/1563 [=====>........................] - ETA: 2:16:39 - loss: 0.1940 - accuracy: 0.9284

 351/1563 [=====>........................] - ETA: 2:16:32 - loss: 0.1937 - accuracy: 0.9286

 352/1563 [=====>........................] - ETA: 2:16:25 - loss: 0.1937 - accuracy: 0.9286

 353/1563 [=====>........................] - ETA: 2:16:19 - loss: 0.1937 - accuracy: 0.9286

 354/1563 [=====>........................] - ETA: 2:16:13 - loss: 0.1939 - accuracy: 0.9285

 355/1563 [=====>........................] - ETA: 2:16:07 - loss: 0.1947 - accuracy: 0.9278

 356/1563 [=====>........................] - ETA: 2:16:00 - loss: 0.1943 - accuracy: 0.9280

 357/1563 [=====>........................] - ETA: 2:15:53 - loss: 0.1940 - accuracy: 0.9282

 358/1563 [=====>........................] - ETA: 2:15:46 - loss: 0.1944 - accuracy: 0.9281

 359/1563 [=====>........................] - ETA: 2:15:41 - loss: 0.1944 - accuracy: 0.9279

 360/1563 [=====>........................] - ETA: 2:15:34 - loss: 0.1944 - accuracy: 0.9280

 361/1563 [=====>........................] - ETA: 2:15:27 - loss: 0.1941 - accuracy: 0.9280

 362/1563 [=====>........................] - ETA: 2:15:20 - loss: 0.1939 - accuracy: 0.9282

 363/1563 [=====>........................] - ETA: 2:15:13 - loss: 0.1940 - accuracy: 0.9280

 364/1563 [=====>........................] - ETA: 2:15:08 - loss: 0.1939 - accuracy: 0.9281

































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































Epoch 3/3


   1/1563 [..............................] - ETA: 2:50:52 - loss: 0.1532 - accuracy: 0.9375

   2/1563 [..............................] - ETA: 2:58:03 - loss: 0.1219 - accuracy: 0.9688

   3/1563 [..............................] - ETA: 2:53:34 - loss: 0.0883 - accuracy: 0.9792

   4/1563 [..............................] - ETA: 2:51:35 - loss: 0.1027 - accuracy: 0.9688

   5/1563 [..............................] - ETA: 2:50:13 - loss: 0.1214 - accuracy: 0.9625

   6/1563 [..............................] - ETA: 2:49:54 - loss: 0.1517 - accuracy: 0.9375

   7/1563 [..............................] - ETA: 2:50:58 - loss: 0.1321 - accuracy: 0.9464

   8/1563 [..............................] - ETA: 2:50:18 - loss: 0.1334 - accuracy: 0.9453

   9/1563 [..............................] - ETA: 2:49:57 - loss: 0.1283 - accuracy: 0.9514

  10/1563 [..............................] - ETA: 2:49:15 - loss: 0.1171 - accuracy: 0.9563

  11/1563 [..............................] - ETA: 2:49:43 - loss: 0.1106 - accuracy: 0.9602

  12/1563 [..............................] - ETA: 2:50:29 - loss: 0.1105 - accuracy: 0.9583

  13/1563 [..............................] - ETA: 2:50:17 - loss: 0.1065 - accuracy: 0.9615

  14/1563 [..............................] - ETA: 2:50:10 - loss: 0.1136 - accuracy: 0.9598

  15/1563 [..............................] - ETA: 2:50:04 - loss: 0.1240 - accuracy: 0.9542

  16/1563 [..............................] - ETA: 2:50:35 - loss: 0.1355 - accuracy: 0.9531

  17/1563 [..............................] - ETA: 2:50:49 - loss: 0.1316 - accuracy: 0.9559

  18/1563 [..............................] - ETA: 2:50:35 - loss: 0.1382 - accuracy: 0.9514

  19/1563 [..............................] - ETA: 2:50:15 - loss: 0.1322 - accuracy: 0.9539

  20/1563 [..............................] - ETA: 2:49:54 - loss: 0.1288 - accuracy: 0.9563

  21/1563 [..............................] - ETA: 2:50:17 - loss: 0.1238 - accuracy: 0.9583

  22/1563 [..............................] - ETA: 2:49:58 - loss: 0.1237 - accuracy: 0.9574

  23/1563 [..............................] - ETA: 2:49:50 - loss: 0.1237 - accuracy: 0.9565

  24/1563 [..............................] - ETA: 2:49:36 - loss: 0.1212 - accuracy: 0.9583

  25/1563 [..............................] - ETA: 2:49:15 - loss: 0.1179 - accuracy: 0.9600

  26/1563 [..............................] - ETA: 2:49:33 - loss: 0.1158 - accuracy: 0.9591

  27/1563 [..............................] - ETA: 2:49:15 - loss: 0.1130 - accuracy: 0.9606

  28/1563 [..............................] - ETA: 2:49:01 - loss: 0.1101 - accuracy: 0.9621

  29/1563 [..............................] - ETA: 2:48:51 - loss: 0.1083 - accuracy: 0.9634

  30/1563 [..............................] - ETA: 2:48:45 - loss: 0.1072 - accuracy: 0.9646

  31/1563 [..............................] - ETA: 2:49:02 - loss: 0.1043 - accuracy: 0.9657

  32/1563 [..............................] - ETA: 2:48:56 - loss: 0.1022 - accuracy: 0.9668

  33/1563 [..............................] - ETA: 2:48:42 - loss: 0.0997 - accuracy: 0.9678

  34/1563 [..............................] - ETA: 2:48:24 - loss: 0.0972 - accuracy: 0.9688

  35/1563 [..............................] - ETA: 2:48:13 - loss: 0.0972 - accuracy: 0.9679

  36/1563 [..............................] - ETA: 2:48:25 - loss: 0.0963 - accuracy: 0.9670

  37/1563 [..............................] - ETA: 2:48:14 - loss: 0.0991 - accuracy: 0.9645

  38/1563 [..............................] - ETA: 2:48:08 - loss: 0.0968 - accuracy: 0.9655

  39/1563 [..............................] - ETA: 2:48:00 - loss: 0.0971 - accuracy: 0.9647

  40/1563 [..............................] - ETA: 2:47:51 - loss: 0.1014 - accuracy: 0.9641

  41/1563 [..............................] - ETA: 2:48:12 - loss: 0.1002 - accuracy: 0.9649

  42/1563 [..............................] - ETA: 2:48:08 - loss: 0.0988 - accuracy: 0.9658

  43/1563 [..............................] - ETA: 2:48:02 - loss: 0.0974 - accuracy: 0.9666

  44/1563 [..............................] - ETA: 2:47:54 - loss: 0.0965 - accuracy: 0.9659

  45/1563 [..............................] - ETA: 2:47:47 - loss: 0.0946 - accuracy: 0.9667

  46/1563 [..............................] - ETA: 2:48:05 - loss: 0.0957 - accuracy: 0.9660

  47/1563 [..............................] - ETA: 2:47:59 - loss: 0.0944 - accuracy: 0.9668

  48/1563 [..............................] - ETA: 2:47:51 - loss: 0.0927 - accuracy: 0.9674

  49/1563 [..............................] - ETA: 2:47:36 - loss: 0.0910 - accuracy: 0.9681

  50/1563 [..............................] - ETA: 2:47:24 - loss: 0.0898 - accuracy: 0.9688

  51/1563 [..............................] - ETA: 2:47:27 - loss: 0.0914 - accuracy: 0.9681

  52/1563 [..............................] - ETA: 2:47:19 - loss: 0.0897 - accuracy: 0.9688

  53/1563 [>.............................] - ETA: 2:47:12 - loss: 0.0911 - accuracy: 0.9682

  54/1563 [>.............................] - ETA: 2:47:07 - loss: 0.0895 - accuracy: 0.9688

  55/1563 [>.............................] - ETA: 2:46:59 - loss: 0.0934 - accuracy: 0.9670

  56/1563 [>.............................] - ETA: 2:47:09 - loss: 0.0919 - accuracy: 0.9676

  57/1563 [>.............................] - ETA: 2:46:58 - loss: 0.0912 - accuracy: 0.9682

  58/1563 [>.............................] - ETA: 2:46:46 - loss: 0.0899 - accuracy: 0.9688

  59/1563 [>.............................] - ETA: 2:46:36 - loss: 0.0885 - accuracy: 0.9693

  60/1563 [>.............................] - ETA: 2:46:26 - loss: 0.0902 - accuracy: 0.9688

  61/1563 [>.............................] - ETA: 2:46:30 - loss: 0.0897 - accuracy: 0.9682

  62/1563 [>.............................] - ETA: 2:46:19 - loss: 0.0883 - accuracy: 0.9688

  63/1563 [>.............................] - ETA: 2:46:09 - loss: 0.0876 - accuracy: 0.9683

  64/1563 [>.............................] - ETA: 2:45:56 - loss: 0.0865 - accuracy: 0.9688

  65/1563 [>.............................] - ETA: 2:45:48 - loss: 0.0857 - accuracy: 0.9692

  66/1563 [>.............................] - ETA: 2:45:49 - loss: 0.0860 - accuracy: 0.9688

  67/1563 [>.............................] - ETA: 2:45:37 - loss: 0.0849 - accuracy: 0.9692

  68/1563 [>.............................] - ETA: 2:45:27 - loss: 0.0838 - accuracy: 0.9697

  69/1563 [>.............................] - ETA: 2:45:16 - loss: 0.0836 - accuracy: 0.9692

  70/1563 [>.............................] - ETA: 2:45:04 - loss: 0.0855 - accuracy: 0.9688

  71/1563 [>.............................] - ETA: 2:45:07 - loss: 0.0852 - accuracy: 0.9692

  72/1563 [>.............................] - ETA: 2:44:57 - loss: 0.0840 - accuracy: 0.9696

  73/1563 [>.............................] - ETA: 2:44:45 - loss: 0.0840 - accuracy: 0.9700

  74/1563 [>.............................] - ETA: 2:44:34 - loss: 0.0830 - accuracy: 0.9704

  75/1563 [>.............................] - ETA: 2:44:23 - loss: 0.0848 - accuracy: 0.9700

  76/1563 [>.............................] - ETA: 2:44:25 - loss: 0.0850 - accuracy: 0.9696

  77/1563 [>.............................] - ETA: 2:44:15 - loss: 0.0854 - accuracy: 0.9692

  78/1563 [>.............................] - ETA: 2:44:05 - loss: 0.0860 - accuracy: 0.9688

  79/1563 [>.............................] - ETA: 2:43:55 - loss: 0.0853 - accuracy: 0.9691

  80/1563 [>.............................] - ETA: 2:43:45 - loss: 0.0843 - accuracy: 0.9695

  81/1563 [>.............................] - ETA: 2:43:47 - loss: 0.0834 - accuracy: 0.9699

  82/1563 [>.............................] - ETA: 2:43:38 - loss: 0.0825 - accuracy: 0.9703

  83/1563 [>.............................] - ETA: 2:43:29 - loss: 0.0818 - accuracy: 0.9706

  84/1563 [>.............................] - ETA: 2:43:19 - loss: 0.0815 - accuracy: 0.9710

  85/1563 [>.............................] - ETA: 2:43:10 - loss: 0.0809 - accuracy: 0.9713

  86/1563 [>.............................] - ETA: 2:43:10 - loss: 0.0820 - accuracy: 0.9709

  87/1563 [>.............................] - ETA: 2:43:01 - loss: 0.0815 - accuracy: 0.9713

  88/1563 [>.............................] - ETA: 2:42:53 - loss: 0.0818 - accuracy: 0.9716

  89/1563 [>.............................] - ETA: 2:42:44 - loss: 0.0823 - accuracy: 0.9712

  90/1563 [>.............................] - ETA: 2:42:37 - loss: 0.0815 - accuracy: 0.9715

  91/1563 [>.............................] - ETA: 2:42:34 - loss: 0.0810 - accuracy: 0.9718

  92/1563 [>.............................] - ETA: 2:42:26 - loss: 0.0806 - accuracy: 0.9721

  93/1563 [>.............................] - ETA: 2:42:17 - loss: 0.0813 - accuracy: 0.9718

  94/1563 [>.............................] - ETA: 2:42:08 - loss: 0.0806 - accuracy: 0.9721

  95/1563 [>.............................] - ETA: 2:42:03 - loss: 0.0801 - accuracy: 0.9724

  96/1563 [>.............................] - ETA: 2:41:58 - loss: 0.0795 - accuracy: 0.9727

  97/1563 [>.............................] - ETA: 2:41:51 - loss: 0.0788 - accuracy: 0.9729

  98/1563 [>.............................] - ETA: 2:41:43 - loss: 0.0784 - accuracy: 0.9732

  99/1563 [>.............................] - ETA: 2:41:33 - loss: 0.0777 - accuracy: 0.9735

 100/1563 [>.............................] - ETA: 2:41:30 - loss: 0.0774 - accuracy: 0.9737

 101/1563 [>.............................] - ETA: 2:41:23 - loss: 0.0771 - accuracy: 0.9740

 102/1563 [>.............................] - ETA: 2:41:15 - loss: 0.0791 - accuracy: 0.9737

 103/1563 [>.............................] - ETA: 2:41:06 - loss: 0.0783 - accuracy: 0.9739

 104/1563 [>.............................] - ETA: 2:40:58 - loss: 0.0777 - accuracy: 0.9742

 105/1563 [=>............................] - ETA: 2:40:55 - loss: 0.0773 - accuracy: 0.9744

 106/1563 [=>............................] - ETA: 2:40:49 - loss: 0.0767 - accuracy: 0.9746

 107/1563 [=>............................] - ETA: 2:40:41 - loss: 0.0777 - accuracy: 0.9743

 108/1563 [=>............................] - ETA: 2:40:33 - loss: 0.0794 - accuracy: 0.9740

 109/1563 [=>............................] - ETA: 2:40:26 - loss: 0.0788 - accuracy: 0.9742

 110/1563 [=>............................] - ETA: 2:40:23 - loss: 0.0787 - accuracy: 0.9744

 111/1563 [=>............................] - ETA: 2:40:16 - loss: 0.0800 - accuracy: 0.9735

 112/1563 [=>............................] - ETA: 2:40:07 - loss: 0.0796 - accuracy: 0.9738

 113/1563 [=>............................] - ETA: 2:39:59 - loss: 0.0792 - accuracy: 0.9740

 114/1563 [=>............................] - ETA: 2:39:50 - loss: 0.0789 - accuracy: 0.9742

 115/1563 [=>............................] - ETA: 2:39:48 - loss: 0.0796 - accuracy: 0.9739

 116/1563 [=>............................] - ETA: 2:39:40 - loss: 0.0799 - accuracy: 0.9736

 117/1563 [=>............................] - ETA: 2:39:30 - loss: 0.0795 - accuracy: 0.9738

 118/1563 [=>............................] - ETA: 2:39:21 - loss: 0.0789 - accuracy: 0.9740

 119/1563 [=>............................] - ETA: 2:39:14 - loss: 0.0798 - accuracy: 0.9732

 120/1563 [=>............................] - ETA: 2:39:12 - loss: 0.0795 - accuracy: 0.9734

 121/1563 [=>............................] - ETA: 2:39:03 - loss: 0.0797 - accuracy: 0.9731

 122/1563 [=>............................] - ETA: 2:38:55 - loss: 0.0792 - accuracy: 0.9734

 123/1563 [=>............................] - ETA: 2:38:47 - loss: 0.0788 - accuracy: 0.9736

 124/1563 [=>............................] - ETA: 2:38:39 - loss: 0.0784 - accuracy: 0.9738

 125/1563 [=>............................] - ETA: 2:38:36 - loss: 0.0824 - accuracy: 0.9735

 126/1563 [=>............................] - ETA: 2:38:29 - loss: 0.0833 - accuracy: 0.9732

 127/1563 [=>............................] - ETA: 2:38:20 - loss: 0.0828 - accuracy: 0.9734

 128/1563 [=>............................] - ETA: 2:38:13 - loss: 0.0836 - accuracy: 0.9731

 129/1563 [=>............................] - ETA: 2:38:04 - loss: 0.0838 - accuracy: 0.9729

 130/1563 [=>............................] - ETA: 2:38:02 - loss: 0.0840 - accuracy: 0.9726

 131/1563 [=>............................] - ETA: 2:37:54 - loss: 0.0834 - accuracy: 0.9728

 132/1563 [=>............................] - ETA: 2:37:45 - loss: 0.0837 - accuracy: 0.9725

 133/1563 [=>............................] - ETA: 2:37:38 - loss: 0.0838 - accuracy: 0.9723

 134/1563 [=>............................] - ETA: 2:37:29 - loss: 0.0847 - accuracy: 0.9720

 135/1563 [=>............................] - ETA: 2:37:28 - loss: 0.0841 - accuracy: 0.9722

 136/1563 [=>............................] - ETA: 2:37:20 - loss: 0.0837 - accuracy: 0.9724

 137/1563 [=>............................] - ETA: 2:37:11 - loss: 0.0852 - accuracy: 0.9717

 138/1563 [=>............................] - ETA: 2:37:04 - loss: 0.0851 - accuracy: 0.9719

 139/1563 [=>............................] - ETA: 2:36:56 - loss: 0.0847 - accuracy: 0.9721

 140/1563 [=>............................] - ETA: 2:36:52 - loss: 0.0846 - accuracy: 0.9719

 141/1563 [=>............................] - ETA: 2:36:45 - loss: 0.0841 - accuracy: 0.9721

 142/1563 [=>............................] - ETA: 2:36:38 - loss: 0.0846 - accuracy: 0.9718

 143/1563 [=>............................] - ETA: 2:36:30 - loss: 0.0841 - accuracy: 0.9720

 144/1563 [=>............................] - ETA: 2:36:23 - loss: 0.0836 - accuracy: 0.9722

 145/1563 [=>............................] - ETA: 2:36:21 - loss: 0.0830 - accuracy: 0.9724

 146/1563 [=>............................] - ETA: 2:36:14 - loss: 0.0826 - accuracy: 0.9726

 147/1563 [=>............................] - ETA: 2:36:08 - loss: 0.0822 - accuracy: 0.9728

 148/1563 [=>............................] - ETA: 2:36:02 - loss: 0.0824 - accuracy: 0.9730

 149/1563 [=>............................] - ETA: 2:35:53 - loss: 0.0822 - accuracy: 0.9732

 150/1563 [=>............................] - ETA: 2:35:48 - loss: 0.0837 - accuracy: 0.9729

 151/1563 [=>............................] - ETA: 2:35:39 - loss: 0.0850 - accuracy: 0.9727

 152/1563 [=>............................] - ETA: 2:35:31 - loss: 0.0845 - accuracy: 0.9729

 153/1563 [=>............................] - ETA: 2:35:21 - loss: 0.0841 - accuracy: 0.9730

 154/1563 [=>............................] - ETA: 2:35:10 - loss: 0.0838 - accuracy: 0.9732

 155/1563 [=>............................] - ETA: 2:35:03 - loss: 0.0835 - accuracy: 0.9734

 156/1563 [=>............................] - ETA: 2:34:53 - loss: 0.0831 - accuracy: 0.9736

 157/1563 [==>...........................] - ETA: 2:34:43 - loss: 0.0829 - accuracy: 0.9737

 158/1563 [==>...........................] - ETA: 2:34:33 - loss: 0.0827 - accuracy: 0.9739

 159/1563 [==>...........................] - ETA: 2:34:23 - loss: 0.0836 - accuracy: 0.9737

 160/1563 [==>...........................] - ETA: 2:34:14 - loss: 0.0835 - accuracy: 0.9734

 161/1563 [==>...........................] - ETA: 2:34:06 - loss: 0.0831 - accuracy: 0.9736

 162/1563 [==>...........................] - ETA: 2:33:56 - loss: 0.0828 - accuracy: 0.9738

 163/1563 [==>...........................] - ETA: 2:33:46 - loss: 0.0833 - accuracy: 0.9735

 164/1563 [==>...........................] - ETA: 2:33:36 - loss: 0.0828 - accuracy: 0.9737

 165/1563 [==>...........................] - ETA: 2:33:26 - loss: 0.0838 - accuracy: 0.9731

 166/1563 [==>...........................] - ETA: 2:33:21 - loss: 0.0833 - accuracy: 0.9733

 167/1563 [==>...........................] - ETA: 2:33:12 - loss: 0.0829 - accuracy: 0.9734

 168/1563 [==>...........................] - ETA: 2:33:04 - loss: 0.0846 - accuracy: 0.9732

 169/1563 [==>...........................] - ETA: 2:32:58 - loss: 0.0844 - accuracy: 0.9734

 170/1563 [==>...........................] - ETA: 2:32:51 - loss: 0.0841 - accuracy: 0.9735

 171/1563 [==>...........................] - ETA: 2:32:47 - loss: 0.0837 - accuracy: 0.9737

 172/1563 [==>...........................] - ETA: 2:32:40 - loss: 0.0846 - accuracy: 0.9735

 173/1563 [==>...........................] - ETA: 2:32:34 - loss: 0.0843 - accuracy: 0.9736

 174/1563 [==>...........................] - ETA: 2:32:27 - loss: 0.0839 - accuracy: 0.9738

 175/1563 [==>...........................] - ETA: 2:32:25 - loss: 0.0846 - accuracy: 0.9732

 176/1563 [==>...........................] - ETA: 2:32:21 - loss: 0.0850 - accuracy: 0.9730

 177/1563 [==>...........................] - ETA: 2:32:16 - loss: 0.0847 - accuracy: 0.9732

 178/1563 [==>...........................] - ETA: 2:32:09 - loss: 0.0849 - accuracy: 0.9730

 179/1563 [==>...........................] - ETA: 2:32:03 - loss: 0.0855 - accuracy: 0.9728

 180/1563 [==>...........................] - ETA: 2:32:01 - loss: 0.0856 - accuracy: 0.9726

 181/1563 [==>...........................] - ETA: 2:31:54 - loss: 0.0863 - accuracy: 0.9724

 182/1563 [==>...........................] - ETA: 2:31:48 - loss: 0.0866 - accuracy: 0.9722

 183/1563 [==>...........................] - ETA: 2:31:42 - loss: 0.0864 - accuracy: 0.9723

 184/1563 [==>...........................] - ETA: 2:31:35 - loss: 0.0862 - accuracy: 0.9725

 185/1563 [==>...........................] - ETA: 2:31:32 - loss: 0.0859 - accuracy: 0.9726

 186/1563 [==>...........................] - ETA: 2:31:26 - loss: 0.0880 - accuracy: 0.9724

 187/1563 [==>...........................] - ETA: 2:31:19 - loss: 0.0880 - accuracy: 0.9723

 188/1563 [==>...........................] - ETA: 2:31:12 - loss: 0.0878 - accuracy: 0.9724

 189/1563 [==>...........................] - ETA: 2:31:05 - loss: 0.0882 - accuracy: 0.9722

 190/1563 [==>...........................] - ETA: 2:31:02 - loss: 0.0883 - accuracy: 0.9720

 191/1563 [==>...........................] - ETA: 2:30:57 - loss: 0.0894 - accuracy: 0.9715

 192/1563 [==>...........................] - ETA: 2:30:50 - loss: 0.0893 - accuracy: 0.9717

 193/1563 [==>...........................] - ETA: 2:30:43 - loss: 0.0891 - accuracy: 0.9718

 194/1563 [==>...........................] - ETA: 2:30:36 - loss: 0.0891 - accuracy: 0.9716

 195/1563 [==>...........................] - ETA: 2:30:32 - loss: 0.0909 - accuracy: 0.9712

 196/1563 [==>...........................] - ETA: 2:30:25 - loss: 0.0906 - accuracy: 0.9713

 197/1563 [==>...........................] - ETA: 2:30:17 - loss: 0.0902 - accuracy: 0.9714

 198/1563 [==>...........................] - ETA: 2:30:08 - loss: 0.0899 - accuracy: 0.9716

 199/1563 [==>...........................] - ETA: 2:29:59 - loss: 0.0895 - accuracy: 0.9717

 200/1563 [==>...........................] - ETA: 2:29:54 - loss: 0.0895 - accuracy: 0.9719

 201/1563 [==>...........................] - ETA: 2:29:46 - loss: 0.0892 - accuracy: 0.9720

 202/1563 [==>...........................] - ETA: 2:29:39 - loss: 0.0889 - accuracy: 0.9722

 203/1563 [==>...........................] - ETA: 2:29:30 - loss: 0.0886 - accuracy: 0.9723

 204/1563 [==>...........................] - ETA: 2:29:20 - loss: 0.0883 - accuracy: 0.9724

 205/1563 [==>...........................] - ETA: 2:29:15 - loss: 0.0884 - accuracy: 0.9723

 206/1563 [==>...........................] - ETA: 2:29:07 - loss: 0.0882 - accuracy: 0.9724

 207/1563 [==>...........................] - ETA: 2:28:58 - loss: 0.0879 - accuracy: 0.9725

 208/1563 [==>...........................] - ETA: 2:28:49 - loss: 0.0895 - accuracy: 0.9721

 209/1563 [===>..........................] - ETA: 2:28:40 - loss: 0.0894 - accuracy: 0.9722

 210/1563 [===>..........................] - ETA: 2:28:34 - loss: 0.0898 - accuracy: 0.9720

 211/1563 [===>..........................] - ETA: 2:28:26 - loss: 0.0906 - accuracy: 0.9716

 212/1563 [===>..........................] - ETA: 2:28:18 - loss: 0.0903 - accuracy: 0.9717

 213/1563 [===>..........................] - ETA: 2:28:09 - loss: 0.0902 - accuracy: 0.9718

 214/1563 [===>..........................] - ETA: 2:28:00 - loss: 0.0898 - accuracy: 0.9720

 215/1563 [===>..........................] - ETA: 2:27:52 - loss: 0.0895 - accuracy: 0.9721

 216/1563 [===>..........................] - ETA: 2:27:46 - loss: 0.0891 - accuracy: 0.9722

 217/1563 [===>..........................] - ETA: 2:27:37 - loss: 0.0891 - accuracy: 0.9724

 218/1563 [===>..........................] - ETA: 2:27:28 - loss: 0.0889 - accuracy: 0.9725

 219/1563 [===>..........................] - ETA: 2:27:20 - loss: 0.0886 - accuracy: 0.9726

 220/1563 [===>..........................] - ETA: 2:27:12 - loss: 0.0889 - accuracy: 0.9724

 221/1563 [===>..........................] - ETA: 2:27:07 - loss: 0.0885 - accuracy: 0.9726

 222/1563 [===>..........................] - ETA: 2:26:58 - loss: 0.0884 - accuracy: 0.9724

 223/1563 [===>..........................] - ETA: 2:26:50 - loss: 0.0885 - accuracy: 0.9723

 224/1563 [===>..........................] - ETA: 2:26:42 - loss: 0.0893 - accuracy: 0.9721

 225/1563 [===>..........................] - ETA: 2:26:33 - loss: 0.0892 - accuracy: 0.9719

 226/1563 [===>..........................] - ETA: 2:26:28 - loss: 0.0890 - accuracy: 0.9721

 227/1563 [===>..........................] - ETA: 2:26:19 - loss: 0.0890 - accuracy: 0.9719

 228/1563 [===>..........................] - ETA: 2:26:11 - loss: 0.0887 - accuracy: 0.9720

 229/1563 [===>..........................] - ETA: 2:26:03 - loss: 0.0884 - accuracy: 0.9722

 230/1563 [===>..........................] - ETA: 2:25:54 - loss: 0.0883 - accuracy: 0.9723

 231/1563 [===>..........................] - ETA: 2:25:49 - loss: 0.0881 - accuracy: 0.9724

 232/1563 [===>..........................] - ETA: 2:25:40 - loss: 0.0878 - accuracy: 0.9725

 233/1563 [===>..........................] - ETA: 2:25:32 - loss: 0.0874 - accuracy: 0.9726

 234/1563 [===>..........................] - ETA: 2:25:24 - loss: 0.0871 - accuracy: 0.9728

 235/1563 [===>..........................] - ETA: 2:25:15 - loss: 0.0871 - accuracy: 0.9726

 236/1563 [===>..........................] - ETA: 2:25:11 - loss: 0.0869 - accuracy: 0.9727

 237/1563 [===>..........................] - ETA: 2:25:03 - loss: 0.0874 - accuracy: 0.9723

 238/1563 [===>..........................] - ETA: 2:24:56 - loss: 0.0871 - accuracy: 0.9724

 239/1563 [===>..........................] - ETA: 2:24:48 - loss: 0.0877 - accuracy: 0.9723

 240/1563 [===>..........................] - ETA: 2:24:41 - loss: 0.0873 - accuracy: 0.9724

 241/1563 [===>..........................] - ETA: 2:24:36 - loss: 0.0874 - accuracy: 0.9723

 242/1563 [===>..........................] - ETA: 2:24:28 - loss: 0.0871 - accuracy: 0.9724

 243/1563 [===>..........................] - ETA: 2:24:20 - loss: 0.0868 - accuracy: 0.9725

 244/1563 [===>..........................] - ETA: 2:24:13 - loss: 0.0864 - accuracy: 0.9726

 245/1563 [===>..........................] - ETA: 2:24:04 - loss: 0.0861 - accuracy: 0.9727

 246/1563 [===>..........................] - ETA: 2:23:59 - loss: 0.0858 - accuracy: 0.9728

 247/1563 [===>..........................] - ETA: 2:23:51 - loss: 0.0856 - accuracy: 0.9729

 248/1563 [===>..........................] - ETA: 2:23:43 - loss: 0.0854 - accuracy: 0.9730

 249/1563 [===>..........................] - ETA: 2:23:34 - loss: 0.0851 - accuracy: 0.9731

 250/1563 [===>..........................] - ETA: 2:23:26 - loss: 0.0848 - accuracy: 0.9732

 251/1563 [===>..........................] - ETA: 2:23:21 - loss: 0.0845 - accuracy: 0.9734

 252/1563 [===>..........................] - ETA: 2:23:14 - loss: 0.0842 - accuracy: 0.9735

 253/1563 [===>..........................] - ETA: 2:23:05 - loss: 0.0839 - accuracy: 0.9736

 254/1563 [===>..........................] - ETA: 2:22:57 - loss: 0.0836 - accuracy: 0.9737

 255/1563 [===>..........................] - ETA: 2:22:49 - loss: 0.0833 - accuracy: 0.9738

 256/1563 [===>..........................] - ETA: 2:22:43 - loss: 0.0833 - accuracy: 0.9736

 257/1563 [===>..........................] - ETA: 2:22:35 - loss: 0.0830 - accuracy: 0.9737

 258/1563 [===>..........................] - ETA: 2:22:27 - loss: 0.0827 - accuracy: 0.9738

 259/1563 [===>..........................] - ETA: 2:22:19 - loss: 0.0830 - accuracy: 0.9737

 260/1563 [===>..........................] - ETA: 2:22:11 - loss: 0.0828 - accuracy: 0.9738

 261/1563 [====>.........................] - ETA: 2:22:04 - loss: 0.0836 - accuracy: 0.9737

 262/1563 [====>.........................] - ETA: 2:21:57 - loss: 0.0833 - accuracy: 0.9738

 263/1563 [====>.........................] - ETA: 2:21:49 - loss: 0.0830 - accuracy: 0.9739

 264/1563 [====>.........................] - ETA: 2:21:41 - loss: 0.0828 - accuracy: 0.9740

 265/1563 [====>.........................] - ETA: 2:21:33 - loss: 0.0825 - accuracy: 0.9741

 266/1563 [====>.........................] - ETA: 2:21:26 - loss: 0.0824 - accuracy: 0.9739

 267/1563 [====>.........................] - ETA: 2:21:20 - loss: 0.0821 - accuracy: 0.9740

 268/1563 [====>.........................] - ETA: 2:21:12 - loss: 0.0823 - accuracy: 0.9739

 269/1563 [====>.........................] - ETA: 2:21:03 - loss: 0.0821 - accuracy: 0.9740

 270/1563 [====>.........................] - ETA: 2:20:56 - loss: 0.0824 - accuracy: 0.9736

 271/1563 [====>.........................] - ETA: 2:20:48 - loss: 0.0822 - accuracy: 0.9737

 272/1563 [====>.........................] - ETA: 2:20:42 - loss: 0.0822 - accuracy: 0.9736

 273/1563 [====>.........................] - ETA: 2:20:34 - loss: 0.0820 - accuracy: 0.9737

 274/1563 [====>.........................] - ETA: 2:20:25 - loss: 0.0824 - accuracy: 0.9735

 275/1563 [====>.........................] - ETA: 2:20:18 - loss: 0.0822 - accuracy: 0.9736

 276/1563 [====>.........................] - ETA: 2:20:11 - loss: 0.0819 - accuracy: 0.9737

 277/1563 [====>.........................] - ETA: 2:20:05 - loss: 0.0817 - accuracy: 0.9738

 278/1563 [====>.........................] - ETA: 2:19:57 - loss: 0.0820 - accuracy: 0.9735

 279/1563 [====>.........................] - ETA: 2:19:50 - loss: 0.0818 - accuracy: 0.9736

 280/1563 [====>.........................] - ETA: 2:19:42 - loss: 0.0815 - accuracy: 0.9737

 281/1563 [====>.........................] - ETA: 2:19:35 - loss: 0.0820 - accuracy: 0.9735

 282/1563 [====>.........................] - ETA: 2:19:29 - loss: 0.0826 - accuracy: 0.9734

 283/1563 [====>.........................] - ETA: 2:19:21 - loss: 0.0830 - accuracy: 0.9733

 284/1563 [====>.........................] - ETA: 2:19:13 - loss: 0.0827 - accuracy: 0.9734

 285/1563 [====>.........................] - ETA: 2:19:06 - loss: 0.0825 - accuracy: 0.9735

 286/1563 [====>.........................] - ETA: 2:18:59 - loss: 0.0823 - accuracy: 0.9736

 287/1563 [====>.........................] - ETA: 2:18:54 - loss: 0.0824 - accuracy: 0.9734

 288/1563 [====>.........................] - ETA: 2:18:46 - loss: 0.0822 - accuracy: 0.9735

 289/1563 [====>.........................] - ETA: 2:18:39 - loss: 0.0821 - accuracy: 0.9736

 290/1563 [====>.........................] - ETA: 2:18:32 - loss: 0.0819 - accuracy: 0.9737

 291/1563 [====>.........................] - ETA: 2:18:26 - loss: 0.0821 - accuracy: 0.9736

 292/1563 [====>.........................] - ETA: 2:18:21 - loss: 0.0823 - accuracy: 0.9735

 293/1563 [====>.........................] - ETA: 2:18:14 - loss: 0.0828 - accuracy: 0.9733

 294/1563 [====>.........................] - ETA: 2:18:07 - loss: 0.0828 - accuracy: 0.9732

 295/1563 [====>.........................] - ETA: 2:18:00 - loss: 0.0827 - accuracy: 0.9733

 296/1563 [====>.........................] - ETA: 2:17:53 - loss: 0.0825 - accuracy: 0.9734

 297/1563 [====>.........................] - ETA: 2:17:49 - loss: 0.0823 - accuracy: 0.9735

 298/1563 [====>.........................] - ETA: 2:17:42 - loss: 0.0837 - accuracy: 0.9732

 299/1563 [====>.........................] - ETA: 2:17:34 - loss: 0.0849 - accuracy: 0.9728

 300/1563 [====>.........................] - ETA: 2:17:27 - loss: 0.0846 - accuracy: 0.9729

 301/1563 [====>.........................] - ETA: 2:17:21 - loss: 0.0844 - accuracy: 0.9730

 302/1563 [====>.........................] - ETA: 2:17:16 - loss: 0.0843 - accuracy: 0.9731

 303/1563 [====>.........................] - ETA: 2:17:08 - loss: 0.0842 - accuracy: 0.9732

 304/1563 [====>.........................] - ETA: 2:17:01 - loss: 0.0847 - accuracy: 0.9731

 305/1563 [====>.........................] - ETA: 2:16:54 - loss: 0.0846 - accuracy: 0.9732

 306/1563 [====>.........................] - ETA: 2:16:48 - loss: 0.0844 - accuracy: 0.9732

 307/1563 [====>.........................] - ETA: 2:16:43 - loss: 0.0842 - accuracy: 0.9733

 308/1563 [====>.........................] - ETA: 2:16:36 - loss: 0.0841 - accuracy: 0.9734

 309/1563 [====>.........................] - ETA: 2:16:29 - loss: 0.0840 - accuracy: 0.9733

 310/1563 [====>.........................] - ETA: 2:16:22 - loss: 0.0838 - accuracy: 0.9734

 311/1563 [====>.........................] - ETA: 2:16:15 - loss: 0.0840 - accuracy: 0.9733

 312/1563 [====>.........................] - ETA: 2:16:10 - loss: 0.0840 - accuracy: 0.9734

 313/1563 [=====>........................] - ETA: 2:16:02 - loss: 0.0839 - accuracy: 0.9734

 314/1563 [=====>........................] - ETA: 2:15:55 - loss: 0.0839 - accuracy: 0.9733

 315/1563 [=====>........................] - ETA: 2:15:48 - loss: 0.0837 - accuracy: 0.9734

 316/1563 [=====>........................] - ETA: 2:15:41 - loss: 0.0844 - accuracy: 0.9733

 317/1563 [=====>........................] - ETA: 2:15:36 - loss: 0.0843 - accuracy: 0.9732

 318/1563 [=====>........................] - ETA: 2:15:29 - loss: 0.0843 - accuracy: 0.9733

 319/1563 [=====>........................] - ETA: 2:15:22 - loss: 0.0845 - accuracy: 0.9732

 320/1563 [=====>........................] - ETA: 2:15:15 - loss: 0.0843 - accuracy: 0.9732

 321/1563 [=====>........................] - ETA: 2:15:08 - loss: 0.0842 - accuracy: 0.9733

 322/1563 [=====>........................] - ETA: 2:15:03 - loss: 0.0839 - accuracy: 0.9734

 323/1563 [=====>........................] - ETA: 2:14:56 - loss: 0.0843 - accuracy: 0.9731

 324/1563 [=====>........................] - ETA: 2:14:48 - loss: 0.0844 - accuracy: 0.9728

 325/1563 [=====>........................] - ETA: 2:14:41 - loss: 0.0856 - accuracy: 0.9727

 326/1563 [=====>........................] - ETA: 2:14:34 - loss: 0.0854 - accuracy: 0.9728

 327/1563 [=====>........................] - ETA: 2:14:28 - loss: 0.0856 - accuracy: 0.9727

 328/1563 [=====>........................] - ETA: 2:14:21 - loss: 0.0855 - accuracy: 0.9728

 329/1563 [=====>........................] - ETA: 2:14:13 - loss: 0.0852 - accuracy: 0.9728

 330/1563 [=====>........................] - ETA: 2:14:05 - loss: 0.0851 - accuracy: 0.9729

 331/1563 [=====>........................] - ETA: 2:13:57 - loss: 0.0850 - accuracy: 0.9730

 332/1563 [=====>........................] - ETA: 2:13:50 - loss: 0.0848 - accuracy: 0.9731

 333/1563 [=====>........................] - ETA: 2:13:44 - loss: 0.0847 - accuracy: 0.9732

 334/1563 [=====>........................] - ETA: 2:13:36 - loss: 0.0845 - accuracy: 0.9732

 335/1563 [=====>........................] - ETA: 2:13:28 - loss: 0.0843 - accuracy: 0.9733

 336/1563 [=====>........................] - ETA: 2:13:21 - loss: 0.0843 - accuracy: 0.9734

 337/1563 [=====>........................] - ETA: 2:13:13 - loss: 0.0843 - accuracy: 0.9735

 338/1563 [=====>........................] - ETA: 2:13:07 - loss: 0.0847 - accuracy: 0.9734

 339/1563 [=====>........................] - ETA: 2:12:59 - loss: 0.0849 - accuracy: 0.9733

 340/1563 [=====>........................] - ETA: 2:12:51 - loss: 0.0847 - accuracy: 0.9733

 341/1563 [=====>........................] - ETA: 2:12:44 - loss: 0.0848 - accuracy: 0.9732

 342/1563 [=====>........................] - ETA: 2:12:37 - loss: 0.0847 - accuracy: 0.9733

 343/1563 [=====>........................] - ETA: 2:12:31 - loss: 0.0857 - accuracy: 0.9730

 344/1563 [=====>........................] - ETA: 2:12:23 - loss: 0.0860 - accuracy: 0.9729

 345/1563 [=====>........................] - ETA: 2:12:18 - loss: 0.0862 - accuracy: 0.9728

 346/1563 [=====>........................] - ETA: 2:12:12 - loss: 0.0861 - accuracy: 0.9729

 347/1563 [=====>........................] - ETA: 2:12:05 - loss: 0.0865 - accuracy: 0.9728

 348/1563 [=====>........................] - ETA: 2:12:01 - loss: 0.0862 - accuracy: 0.9729

 349/1563 [=====>........................] - ETA: 2:11:54 - loss: 0.0861 - accuracy: 0.9730

 350/1563 [=====>........................] - ETA: 2:11:47 - loss: 0.0862 - accuracy: 0.9729

 351/1563 [=====>........................] - ETA: 2:11:40 - loss: 0.0861 - accuracy: 0.9729

 352/1563 [=====>........................] - ETA: 2:11:32 - loss: 0.0868 - accuracy: 0.9725

 353/1563 [=====>........................] - ETA: 2:11:29 - loss: 0.0866 - accuracy: 0.9726

 354/1563 [=====>........................] - ETA: 2:11:23 - loss: 0.0865 - accuracy: 0.9726

 355/1563 [=====>........................] - ETA: 2:11:17 - loss: 0.0865 - accuracy: 0.9725

 356/1563 [=====>........................] - ETA: 2:11:10 - loss: 0.0864 - accuracy: 0.9726

 357/1563 [=====>........................] - ETA: 2:11:04 - loss: 0.0865 - accuracy: 0.9725

 358/1563 [=====>........................] - ETA: 2:11:00 - loss: 0.0865 - accuracy: 0.9724

 359/1563 [=====>........................] - ETA: 2:10:53 - loss: 0.0864 - accuracy: 0.9725

 360/1563 [=====>........................] - ETA: 2:10:46 - loss: 0.0862 - accuracy: 0.9726

 361/1563 [=====>........................] - ETA: 2:10:41 - loss: 0.0863 - accuracy: 0.9725

 362/1563 [=====>........................] - ETA: 2:10:35 - loss: 0.0862 - accuracy: 0.9725

 363/1563 [=====>........................] - ETA: 2:10:30 - loss: 0.0861 - accuracy: 0.9726

 364/1563 [=====>........................] - ETA: 2:10:24 - loss: 0.0859 - accuracy: 0.9727
































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































Epoch 3: ReduceLROnPlateau reducing learning rate to 3.999999898951501e-06.




Evaluating model on test set: imdb/AdamW_BERT/OptimA...
