# Notebook for both CNNs and Convolution + Machine Learning

## Importing Libraries

In [None]:
import numpy as np
import cv2
import albumentations as A
import torch
from pathlib import Path
import json
from sklearn.preprocessing import LabelEncoder
from tqdm import tqdm
import pandas as pd
from sklearn.metrics import accuracy_score, f1_score, recall_score, precision_score

# Mounting Drive
from google.colab import drive
drive.mount('/content/drive')

  check_for_updates()


Mounted at /content/drive


## Dataset Preparation

This code copies `traffic_signs_dataset.zip` from the TKPR221 folder in Google Drive and unzips it into the Colab workspace, which makes loading the data into the model much faster.

If the block below is wrapped in triple quotes (''') in your copy, delete them to make it run.

In [None]:
import shutil
from pathlib import Path
def extract_drive_dataset(
    zip_path='/content/drive/MyDrive/TKPR221/traffic_signs_dataset.zip',
    extract_path='/content/dataset'
):
    """
    Copy ZIP from Drive to local disk, extract it and return the dataset folder.

    The archive is first copied into a temporary directory (removed
    automatically, even when extraction fails) and then unpacked into
    ``extract_path``.

    Args:
        zip_path: Location of the dataset archive.
        extract_path: Directory the archive is unpacked into (created if missing).

    Returns:
        str: ``<extract_path>/crops`` when that directory exists after
        extraction; otherwise the directory that contains the shallowest
        ``dataset.csv`` found below ``extract_path``.

    Raises:
        FileNotFoundError: If ``zip_path`` does not exist, or if neither a
            ``crops`` directory nor any ``dataset.csv`` is found after extraction.
        RuntimeError: If the archive could not be copied to the temporary directory.
    """
    import tempfile  # local import: only this helper needs it

    zip_path = Path(zip_path)
    if not zip_path.exists():
        raise FileNotFoundError(f"ZIP file not found at: {zip_path}")

    # The temporary directory (and the copied ZIP inside it) is deleted when
    # the `with` block exits, whether or not extraction succeeded.
    with tempfile.TemporaryDirectory() as temp_dir:
        temp_zip = Path(temp_dir) / 'dataset.zip'

        # Copy ZIP to local disk
        print(f"\nCopying ZIP from Drive to Colab...")
        print(f"Source: {zip_path}")
        print(f"Destination: {temp_zip}")
        shutil.copy2(zip_path, temp_zip)

        # Verify copy
        if temp_zip.exists():
            zip_size = temp_zip.stat().st_size / (1024 * 1024)  # Size in MB
            print(f"ZIP copied successfully! Size: {zip_size:.2f} MB")
        else:
            raise RuntimeError("Failed to copy ZIP file")

        # Create extraction directory
        extract_dir = Path(extract_path)
        extract_dir.mkdir(parents=True, exist_ok=True)

        # Extract ZIP
        print(f"\nExtracting ZIP to: {extract_dir}")
        print("This might take a while...")
        shutil.unpack_archive(str(temp_zip), str(extract_dir))

        print("\nCleaning up temporary files...")

    # Verify extraction
    crops_dir = extract_dir / 'crops'
    csv_file = crops_dir / 'dataset.csv'

    print("\nVerifying extracted files:")
    print(f"Crops directory exists: {crops_dir.exists()}")
    print(f"Dataset CSV exists: {csv_file.exists()}")

    if not crops_dir.exists():
        # The archive does not use a top-level `crops/` folder. Locate the
        # dataset by its CSV instead of returning a path that does not exist.
        candidates = sorted(
            extract_dir.rglob('dataset.csv'),
            key=lambda path: (len(path.parts), str(path)),
        )
        if not candidates:
            raise FileNotFoundError(
                f"No 'crops' directory or 'dataset.csv' found under: {extract_dir}"
            )
        csv_file = candidates[0]
        crops_dir = csv_file.parent
        print(f"Dataset root detected at: {crops_dir}")

    batch_folders = sorted(crops_dir.glob('batch_*'))
    print(f"Number of batch folders found: {len(batch_folders)}")

    # Count the images once per folder and reuse the numbers below
    image_counts = [len(list(folder.glob('*.jpg'))) for folder in batch_folders]
    print(f"Total number of images found: {sum(image_counts)}")

    # Print folder structure
    print("\nFolder structure:")
    print(f"└── {crops_dir.name}/")
    print(f"    ├── dataset.csv")
    for i, (batch, n_images) in enumerate(zip(batch_folders, image_counts)):
        is_last = i == len(batch_folders) - 1
        prefix = "    └── " if is_last else "    ├── "
        print(f"{prefix}{batch.name}/ ({n_images} images)")

    return str(crops_dir)

# Usage: run the extraction and report either the resulting folder or the error
try:
    dataset_dir = extract_drive_dataset()
except Exception as e:
    print(f"Error: {str(e)}")
else:
    print(f"\nDataset extracted successfully to: {dataset_dir}")


Copying ZIP from Drive to Colab...
Source: /content/drive/MyDrive/TKPR221/traffic_signs_dataset.zip
Destination: /content/temp/dataset.zip
ZIP copied successfully! Size: 126.81 MB

Extracting ZIP to: /content/dataset
This might take a while...

Cleaning up temporary files...

Verifying extracted files:
Crops directory exists: False
Dataset CSV exists: False

Dataset extracted successfully to: /content/dataset/crops


This code defines a custom PyTorch dataset. A custom PyTorch dataset allows us to:


1.   Batch train sklearn models.
2.   Apply augmentations to the data.
3.   Add more customizations if needed.



In [None]:
# Custom dataset class for batch loading and transformations
class TrafficSignDataset(torch.utils.data.Dataset):
    """Dataset that loads images listed in a DataFrame and encodes their labels.

    Each item is produced by: reading the image with OpenCV, applying the
    optional albumentations pipeline, optionally resizing with padding to a
    square, optionally moving channels first, optionally flattening, and
    finally converting to a tensor (``tensor=True``) or to a float32 array
    divided by 255 (``tensor=False``).

    Args:
        image_dir: Directory that the ``filename`` column is relative to.
        csv: DataFrame with ``filename`` and ``label`` columns. It is copied,
            so the caller's frame is never modified.
        transformations: Callable invoked as ``transformations(image=image)``
            that returns a dict with an ``'image'`` entry, or None.
        size: Side length passed to ``resize_with_pad``; None disables resizing.
        flatten: If True, the image is flattened to 1-D.
        label_encoder: Encoder whose ``transform`` is applied to the labels.
            When None, a new ``LabelEncoder`` is fitted on ``csv['label']``.
        reorder: If True, convert (H, W, C) images to (C, H, W).
        tensor: If True, return ``torch`` tensors instead of numpy values.
    """

    def __init__(self, image_dir, csv, transformations=None, size=None, flatten=False, label_encoder=None,reorder=False,tensor=False):
        self.image_dir = Path(image_dir)
        # Work on a private copy: encoding the labels in the caller's frame
        # would make a second construction from the same frame see integers.
        self.csv = csv.copy()
        self.transformations = transformations
        self.size = size
        self.flatten = flatten
        self.reorder = reorder
        self.tensor = tensor

        if label_encoder is None:
            self.label_encoder = LabelEncoder()
            self.csv['label'] = self.label_encoder.fit_transform(self.csv['label'])
        else:
            self.label_encoder = label_encoder
            self.csv['label'] = self.label_encoder.transform(self.csv['label'])

        # Store labels for class weights
        self.labels = self.csv['label'].values

    def __len__(self):
        """Return the number of rows (images) in the dataset."""
        return len(self.csv)

    def __getitem__(self, idx):
        """Load, transform and return ``(image, label)`` for row ``idx``.

        Raises:
            FileNotFoundError: If OpenCV cannot read the image file.
        """
        # Get image data and load the image
        image_data = self.csv.iloc[idx]
        image_path = f"{self.image_dir}/{image_data['filename']}"
        image = cv2.imread(image_path)
        if image is None:
            # cv2.imread signals failure by returning None instead of raising
            raise FileNotFoundError(f"Could not read image: {image_path}")
        # NOTE(review): cv2.imread returns BGR channel order; confirm that the
        # normalisation / pretrained weights used downstream expect that order.

        # Apply transformations (using albumentations)
        if self.transformations:
            transformed = self.transformations(image=image)
            image = transformed['image']
        if self.size is not None:
            image = self.resize_with_pad(image, (self.size, self.size))
        if self.reorder:
            image = self.rearrange(image)
        if self.flatten:
            image = image.flatten()

        if self.tensor:
            # No /255 scaling on this path; any scaling must come from `transformations`
            image = torch.from_numpy(image).float()
            image_label = torch.tensor(image_data['label'],dtype=torch.long)
        else:
            image = image.astype(np.float32) / 255.0
            image_label = image_data['label']
        return image, image_label

    def transform(self, image):
        """Apply the configured pipeline to ``image`` and return the image.

        Returns ``image`` unchanged when no pipeline is configured.
        """
        if self.transformations is None:
            return image
        # The pipeline is called with a keyword argument and returns a dict,
        # mirroring how __getitem__ uses it.
        return self.transformations(image=image)['image']


    def resize_with_pad(self,image: np.array,
                    new_shape: tuple[int, int],
                    padding_color: tuple[int, ...] = (0, 0, 0)) -> np.array:

        ## COPIED FROM : https://gist.github.com/IdeaKing/11cf5e146d23c5bb219ba3508cca89ec
        """Maintains aspect ratio and resizes with padding.
        Params:
            image: Image to be resized.
            new_shape: Expected (width, height) of new image.
            padding_color: Tuple in BGR of padding color
        Returns:
            image: Resized image with padding
        """
        original_shape = (image.shape[1], image.shape[0])
        ratio = float(max(new_shape))/max(original_shape)
        # Clamp to 1 pixel: very elongated crops would otherwise round a side
        # down to 0, which cv2.resize rejects.
        new_size = tuple([max(1, int(x*ratio)) for x in original_shape])
        image = cv2.resize(image, new_size)
        delta_w = new_shape[0] - new_size[0]
        delta_h = new_shape[1] - new_size[1]
        top, bottom = delta_h//2, delta_h-(delta_h//2)
        left, right = delta_w//2, delta_w-(delta_w//2)
        image = cv2.copyMakeBorder(image, top, bottom, left, right, cv2.BORDER_CONSTANT, value=padding_color)
        return image

    # Some helper functions for partial_fit in sklearn
    def get_label_encoded_classes(self):
        """Return the encoded value of every class known to the label encoder."""
        classes = self.label_encoder.classes_
        encoded_classes = self.label_encoder.transform(classes)
        return encoded_classes

    def rearrange(self,image):
        """Convert a channels-last (H, W, C) array to channels-first (C, H, W).

        The previous axis mapping produced (C, W, H), i.e. it also swapped the
        two spatial axes.
        """
        return np.transpose(image, (2, 0, 1))


## Modeling

### CNN MODEL:



In [None]:
import torch.nn as nn
import torch.nn.functional as F

class CNN(nn.Module):
    """Three-block convolutional classifier with a three-layer dense head.

    Each convolutional block is Conv2d(3x3, padding=1) -> BatchNorm2d ->
    LeakyReLU -> MaxPool2d(2) -> Dropout(0.4). The three poolings halve the
    spatial size three times, so the flattened feature length is
    ``128 * (input_size // 8) ** 2``.

    Args:
        n_classes: Number of output logits.
        return_convolution: If True, ``forward`` returns the flattened
            convolutional features instead of class logits.
        input_size: Side length of the (square) input images. Defaults to 224,
            which reproduces the original ``128 * 28 * 28`` feature length.

    Raises:
        ValueError: If ``input_size`` is smaller than 8 (the feature map would
            be empty after three poolings).
    """

    def __init__(self, n_classes, return_convolution=False, input_size=224):
        super().__init__()
        if input_size < 8:
            raise ValueError(f"input_size must be at least 8, got {input_size}")
        self.return_convolution = return_convolution
        self.conv1 = nn.Conv2d(in_channels=3, out_channels=32, kernel_size=3, stride=1, padding=1)
        self.batchnorm1 = nn.BatchNorm2d(32)
        self.conv2 = nn.Conv2d(in_channels=32, out_channels=64, kernel_size=3, stride=1, padding=1)
        self.batchnorm2 = nn.BatchNorm2d(64)
        self.conv3 = nn.Conv2d(in_channels=64, out_channels=128, kernel_size=3, stride=1, padding=1)
        self.batchnorm3 = nn.BatchNorm2d(128)
        self.pooling = nn.MaxPool2d(kernel_size=2, stride=2)
        # Convolutions keep the spatial size (padding=1); each pooling halves it
        feature_map_size = input_size // 8
        self.fc1 = nn.Linear(128 * feature_map_size * feature_map_size, 256)
        self.fc2 = nn.Linear(256, 128)
        self.fc3 = nn.Linear(128, n_classes)
        self.dropout = nn.Dropout(0.4)

    def forward(self, x):
        """Return logits, or flattened conv features if ``return_convolution``."""
        x = self.pooling(F.leaky_relu(self.batchnorm1(self.conv1(x))))
        x = self.dropout(x)
        x = self.pooling(F.leaky_relu(self.batchnorm2(self.conv2(x))))
        x = self.dropout(x)
        x = self.pooling(F.leaky_relu(self.batchnorm3(self.conv3(x))))
        x = self.dropout(x)

        x = x.view(x.size(0), -1)  # Flatten

        if self.return_convolution:
            return x

        x = self.dropout(F.leaky_relu(self.fc1(x)))
        x = self.dropout(F.leaky_relu(self.fc2(x)))
        x = self.fc3(x)
        return x

In [None]:
import torchvision.models as models
from torchvision import transforms

class TrafficSignResNet(nn.Module):
    """torchvision ResNet backbone with a custom three-layer classification head.

    Args:
        num_classes: Number of output logits.
        model_name: Name of the torchvision ResNet constructor to use; one of
            ``SUPPORTED_BACKBONES``.
        pretrained: If True, load ImageNet weights and freeze all but the last
            30 parameter tensors of the original network. If False, the
            backbone is randomly initialised and left fully trainable.

    Raises:
        ValueError: If ``model_name`` is not a supported backbone.
    """

    SUPPORTED_BACKBONES = ('resnet18', 'resnet34', 'resnet50', 'resnet101', 'resnet152')

    def __init__(self, num_classes, model_name='resnet50', pretrained=True):
        super().__init__()
        if model_name not in self.SUPPORTED_BACKBONES:
            raise ValueError(
                f"Unsupported model_name {model_name!r}; "
                f"expected one of {self.SUPPORTED_BACKBONES}"
            )

        if not pretrained:
            weights = None
        elif model_name == 'resnet50':
            # Keep the exact weights the notebook has always used for ResNet50
            weights = models.ResNet50_Weights.IMAGENET1K_V2
        else:
            weights = 'DEFAULT'
        self.backbone = getattr(models, model_name)(weights=weights)

        if pretrained:
            # Freeze early layers. The slice is taken before the head is
            # replaced, so it counts the original fc weight and bias among
            # the 30 tensors that stay trainable.
            for param in list(self.backbone.parameters())[:-30]:
                param.requires_grad = False

        in_features = self.backbone.fc.in_features
        self.backbone.fc = nn.Sequential(
            nn.Linear(in_features, 1024),
            nn.BatchNorm1d(1024),
            nn.ReLU(),
            nn.Dropout(0.3),
            nn.Linear(1024, 512),
            nn.BatchNorm1d(512),
            nn.ReLU(),
            nn.Dropout(0.3),
            nn.Linear(512, num_classes)
        )

    def forward(self, x):
        """Run the backbone (including the custom head) and return logits."""
        return self.backbone(x)

In [None]:
!pip install neptune

Collecting neptune
  Downloading neptune-1.13.0-py3-none-any.whl.metadata (16 kB)
Collecting boto3>=1.28.0 (from neptune)
  Downloading boto3-1.35.90-py3-none-any.whl.metadata (6.7 kB)
Collecting bravado<12.0.0,>=11.0.0 (from neptune)
  Downloading bravado-11.0.3-py2.py3-none-any.whl.metadata (5.9 kB)
Collecting swagger-spec-validator>=2.7.4 (from neptune)
  Downloading swagger_spec_validator-3.0.4-py2.py3-none-any.whl.metadata (2.5 kB)
Collecting botocore<1.36.0,>=1.35.90 (from boto3>=1.28.0->neptune)
  Downloading botocore-1.35.90-py3-none-any.whl.metadata (5.7 kB)
Collecting jmespath<2.0.0,>=0.7.1 (from boto3>=1.28.0->neptune)
  Downloading jmespath-1.0.1-py3-none-any.whl.metadata (7.6 kB)
Collecting s3transfer<0.11.0,>=0.10.0 (from boto3>=1.28.0->neptune)
  Downloading s3transfer-0.10.4-py3-none-any.whl.metadata (1.7 kB)
Collecting bravado-core>=5.16.1 (from bravado<12.0.0,>=11.0.0->neptune)
  Downloading bravado-core-6.1.1.tar.gz (63 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━

In [None]:
!rm -rf /content/dataset/traffic_signs_dataset/synthetic_images

In [None]:
import pandas as pd
import numpy as np
import cv2
from pathlib import Path
from imblearn.over_sampling import SMOTE

# Set these paths from google drive
# You need to set the TKPR folder as your favourite to see in the colab
crops_dir = "/content/dataset/traffic_signs_dataset/"
dataset_csv = "/content/dataset/traffic_signs_dataset/dataset.csv"
df = pd.read_csv(dataset_csv)

# Get class counts and find biggest classes
class_counts = df['label'].value_counts()
print("Original class distribution:")
print(class_counts)

# Cap every class at `samples_per_class` rows; smaller classes are kept whole.
# The pieces are collected in a list and concatenated once, instead of
# re-copying a growing DataFrame on every iteration.
samples_per_class = 1200
capped_parts = []
for label in class_counts.index:
    class_samples = df[df['label'] == label]
    if len(class_samples) > samples_per_class:
        class_samples = class_samples.sample(n=samples_per_class, random_state=42)
    capped_parts.append(class_samples)
df_filtered = pd.concat(capped_parts) if capped_parts else pd.DataFrame()

# Create directory for synthetic images
synthetic_dir = Path(crops_dir) / "synthetic_images"
synthetic_dir.mkdir(exist_ok=True)

# Load every selected image as a flattened 32x32x3 vector (the SMOTE feature space)
image_data = []
paths = []
labels = []

for _, row in df_filtered.iterrows():
    img_path = Path(crops_dir) / row['filename']
    img = cv2.imread(str(img_path))
    if img is None:
        # cv2.imread returns None on failure; fail here with the offending path
        raise FileNotFoundError(f"Could not read image: {img_path}")
    img = cv2.resize(img, (32, 32))
    image_data.append(img.flatten())
    paths.append(row['filename'])
    labels.append(row['label'])

X = np.array(image_data)
y = np.array(labels)

# SMOTE interpolates between a sample and its k nearest same-class neighbours,
# so a class needs at least k_neighbors + 1 samples to be oversampled.
k_neighbors = 5
min_samples = k_neighbors + 1
unique_labels, label_counts = np.unique(y, return_counts=True)
valid_labels = [label for label, count in zip(unique_labels, label_counts) if count >= min_samples]

# Filter data to only include classes with sufficient samples
mask = np.isin(y, valid_labels)
X = X[mask]
y = y[mask]
filtered_paths = np.array(paths)[mask]

# NOTE(review): X holds uint8 pixels here; confirm that the installed
# imbalanced-learn version interpolates without uint8 wrap-around.
# NOTE(review): oversampling happens before the train/val/test split, so
# synthetic samples in the validation/test sets may be interpolated from
# training images; confirm this is acceptable for the reported metrics.
smote = SMOTE(
    sampling_strategy={label: samples_per_class for label in valid_labels},
    k_neighbors=k_neighbors,
    random_state=42,
)
X_resampled, y_resampled = smote.fit_resample(X, y)

# Save original and synthetic images.
# The first len(filtered_paths) rows are treated as the original samples and
# everything after them as synthetic.
all_new_paths = []
all_new_labels = []

for i, (img_array, label) in enumerate(zip(X_resampled, y_resampled)):
    if i < len(filtered_paths):  # Original image
        all_new_paths.append(filtered_paths[i])
    else:  # Synthetic image
        img = img_array.reshape(32, 32, 3).astype(np.uint8)
        synthetic_path = f"synthetic_images/synthetic_{label}_{i}.jpg"
        target_path = Path(crops_dir) / synthetic_path
        if not cv2.imwrite(str(target_path), img):
            # cv2.imwrite reports failure through its return value
            raise IOError(f"Could not write synthetic image: {target_path}")
        all_new_paths.append(synthetic_path)
    all_new_labels.append(label)

# Create balanced dataframe
df_balanced = pd.DataFrame({
    'filename': all_new_paths,
    'label': all_new_labels
})

print("\nBalanced class distribution:")
print(df_balanced['label'].value_counts())
print(f"\nSynthetic images saved to: {synthetic_dir}")

# Use the balanced dataframe for further processing
df_filtered = df_balanced.copy()


Original class distribution:
label
other-sign                                               39121
regulatory--yield--g1                                      827
information--pedestrians-crossing--g1                      685
regulatory--no-entry--g1                                   600
complementary--chevron-right--g1                           531
                                                         ...  
regulatory--turning-vehicles-yield-to-pedestrians--g1        2
regulatory--roundabout--g2                                   2
regulatory--end-of-maximum-speed-limit-70--g1                2
regulatory--dual-lanes-turn-right-or-straight--g1            1
Name: count, Length: 399, dtype: int64





Balanced class distribution:
label
regulatory--end-of-maximum-speed-limit-30--g2    1200
other-sign                                       1200
regulatory--yield--g1                            1200
information--pedestrians-crossing--g1            1200
regulatory--no-entry--g1                         1200
                                                 ... 
regulatory--one-way-straight--g1                 1200
regulatory--keep-right--g4                       1200
regulatory--no-parking--g5                       1200
regulatory--height-limit--g1                     1200
Name: count, Length: 368, dtype: int64

Synthetic images saved to: /content/dataset/traffic_signs_dataset/synthetic_images


Splitting the balanced data into training, validation and test sets; the dataset instances and dataloaders are created in the cells that follow.

In [None]:
# Split the data into training and testing sets
from sklearn.model_selection import train_test_split

# Fixed seed so that re-running the notebook reproduces the same splits
split_seed = 42

# Split into train and test sets (80-20 split)
train_df, test_df = train_test_split(
    df_filtered, test_size=0.2, stratify=df_filtered['label'], random_state=split_seed
)

# Further split training data into train and validation (80-20 split of training data),
# i.e. 64% / 16% / 20% of the balanced data overall
train_df, val_df = train_test_split(
    train_df, test_size=0.2, stratify=train_df['label'], random_state=split_seed
)

print("Dataset splits:")
print(f"Training samples: {len(train_df)}")
print(f"Validation samples: {len(val_df)}")
print(f"Testing samples: {len(test_df)}")

# Verify class distribution in splits
print("\nClass distribution in training set:")
print(train_df['label'].value_counts())
print("\nClass distribution in validation set:")
print(val_df['label'].value_counts())
print("\nClass distribution in test set:")
print(test_df['label'].value_counts())


Dataset splits:
Training samples: 282624
Validation samples: 70656
Testing samples: 88320

Class distribution in training set:
label
regulatory--keep-left--g1                         768
regulatory--no-parking-or-no-stopping--g1         768
regulatory--maximum-speed-limit-65--g2            768
                                                 ... 
regulatory--dual-lanes-turn-left-no-u-turn--g1    768
information--pedestrians-crossing--g1             768
complementary--turn-right--g2                     768
regulatory--end-of-buses-only--g1                 768
Name: count, Length: 368, dtype: int64

Class distribution in validation set:
label
regulatory--no-left-turn--g2                192
regulatory--maximum-speed-limit-45--g3      192
regulatory--go-straight-or-turn-left--g1    192
                                           ... 
regulatory--turn-left-ahead--g1             192
regulatory--no-stopping--g2                 192
other-sign                                  192
information--te

In [None]:
from torch.utils.data import random_split
import neptune
from sklearn.linear_model import SGDClassifier
import time
from sklearn.metrics import accuracy_score, f1_score, recall_score, precision_score
import torch
import torch.nn as nn
import torch.optim as optim

# Hyperparameters
n_epochs = 10
batch_size = 128
# NOTE(review): the three fractions below are not used by this cell; the
# split cell uses its own test_size=0.2 values. Confirm whether they are
# still needed.
train_size = 0.8
val_size = 0.1
test_size = 0.1
image_size = 224

# Training-time augmentation followed by normalisation
train_transform = A.Compose([
    A.RandomBrightnessContrast(p=0.2),
    A.HorizontalFlip(p=0.5),
    A.Rotate(limit=10, p=0.3),
    A.Normalize()
])

# Validation/test: normalisation only
val_transform = A.Compose([
    A.Normalize()
])


def _build_dataset(frame, transformations, label_encoder=None):
    """Create a channels-first tensor dataset of `image_size` square images.

    The frame is copied so that label encoding never touches the split
    DataFrames, which keeps this cell safe to re-run.
    """
    return TrafficSignDataset(
        crops_dir,
        frame.copy(),
        transformations=transformations,
        flatten=False,
        reorder=True,
        tensor=True,
        size=image_size,
        label_encoder=label_encoder
    )


# The label encoder is fitted on the training split and reused for the others
train_dataset = _build_dataset(train_df, train_transform)
val_dataset = _build_dataset(val_df, val_transform, label_encoder=train_dataset.label_encoder)
test_dataset = _build_dataset(test_df, val_transform, label_encoder=train_dataset.label_encoder)


Getting the device (for training on GPU), and creating the data loaders, model, optimizer and loss objects.

In [None]:
# Set device
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
print(f"Using device: {device}")

from sklearn.utils.class_weight import compute_class_weight

# Settings shared by all three loaders. Pinned memory is only requested when
# batches are actually going to be copied to a GPU.
loader_kwargs = dict(
    batch_size=batch_size,
    pin_memory=(device.type == 'cuda'),
    num_workers=4
)

# Create data loaders
# The training loader is shuffled so each epoch sees the samples in a new order
train_loader = torch.utils.data.DataLoader(
    train_dataset,
    shuffle=True,
    **loader_kwargs
)

val_loader = torch.utils.data.DataLoader(
    val_dataset,
    shuffle=False,
    **loader_kwargs
)

test_loader = torch.utils.data.DataLoader(
    test_dataset,
    shuffle=False,
    **loader_kwargs
)

# One output logit per class known to the training label encoder
n_classes = len(train_dataset.label_encoder.classes_)
model = TrafficSignResNet(n_classes).to(device)

optimizer = torch.optim.AdamW(
    model.parameters(),
    lr=0.001,
    betas=(0.9, 0.999),
    eps=1e-8,
    weight_decay=0.0001
)
criterion = nn.CrossEntropyLoss().to(device)



Using device: cuda


Downloading: "https://download.pytorch.org/models/resnet50-11ad3fa6.pth" to /root/.cache/torch/hub/checkpoints/resnet50-11ad3fa6.pth
100%|██████████| 97.8M/97.8M [00:00<00:00, 224MB/s]


Initializing Neptune run for the experiment tracking.

You can change the run structure.

In [None]:
import os

# SECURITY: the API token is read from the NEPTUNE_API_TOKEN environment
# variable instead of being stored in the notebook. The token that used to be
# hard-coded here has been exposed and should be revoked.
run_name = f"CNN_Synthetic{time.strftime('%Y%m%d_%H%M%S')}"
run = neptune.init_run(
    project="muguryalcin/TKPR221",
    api_token=os.environ.get("NEPTUNE_API_TOKEN"),
    name=run_name,
    description="CNN model for traffic sign classification",
    tags=["CNN", "Custom Architecture", "Synthetic Data"]
)

# Optimizer settings are read from the live optimizer so the logged values
# cannot drift from what is actually used for training.
_optimizer_group = optimizer.param_groups[0]

# Log the hyperparameters
run["hyperparameters"] = {
    "n_epochs": n_epochs,
    # Model Architecture Parameters (mirrors the CNN class defined in this notebook)
    "model": {
        "type": "Custom CNN",
        "architecture": [
            "Conv2d(3, 32, 3, padding=1)",
            "BatchNorm2d(32)",
            "MaxPool2d(2, 2)",
            "Dropout(0.4)",
            "Conv2d(32, 64, 3, padding=1)",
            "BatchNorm2d(64)",
            "MaxPool2d(2, 2)",
            "Dropout(0.4)",
            "Conv2d(64, 128, 3, padding=1)",
            "BatchNorm2d(128)",
            "MaxPool2d(2, 2)",
            "Dropout(0.4)",
            "Linear(128 * 28 * 28, 256)",
            "Dropout(0.4)",
            "Linear(256, 128)",
            "Dropout(0.4)",
            "Linear(128, n_classes)"
        ]
    },
    # Optimizer Parameters
    "optimizer": {
        "type": "AdamW",
        "learning_rate": _optimizer_group["lr"],
        "weight_decay": _optimizer_group["weight_decay"]
    },
    # Loss Function
    "loss": {
        "type": "CrossEntropyLoss"
    },
    # Dataset Specific Parameters
    "dataset": {
        "batch_size": batch_size,
        "num_workers": 4,
        "pin_memory": True
    }
}


[neptune] [info   ] Neptune initialized. Open in the app: https://app.neptune.ai/muguryalcin/TKPR221/e/TKPR-192


In [None]:
import os

# The API token comes from the NEPTUNE_API_TOKEN environment variable, so no
# credential is stored in the notebook.
# NOTE(review): if the CNN run cell above was executed, its `run` object is
# replaced here without being stopped; run only one of the two cells.
run_name = f"ResNet_Synthetic{time.strftime('%Y%m%d_%H%M%S')}"
run = neptune.init_run(
    project="muguryalcin/TKPR221",
    api_token=os.environ.get("NEPTUNE_API_TOKEN"),
    name=run_name,
    description="ResNet50 model for traffic sign classification",
    tags=["ResNet50", "Transfer Learning","Synthetic Data"]
)

# Optimizer settings are read from the live optimizer so the logged values
# match what is actually used for training.
_optimizer_group = optimizer.param_groups[0]

# The values below mirror TrafficSignResNet, the transforms and the data
# loaders defined earlier in this notebook.
run["hyperparameters"] = {
    "n_epochs": n_epochs,
    "model": {
        "type": "ResNet50",
        "pretrained": True,
        "backbone": "resnet50",
        "fc_layers": [
            {"in_features": 2048, "out_features": 1024},
            {"in_features": 1024, "out_features": 512},
            {"in_features": 512, "out_features": n_classes}
        ],
        "dropout_rates": [0.3, 0.3]
    },
    "optimizer": {
        "type": "AdamW",
        "learning_rate": _optimizer_group["lr"],
        "weight_decay": _optimizer_group["weight_decay"]
    },
    "loss": {
        "type": "CrossEntropyLoss"
    },
    "dataset": {
        "batch_size": batch_size,
        "num_workers": 4,
        "image_size": image_size,  # ResNet standard input size is 224
        "normalization": {
            "mean": [0.485, 0.456, 0.406],
            "std": [0.229, 0.224, 0.225]
        },
        "augmentations": {
            "train": ["RandomBrightnessContrast", "HorizontalFlip", "Rotate", "Normalize", "ResizeWithPad"],
            "val": ["Normalize", "ResizeWithPad"]
        }
    },
    "lr_scheduler": {
        "type": "ReduceLROnPlateau",
        "mode": "min",
        "factor": 0.1,
        "patience": 3
    }
}


[neptune] [info   ] Neptune initialized. Open in the app: https://app.neptune.ai/muguryalcin/TKPR221/e/TKPR-193


Training loop of the CNN.

In [None]:
# Early Stopping
best_val_loss = float('inf')
best_epoch = None  # epoch index of the checkpoint stored at model_save_path, if any
patience = 3
patience_counter = 0

# LR Scheduler (the deprecated `verbose` flag is not used; the learning rate
# is printed after every scheduler step instead).
# NOTE(review): the scheduler patience equals the early-stopping patience, so
# training may stop before the learning rate is ever reduced.
scheduler = torch.optim.lr_scheduler.ReduceLROnPlateau(optimizer, mode='min', factor=0.1, patience=3)

# Mixed precision is only enabled on CUDA; on CPU the scaler and autocast are no-ops
use_amp = device.type == 'cuda'
scaler = torch.amp.GradScaler('cuda', enabled=use_amp)

model_save_path = f'/content/drive/MyDrive/TKPR221/models/{run_name}.pth'
Path(model_save_path).parent.mkdir(parents=True, exist_ok=True)


def _classification_metrics(true_labels, predictions):
    """Return accuracy and weighted F1 / precision / recall as a dict."""
    return {
        "accuracy": accuracy_score(true_labels, predictions),
        "f1": f1_score(true_labels, predictions, average='weighted'),
        "precision": precision_score(true_labels, predictions, average='weighted'),
        "recall": recall_score(true_labels, predictions, average='weighted'),
    }


def _report(split, title, loss_value, metrics):
    """Append the loss and metrics to the Neptune run under `split/` and print them."""
    run[f"{split}/loss"].append(loss_value)
    for metric_name, metric_value in metrics.items():
        run[f"{split}/{metric_name}"].append(metric_value)
    print(f"\n{title}")
    print(f"Loss: {loss_value:.4f}")
    print(f"Accuracy: {metrics['accuracy']:.4f}")
    print(f"F1 Score: {metrics['f1']:.4f}")
    print(f"Precision: {metrics['precision']:.4f}")
    print(f"Recall: {metrics['recall']:.4f}")


def _evaluate(loader, desc):
    """Run `model` over `loader` without gradients.

    Returns the mean batch loss, the predicted class indices and the true labels.
    """
    model.eval()
    total_loss = 0
    predictions = []
    true_labels = []
    with torch.no_grad():
        for images, batch_labels in tqdm(loader, desc=desc, leave=False):
            images = images.to(device)
            batch_labels = batch_labels.to(device)
            outputs = model(images)
            total_loss += criterion(outputs, batch_labels).item()
            predictions.extend(outputs.argmax(dim=1).cpu().numpy())
            true_labels.extend(batch_labels.cpu().numpy())
    return total_loss / len(loader), predictions, true_labels


for epoch in tqdm(range(n_epochs), desc="Training epochs"):
    # Train
    model.train()
    train_loss = 0
    train_preds = []
    train_labels = []
    print(f"\nStarting epoch {epoch+1}/{n_epochs}")
    for i, (images, batch_labels) in enumerate(tqdm(train_loader, desc=f"Epoch {epoch+1}/{n_epochs}", leave=False)):
        images = images.to(device)
        batch_labels = batch_labels.to(device)
        optimizer.zero_grad()

        with torch.autocast(device_type=device.type, enabled=use_amp):
            outputs = model(images)
            loss = criterion(outputs, batch_labels)

        scaler.scale(loss).backward()
        scaler.step(optimizer)
        scaler.update()

        train_loss += loss.item()

        train_preds.extend(outputs.argmax(dim=1).cpu().numpy())
        train_labels.extend(batch_labels.cpu().numpy())

        if i % 25 == 0:
            # Running metrics over every batch seen so far in this epoch
            batch_accuracy = accuracy_score(train_labels, train_preds)
            batch_f1 = f1_score(train_labels, train_preds, average='weighted')
            print(f"Batch {i}: Training loss = {loss.item():.4f}, Training accuracy = {batch_accuracy:.4f}, F1 = {batch_f1:.4f}")

    # Train metrics
    avg_train_loss = train_loss / len(train_loader)
    _report(
        "training",
        f"Epoch {epoch+1} Training Metrics:",
        avg_train_loss,
        _classification_metrics(train_labels, train_preds),
    )

    # Validation
    print("\nStarting validation...")
    avg_val_loss, val_preds, val_labels = _evaluate(val_loader, "Validation")
    _report(
        "validation",
        f"Epoch {epoch+1} Validation Metrics:",
        avg_val_loss,
        _classification_metrics(val_labels, val_preds),
    )

    scheduler.step(avg_val_loss)
    print(f"Learning rate: {optimizer.param_groups[0]['lr']:.6g}")

    # Looking for early stopping
    if avg_val_loss < best_val_loss:
        best_val_loss = avg_val_loss
        best_epoch = epoch
        patience_counter = 0
        # Checkpoint the best model seen so far
        torch.save({
            'epoch': epoch,
            'model_state_dict': model.state_dict(),
            'optimizer_state_dict': optimizer.state_dict(),
            'val_loss': avg_val_loss,
        }, model_save_path)
    else:
        patience_counter += 1
        if patience_counter >= patience:
            print(f"Stopped {epoch + 1} epochs")
            break

# Restore the best checkpoint for testing. The final-epoch weights are NOT
# written over it: after early stopping they come from epochs whose
# validation loss was worse than the checkpointed one.
if best_epoch is None:
    # No epoch ever improved on the initial loss (e.g. NaN losses), so there
    # is no checkpoint yet; store the current weights instead.
    print("Saving the model...")
    torch.save({
        'model_state_dict': model.state_dict(),
        'optimizer_state_dict': optimizer.state_dict(),
    }, model_save_path)
    print(f"Model saved to {model_save_path}")
else:
    checkpoint = torch.load(model_save_path, map_location=device)
    model.load_state_dict(checkpoint['model_state_dict'])
    print(f"Loaded best model (epoch {best_epoch + 1}, val_loss {best_val_loss:.4f}) from {model_save_path}")

# Testing
print("\nStarting final testing...")
avg_test_loss, test_preds, test_labels = _evaluate(test_loader, "Testing")
test_metrics = _classification_metrics(test_labels, test_preds)
test_accuracy = test_metrics["accuracy"]
test_f1 = test_metrics["f1"]
test_precision = test_metrics["precision"]
test_recall = test_metrics["recall"]
# Log and print test metrics (uses .append, like the training/validation series)
_report("test", "Final Test Metrics:", avg_test_loss, test_metrics)

run.stop()


  scaler = torch.cuda.amp.GradScaler()
Training epochs:   0%|          | 0/10 [00:00<?, ?it/s]


Starting epoch 1/10



  with torch.cuda.amp.autocast():

  with torch.cuda.amp.autocast():

Epoch 1/10:   0%|          | 3/2208 [00:02<19:50,  1.85it/s]  [A

Batch 0: Training loss = 6.0214, Training accuracy = 0.0078, F1 = 0.0104



Epoch 1/10:   0%|          | 5/2208 [00:02<10:38,  3.45it/s][A
Epoch 1/10:   0%|          | 8/2208 [00:02<05:58,  6.14it/s][A
Epoch 1/10:   0%|          | 11/2208 [00:02<04:08,  8.84it/s][A
Epoch 1/10:   1%|          | 14/2208 [00:02<03:13, 11.35it/s][A
Epoch 1/10:   1%|          | 16/2208 [00:02<02:53, 12.62it/s][A
Epoch 1/10:   1%|          | 18/2208 [00:02<02:53, 12.64it/s][A
Epoch 1/10:   1%|          | 20/2208 [00:02<02:41, 13.59it/s][A
Epoch 1/10:   1%|          | 22/2208 [00:03<02:28, 14.76it/s][A
Epoch 1/10:   1%|          | 24/2208 [00:03<02:29, 14.63it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:   1%|▏         | 29/2208 [00:03<02:05, 17.32it/s][A

Batch 25: Training loss = 5.6347, Training accuracy = 0.0120, F1 = 0.0058



Epoch 1/10:   1%|▏         | 31/2208 [00:03<02:22, 15.29it/s][A
Epoch 1/10:   2%|▏         | 34/2208 [00:03<02:08, 16.96it/s][A
Epoch 1/10:   2%|▏         | 37/2208 [00:03<01:58, 18.29it/s][A
Epoch 1/10:   2%|▏         | 40/2208 [00:04<01:53, 19.05it/s][A
Epoch 1/10:   2%|▏         | 43/2208 [00:04<01:49, 19.69it/s][A
Epoch 1/10:   2%|▏         | 46/2208 [00:04<01:49, 19.79it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:   2%|▏         | 52/2208 [00:04<01:54, 18.76it/s][A

Batch 50: Training loss = 4.9013, Training accuracy = 0.0234, F1 = 0.0166



Epoch 1/10:   2%|▏         | 55/2208 [00:04<01:50, 19.52it/s][A
Epoch 1/10:   3%|▎         | 57/2208 [00:04<01:52, 19.18it/s][A
Epoch 1/10:   3%|▎         | 60/2208 [00:05<01:48, 19.76it/s][A
Epoch 1/10:   3%|▎         | 63/2208 [00:05<01:45, 20.31it/s][A
Epoch 1/10:   3%|▎         | 66/2208 [00:05<01:44, 20.59it/s][A
Epoch 1/10:   3%|▎         | 69/2208 [00:05<01:43, 20.72it/s][A
Epoch 1/10:   3%|▎         | 72/2208 [00:05<01:43, 20.60it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:   4%|▎         | 78/2208 [00:05<01:58, 17.98it/s][A

Batch 75: Training loss = 4.3765, Training accuracy = 0.0372, F1 = 0.0292



Epoch 1/10:   4%|▎         | 81/2208 [00:06<01:52, 18.94it/s][A
Epoch 1/10:   4%|▍         | 84/2208 [00:06<01:51, 19.02it/s][A
Epoch 1/10:   4%|▍         | 87/2208 [00:06<01:47, 19.71it/s][A
Epoch 1/10:   4%|▍         | 90/2208 [00:06<01:53, 18.64it/s][A
Epoch 1/10:   4%|▍         | 93/2208 [00:06<01:48, 19.45it/s][A
Epoch 1/10:   4%|▍         | 96/2208 [00:06<01:48, 19.48it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:   5%|▍         | 102/2208 [00:07<01:48, 19.46it/s][A
Epoch 1/10:   5%|▍         | 104/2208 [00:07<01:50, 19.08it/s][A

Batch 100: Training loss = 3.7685, Training accuracy = 0.0552, F1 = 0.0476



Epoch 1/10:   5%|▍         | 107/2208 [00:07<01:46, 19.81it/s][A
Epoch 1/10:   5%|▍         | 110/2208 [00:07<01:44, 20.13it/s][A
Epoch 1/10:   5%|▌         | 113/2208 [00:07<01:41, 20.58it/s][A
Epoch 1/10:   5%|▌         | 116/2208 [00:07<01:42, 20.36it/s][A
Epoch 1/10:   5%|▌         | 119/2208 [00:08<01:41, 20.53it/s][A
Epoch 1/10:   6%|▌         | 122/2208 [00:08<01:41, 20.65it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:   6%|▌         | 128/2208 [00:08<01:44, 19.89it/s][A

Batch 125: Training loss = 3.4180, Training accuracy = 0.0765, F1 = 0.0674



Epoch 1/10:   6%|▌         | 131/2208 [00:08<01:42, 20.33it/s][A
Epoch 1/10:   6%|▌         | 134/2208 [00:08<01:40, 20.56it/s][A
Epoch 1/10:   6%|▌         | 137/2208 [00:08<01:39, 20.73it/s][A
Epoch 1/10:   6%|▋         | 140/2208 [00:09<01:38, 20.89it/s][A
Epoch 1/10:   6%|▋         | 143/2208 [00:09<01:38, 21.00it/s][A
Epoch 1/10:   7%|▋         | 146/2208 [00:09<01:37, 21.15it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:   7%|▋         | 152/2208 [00:09<01:49, 18.81it/s][A
Epoch 1/10:   7%|▋         | 155/2208 [00:09<01:45, 19.50it/s][A

Batch 150: Training loss = 3.2287, Training accuracy = 0.0963, F1 = 0.0872



Epoch 1/10:   7%|▋         | 158/2208 [00:09<01:42, 19.94it/s][A
Epoch 1/10:   7%|▋         | 161/2208 [00:10<01:41, 20.22it/s][A
Epoch 1/10:   7%|▋         | 164/2208 [00:10<01:39, 20.61it/s][A
Epoch 1/10:   8%|▊         | 167/2208 [00:10<01:37, 20.89it/s][A
Epoch 1/10:   8%|▊         | 170/2208 [00:10<01:37, 20.94it/s][A
Epoch 1/10:   8%|▊         | 173/2208 [00:10<01:36, 21.05it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:   8%|▊         | 179/2208 [00:10<01:40, 20.13it/s][A

Batch 175: Training loss = 2.8488, Training accuracy = 0.1167, F1 = 0.1082



Epoch 1/10:   8%|▊         | 182/2208 [00:11<01:38, 20.53it/s][A
Epoch 1/10:   8%|▊         | 185/2208 [00:11<01:37, 20.78it/s][A
Epoch 1/10:   9%|▊         | 188/2208 [00:11<01:36, 20.88it/s][A
Epoch 1/10:   9%|▊         | 191/2208 [00:11<01:36, 21.01it/s][A
Epoch 1/10:   9%|▉         | 194/2208 [00:11<01:36, 20.98it/s][A
Epoch 1/10:   9%|▉         | 197/2208 [00:11<01:35, 21.04it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:   9%|▉         | 203/2208 [00:12<01:42, 19.53it/s][A

Batch 200: Training loss = 2.6006, Training accuracy = 0.1370, F1 = 0.1294



Epoch 1/10:   9%|▉         | 206/2208 [00:12<01:39, 20.12it/s][A
Epoch 1/10:   9%|▉         | 209/2208 [00:12<01:37, 20.48it/s][A
Epoch 1/10:  10%|▉         | 212/2208 [00:12<01:36, 20.77it/s][A
Epoch 1/10:  10%|▉         | 215/2208 [00:12<01:34, 21.03it/s][A
Epoch 1/10:  10%|▉         | 218/2208 [00:12<01:34, 21.04it/s][A
Epoch 1/10:  10%|█         | 221/2208 [00:12<01:34, 21.13it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  10%|█         | 227/2208 [00:13<01:42, 19.34it/s][A
Epoch 1/10:  10%|█         | 230/2208 [00:13<01:39, 19.93it/s][A

Batch 225: Training loss = 2.3595, Training accuracy = 0.1572, F1 = 0.1504



Epoch 1/10:  11%|█         | 233/2208 [00:13<01:37, 20.32it/s][A
Epoch 1/10:  11%|█         | 236/2208 [00:13<01:35, 20.57it/s][A
Epoch 1/10:  11%|█         | 239/2208 [00:13<01:34, 20.79it/s][A
Epoch 1/10:  11%|█         | 242/2208 [00:14<01:34, 20.90it/s][A
Epoch 1/10:  11%|█         | 245/2208 [00:14<01:34, 20.88it/s][A
Epoch 1/10:  11%|█         | 248/2208 [00:14<01:33, 20.88it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  12%|█▏        | 254/2208 [00:14<01:45, 18.48it/s][A

Batch 250: Training loss = 2.6083, Training accuracy = 0.1778, F1 = 0.1713



Epoch 1/10:  12%|█▏        | 257/2208 [00:14<01:41, 19.28it/s][A
Epoch 1/10:  12%|█▏        | 260/2208 [00:14<01:38, 19.79it/s][A
Epoch 1/10:  12%|█▏        | 263/2208 [00:15<01:37, 20.02it/s][A
Epoch 1/10:  12%|█▏        | 266/2208 [00:15<01:39, 19.50it/s][A
Epoch 1/10:  12%|█▏        | 268/2208 [00:15<01:39, 19.59it/s][A
Epoch 1/10:  12%|█▏        | 271/2208 [00:15<01:36, 20.13it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  13%|█▎        | 277/2208 [00:15<01:45, 18.32it/s][A
Epoch 1/10:  13%|█▎        | 279/2208 [00:15<01:45, 18.24it/s][A

Batch 275: Training loss = 2.0224, Training accuracy = 0.1979, F1 = 0.1919



Epoch 1/10:  13%|█▎        | 282/2208 [00:16<01:41, 19.04it/s][A
Epoch 1/10:  13%|█▎        | 284/2208 [00:16<01:46, 18.10it/s][A
Epoch 1/10:  13%|█▎        | 286/2208 [00:16<01:43, 18.49it/s][A
Epoch 1/10:  13%|█▎        | 289/2208 [00:16<01:39, 19.38it/s][A
Epoch 1/10:  13%|█▎        | 291/2208 [00:16<01:49, 17.45it/s][A
Epoch 1/10:  13%|█▎        | 294/2208 [00:16<01:42, 18.68it/s][A
Epoch 1/10:  13%|█▎        | 296/2208 [00:16<01:44, 18.37it/s][A
Epoch 1/10:  14%|█▎        | 299/2208 [00:17<01:41, 18.81it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  14%|█▍        | 304/2208 [00:17<01:43, 18.37it/s][A

Batch 300: Training loss = 1.8745, Training accuracy = 0.2166, F1 = 0.2111



Epoch 1/10:  14%|█▍        | 307/2208 [00:17<01:38, 19.26it/s][A
Epoch 1/10:  14%|█▍        | 310/2208 [00:17<01:36, 19.73it/s][A
Epoch 1/10:  14%|█▍        | 313/2208 [00:17<01:33, 20.18it/s][A
Epoch 1/10:  14%|█▍        | 316/2208 [00:17<01:43, 18.28it/s][A
Epoch 1/10:  14%|█▍        | 319/2208 [00:18<01:38, 19.09it/s][A
Epoch 1/10:  15%|█▍        | 322/2208 [00:18<01:35, 19.74it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  15%|█▍        | 327/2208 [00:18<01:52, 16.73it/s][A
Epoch 1/10:  15%|█▍        | 330/2208 [00:18<01:45, 17.85it/s][A

Batch 325: Training loss = 1.8646, Training accuracy = 0.2345, F1 = 0.2291



Epoch 1/10:  15%|█▌        | 333/2208 [00:18<01:39, 18.83it/s][A
Epoch 1/10:  15%|█▌        | 336/2208 [00:19<01:35, 19.51it/s][A
Epoch 1/10:  15%|█▌        | 339/2208 [00:19<01:32, 20.15it/s][A
Epoch 1/10:  15%|█▌        | 342/2208 [00:19<01:30, 20.57it/s][A
Epoch 1/10:  16%|█▌        | 345/2208 [00:19<01:29, 20.71it/s][A
Epoch 1/10:  16%|█▌        | 348/2208 [00:19<01:29, 20.78it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  16%|█▌        | 353/2208 [00:19<01:44, 17.70it/s]

Batch 350: Training loss = 1.6510, Training accuracy = 0.2518, F1 = 0.2466


[A
Epoch 1/10:  16%|█▌        | 355/2208 [00:20<02:04, 14.86it/s][A
Epoch 1/10:  16%|█▌        | 358/2208 [00:20<01:51, 16.58it/s][A
Epoch 1/10:  16%|█▋        | 361/2208 [00:20<01:43, 17.87it/s][A
Epoch 1/10:  16%|█▋        | 364/2208 [00:20<01:37, 18.99it/s][A
Epoch 1/10:  17%|█▋        | 367/2208 [00:20<01:33, 19.60it/s][A
Epoch 1/10:  17%|█▋        | 370/2208 [00:20<01:31, 20.01it/s][A
Epoch 1/10:  17%|█▋        | 373/2208 [00:20<01:29, 20.49it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  17%|█▋        | 379/2208 [00:21<01:35, 19.15it/s][A

Batch 375: Training loss = 1.8767, Training accuracy = 0.2691, F1 = 0.2643



Epoch 1/10:  17%|█▋        | 382/2208 [00:21<01:32, 19.72it/s][A
Epoch 1/10:  17%|█▋        | 385/2208 [00:21<01:30, 20.19it/s][A
Epoch 1/10:  18%|█▊        | 388/2208 [00:21<01:28, 20.46it/s][A
Epoch 1/10:  18%|█▊        | 391/2208 [00:21<01:28, 20.64it/s][A
Epoch 1/10:  18%|█▊        | 394/2208 [00:22<01:27, 20.66it/s][A
Epoch 1/10:  18%|█▊        | 397/2208 [00:22<01:26, 21.00it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  18%|█▊        | 403/2208 [00:22<01:37, 18.47it/s][A

Batch 400: Training loss = 1.3959, Training accuracy = 0.2853, F1 = 0.2807



Epoch 1/10:  18%|█▊        | 406/2208 [00:22<01:33, 19.22it/s][A
Epoch 1/10:  19%|█▊        | 409/2208 [00:22<01:30, 19.93it/s][A
Epoch 1/10:  19%|█▊        | 412/2208 [00:22<01:28, 20.34it/s][A
Epoch 1/10:  19%|█▉        | 415/2208 [00:23<01:26, 20.69it/s][A
Epoch 1/10:  19%|█▉        | 418/2208 [00:23<01:25, 20.82it/s][A
Epoch 1/10:  19%|█▉        | 421/2208 [00:23<01:25, 21.02it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  19%|█▉        | 427/2208 [00:23<01:37, 18.20it/s][A
Epoch 1/10:  19%|█▉        | 430/2208 [00:23<01:33, 19.11it/s][A

Batch 425: Training loss = 1.4386, Training accuracy = 0.3001, F1 = 0.2956



Epoch 1/10:  20%|█▉        | 433/2208 [00:23<01:29, 19.73it/s][A
Epoch 1/10:  20%|█▉        | 436/2208 [00:24<01:28, 20.01it/s][A
Epoch 1/10:  20%|█▉        | 439/2208 [00:24<01:26, 20.41it/s][A
Epoch 1/10:  20%|██        | 442/2208 [00:24<01:25, 20.63it/s][A
Epoch 1/10:  20%|██        | 445/2208 [00:24<01:24, 20.89it/s][A
Epoch 1/10:  20%|██        | 448/2208 [00:24<01:23, 21.02it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  21%|██        | 454/2208 [00:25<01:32, 18.90it/s][A

Batch 450: Training loss = 1.5786, Training accuracy = 0.3148, F1 = 0.3103



Epoch 1/10:  21%|██        | 457/2208 [00:25<01:29, 19.63it/s][A
Epoch 1/10:  21%|██        | 460/2208 [00:25<01:26, 20.19it/s][A
Epoch 1/10:  21%|██        | 463/2208 [00:25<01:24, 20.55it/s][A
Epoch 1/10:  21%|██        | 466/2208 [00:25<01:23, 20.93it/s][A
Epoch 1/10:  21%|██        | 469/2208 [00:25<01:22, 21.08it/s][A
Epoch 1/10:  21%|██▏       | 472/2208 [00:25<01:22, 21.12it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  22%|██▏       | 478/2208 [00:26<01:35, 18.16it/s][A

Batch 475: Training loss = 1.3194, Training accuracy = 0.3281, F1 = 0.3236



Epoch 1/10:  22%|██▏       | 481/2208 [00:26<01:30, 19.09it/s][A
Epoch 1/10:  22%|██▏       | 484/2208 [00:26<01:27, 19.73it/s][A
Epoch 1/10:  22%|██▏       | 487/2208 [00:26<01:25, 20.19it/s][A
Epoch 1/10:  22%|██▏       | 490/2208 [00:26<01:23, 20.56it/s][A
Epoch 1/10:  22%|██▏       | 493/2208 [00:26<01:22, 20.74it/s][A
Epoch 1/10:  22%|██▏       | 496/2208 [00:27<01:22, 20.84it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  23%|██▎       | 502/2208 [00:27<01:35, 17.79it/s][A
Epoch 1/10:  23%|██▎       | 505/2208 [00:27<01:30, 18.79it/s][A

Batch 500: Training loss = 1.3103, Training accuracy = 0.3417, F1 = 0.3374



Epoch 1/10:  23%|██▎       | 508/2208 [00:27<01:27, 19.47it/s][A
Epoch 1/10:  23%|██▎       | 511/2208 [00:27<01:25, 19.84it/s][A
Epoch 1/10:  23%|██▎       | 514/2208 [00:28<01:23, 20.29it/s][A
Epoch 1/10:  23%|██▎       | 517/2208 [00:28<01:21, 20.68it/s][A
Epoch 1/10:  24%|██▎       | 520/2208 [00:28<01:21, 20.70it/s][A
Epoch 1/10:  24%|██▎       | 523/2208 [00:28<01:20, 20.87it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  24%|██▍       | 529/2208 [00:28<01:33, 17.97it/s][A

Batch 525: Training loss = 1.3374, Training accuracy = 0.3537, F1 = 0.3494



Epoch 1/10:  24%|██▍       | 532/2208 [00:28<01:28, 18.91it/s][A
Epoch 1/10:  24%|██▍       | 535/2208 [00:29<01:25, 19.66it/s][A
Epoch 1/10:  24%|██▍       | 538/2208 [00:29<01:22, 20.24it/s][A
Epoch 1/10:  25%|██▍       | 541/2208 [00:29<01:35, 17.37it/s][A
Epoch 1/10:  25%|██▍       | 544/2208 [00:29<01:30, 18.39it/s][A
Epoch 1/10:  25%|██▍       | 547/2208 [00:29<01:26, 19.12it/s][A
Epoch 1/10:  25%|██▍       | 549/2208 [00:29<01:26, 19.26it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  25%|██▌       | 553/2208 [00:30<01:47, 15.42it/s][A

Batch 550: Training loss = 1.3592, Training accuracy = 0.3663, F1 = 0.3622



Epoch 1/10:  25%|██▌       | 556/2208 [00:30<01:36, 17.18it/s][A
Epoch 1/10:  25%|██▌       | 559/2208 [00:30<01:29, 18.50it/s][A
Epoch 1/10:  25%|██▌       | 562/2208 [00:30<01:25, 19.16it/s][A
Epoch 1/10:  26%|██▌       | 565/2208 [00:30<01:23, 19.61it/s][A
Epoch 1/10:  26%|██▌       | 568/2208 [00:30<01:21, 20.21it/s][A
Epoch 1/10:  26%|██▌       | 571/2208 [00:31<01:20, 20.45it/s][A
Epoch 1/10:  26%|██▌       | 574/2208 [00:31<01:33, 17.43it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  26%|██▌       | 578/2208 [00:31<01:42, 15.87it/s][A

Batch 575: Training loss = 1.2400, Training accuracy = 0.3773, F1 = 0.3733



Epoch 1/10:  26%|██▋       | 581/2208 [00:31<01:33, 17.41it/s][A
Epoch 1/10:  26%|██▋       | 584/2208 [00:31<01:27, 18.51it/s][A
Epoch 1/10:  27%|██▋       | 586/2208 [00:31<01:27, 18.51it/s][A
Epoch 1/10:  27%|██▋       | 589/2208 [00:32<01:33, 17.36it/s][A
Epoch 1/10:  27%|██▋       | 591/2208 [00:32<01:30, 17.78it/s][A
Epoch 1/10:  27%|██▋       | 593/2208 [00:32<01:28, 18.30it/s][A
Epoch 1/10:  27%|██▋       | 596/2208 [00:32<01:23, 19.28it/s][A
Epoch 1/10:  27%|██▋       | 598/2208 [00:32<01:29, 17.93it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  27%|██▋       | 604/2208 [00:33<01:34, 16.95it/s][A

Batch 600: Training loss = 1.4516, Training accuracy = 0.3878, F1 = 0.3839



Epoch 1/10:  27%|██▋       | 606/2208 [00:33<01:31, 17.59it/s][A
Epoch 1/10:  28%|██▊       | 609/2208 [00:33<01:26, 18.54it/s][A
Epoch 1/10:  28%|██▊       | 612/2208 [00:33<01:22, 19.37it/s][A
Epoch 1/10:  28%|██▊       | 615/2208 [00:33<01:19, 19.93it/s][A
Epoch 1/10:  28%|██▊       | 618/2208 [00:33<01:18, 20.20it/s][A
Epoch 1/10:  28%|██▊       | 621/2208 [00:33<01:17, 20.57it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  28%|██▊       | 627/2208 [00:34<01:36, 16.35it/s][A
Epoch 1/10:  29%|██▊       | 630/2208 [00:34<01:29, 17.70it/s][A

Batch 625: Training loss = 1.2643, Training accuracy = 0.3972, F1 = 0.3934



Epoch 1/10:  29%|██▊       | 633/2208 [00:34<01:24, 18.66it/s][A
Epoch 1/10:  29%|██▉       | 636/2208 [00:34<01:21, 19.40it/s][A
Epoch 1/10:  29%|██▉       | 639/2208 [00:34<01:18, 20.00it/s][A
Epoch 1/10:  29%|██▉       | 642/2208 [00:34<01:16, 20.41it/s][A
Epoch 1/10:  29%|██▉       | 645/2208 [00:35<01:15, 20.80it/s][A
Epoch 1/10:  29%|██▉       | 648/2208 [00:35<01:14, 20.97it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  30%|██▉       | 654/2208 [00:35<01:25, 18.21it/s][A

Batch 650: Training loss = 1.0566, Training accuracy = 0.4069, F1 = 0.4031



Epoch 1/10:  30%|██▉       | 657/2208 [00:35<01:21, 19.11it/s][A
Epoch 1/10:  30%|██▉       | 660/2208 [00:35<01:18, 19.62it/s][A
Epoch 1/10:  30%|███       | 663/2208 [00:36<01:16, 20.12it/s][A
Epoch 1/10:  30%|███       | 666/2208 [00:36<01:15, 20.47it/s][A
Epoch 1/10:  30%|███       | 669/2208 [00:36<01:14, 20.72it/s][A
Epoch 1/10:  30%|███       | 672/2208 [00:36<01:13, 20.80it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  31%|███       | 678/2208 [00:36<01:30, 16.84it/s][A

Batch 675: Training loss = 1.2343, Training accuracy = 0.4161, F1 = 0.4124



Epoch 1/10:  31%|███       | 681/2208 [00:37<01:24, 17.99it/s][A
Epoch 1/10:  31%|███       | 684/2208 [00:37<01:20, 18.82it/s][A
Epoch 1/10:  31%|███       | 687/2208 [00:37<01:17, 19.58it/s][A
Epoch 1/10:  31%|███▏      | 690/2208 [00:37<01:15, 20.13it/s][A
Epoch 1/10:  31%|███▏      | 693/2208 [00:37<01:14, 20.47it/s][A
Epoch 1/10:  32%|███▏      | 696/2208 [00:37<01:13, 20.70it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  32%|███▏      | 702/2208 [00:38<01:29, 16.82it/s][A
Epoch 1/10:  32%|███▏      | 705/2208 [00:38<01:23, 18.05it/s][A

Batch 700: Training loss = 1.1480, Training accuracy = 0.4249, F1 = 0.4212



Epoch 1/10:  32%|███▏      | 708/2208 [00:38<01:19, 18.95it/s][A
Epoch 1/10:  32%|███▏      | 711/2208 [00:38<01:16, 19.48it/s][A
Epoch 1/10:  32%|███▏      | 714/2208 [00:38<01:14, 20.06it/s][A
Epoch 1/10:  32%|███▏      | 717/2208 [00:38<01:12, 20.43it/s][A
Epoch 1/10:  33%|███▎      | 720/2208 [00:38<01:11, 20.70it/s][A
Epoch 1/10:  33%|███▎      | 723/2208 [00:39<01:11, 20.77it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  33%|███▎      | 729/2208 [00:39<01:23, 17.81it/s][A

Batch 725: Training loss = 1.0979, Training accuracy = 0.4333, F1 = 0.4296



Epoch 1/10:  33%|███▎      | 732/2208 [00:39<01:18, 18.81it/s][A
Epoch 1/10:  33%|███▎      | 735/2208 [00:39<01:15, 19.45it/s][A
Epoch 1/10:  33%|███▎      | 738/2208 [00:39<01:13, 20.04it/s][A
Epoch 1/10:  34%|███▎      | 741/2208 [00:40<01:12, 20.31it/s][A
Epoch 1/10:  34%|███▎      | 744/2208 [00:40<01:11, 20.50it/s][A
Epoch 1/10:  34%|███▍      | 747/2208 [00:40<01:10, 20.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  34%|███▍      | 753/2208 [00:40<01:27, 16.66it/s][A

Batch 750: Training loss = 1.2042, Training accuracy = 0.4415, F1 = 0.4378



Epoch 1/10:  34%|███▍      | 756/2208 [00:40<01:21, 17.91it/s][A
Epoch 1/10:  34%|███▍      | 759/2208 [00:41<01:17, 18.82it/s][A
Epoch 1/10:  35%|███▍      | 762/2208 [00:41<01:14, 19.44it/s][A
Epoch 1/10:  35%|███▍      | 765/2208 [00:41<01:12, 19.88it/s][A
Epoch 1/10:  35%|███▍      | 768/2208 [00:41<01:10, 20.29it/s][A
Epoch 1/10:  35%|███▍      | 771/2208 [00:41<01:09, 20.56it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  35%|███▌      | 777/2208 [00:42<01:33, 15.30it/s][A
Epoch 1/10:  35%|███▌      | 780/2208 [00:42<01:24, 16.80it/s][A

Batch 775: Training loss = 0.9215, Training accuracy = 0.4492, F1 = 0.4455



Epoch 1/10:  35%|███▌      | 783/2208 [00:42<01:19, 17.98it/s][A
Epoch 1/10:  36%|███▌      | 786/2208 [00:42<01:15, 18.90it/s][A
Epoch 1/10:  36%|███▌      | 789/2208 [00:42<01:12, 19.48it/s][A
Epoch 1/10:  36%|███▌      | 792/2208 [00:42<01:10, 20.00it/s][A
Epoch 1/10:  36%|███▌      | 795/2208 [00:42<01:10, 20.07it/s][A
Epoch 1/10:  36%|███▌      | 798/2208 [00:43<01:09, 20.25it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  36%|███▋      | 804/2208 [00:43<01:21, 17.13it/s][A

Batch 800: Training loss = 0.8877, Training accuracy = 0.4563, F1 = 0.4526



Epoch 1/10:  37%|███▋      | 807/2208 [00:43<01:16, 18.24it/s][A
Epoch 1/10:  37%|███▋      | 810/2208 [00:43<01:13, 19.04it/s][A
Epoch 1/10:  37%|███▋      | 813/2208 [00:43<01:11, 19.55it/s][A
Epoch 1/10:  37%|███▋      | 816/2208 [00:44<01:09, 19.89it/s][A
Epoch 1/10:  37%|███▋      | 819/2208 [00:44<01:09, 19.98it/s][A
Epoch 1/10:  37%|███▋      | 822/2208 [00:44<01:17, 17.95it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  37%|███▋      | 827/2208 [00:44<01:40, 13.74it/s][A
Epoch 1/10:  38%|███▊      | 830/2208 [00:45<01:28, 15.56it/s][A

Batch 825: Training loss = 0.8990, Training accuracy = 0.4633, F1 = 0.4597



Epoch 1/10:  38%|███▊      | 833/2208 [00:45<01:20, 17.03it/s][A
Epoch 1/10:  38%|███▊      | 836/2208 [00:45<01:15, 18.17it/s][A
Epoch 1/10:  38%|███▊      | 839/2208 [00:45<01:12, 18.96it/s][A
Epoch 1/10:  38%|███▊      | 842/2208 [00:45<01:09, 19.64it/s][A
Epoch 1/10:  38%|███▊      | 845/2208 [00:45<01:07, 20.19it/s][A
Epoch 1/10:  38%|███▊      | 848/2208 [00:45<01:11, 19.12it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  39%|███▊      | 854/2208 [00:46<01:30, 14.93it/s][A

Batch 850: Training loss = 1.0226, Training accuracy = 0.4702, F1 = 0.4666



Epoch 1/10:  39%|███▉      | 857/2208 [00:46<01:22, 16.41it/s][A
Epoch 1/10:  39%|███▉      | 860/2208 [00:46<01:16, 17.58it/s][A
Epoch 1/10:  39%|███▉      | 863/2208 [00:46<01:12, 18.44it/s][A
Epoch 1/10:  39%|███▉      | 866/2208 [00:46<01:09, 19.18it/s][A
Epoch 1/10:  39%|███▉      | 869/2208 [00:47<01:07, 19.79it/s][A
Epoch 1/10:  39%|███▉      | 872/2208 [00:47<01:07, 19.90it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  40%|███▉      | 877/2208 [00:47<01:42, 13.00it/s][A
Epoch 1/10:  40%|███▉      | 880/2208 [00:47<01:28, 14.93it/s][A

Batch 875: Training loss = 0.9066, Training accuracy = 0.4766, F1 = 0.4730



Epoch 1/10:  40%|███▉      | 883/2208 [00:48<01:20, 16.42it/s][A
Epoch 1/10:  40%|████      | 886/2208 [00:48<01:14, 17.72it/s][A
Epoch 1/10:  40%|████      | 889/2208 [00:48<01:10, 18.59it/s][A
Epoch 1/10:  40%|████      | 892/2208 [00:48<01:08, 19.33it/s][A
Epoch 1/10:  41%|████      | 895/2208 [00:48<01:05, 19.92it/s][A
Epoch 1/10:  41%|████      | 898/2208 [00:48<01:04, 20.25it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  41%|████      | 904/2208 [00:49<01:16, 16.99it/s][A

Batch 900: Training loss = 0.9990, Training accuracy = 0.4833, F1 = 0.4797



Epoch 1/10:  41%|████      | 907/2208 [00:49<01:11, 18.23it/s][A
Epoch 1/10:  41%|████      | 910/2208 [00:49<01:08, 19.05it/s][A
Epoch 1/10:  41%|████▏     | 913/2208 [00:49<01:05, 19.68it/s][A
Epoch 1/10:  41%|████▏     | 916/2208 [00:49<01:03, 20.24it/s][A
Epoch 1/10:  42%|████▏     | 919/2208 [00:49<01:02, 20.62it/s][A
Epoch 1/10:  42%|████▏     | 922/2208 [00:50<01:01, 20.76it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  42%|████▏     | 928/2208 [00:50<01:22, 15.43it/s][A

Batch 925: Training loss = 0.7321, Training accuracy = 0.4893, F1 = 0.4857



Epoch 1/10:  42%|████▏     | 931/2208 [00:50<01:15, 16.86it/s][A
Epoch 1/10:  42%|████▏     | 934/2208 [00:50<01:10, 17.99it/s][A
Epoch 1/10:  42%|████▏     | 937/2208 [00:50<01:07, 18.95it/s][A
Epoch 1/10:  43%|████▎     | 940/2208 [00:51<01:05, 19.50it/s][A
Epoch 1/10:  43%|████▎     | 943/2208 [00:51<01:03, 20.01it/s][A
Epoch 1/10:  43%|████▎     | 946/2208 [00:51<01:01, 20.42it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  43%|████▎     | 952/2208 [00:51<01:21, 15.43it/s][A
Epoch 1/10:  43%|████▎     | 955/2208 [00:51<01:13, 16.96it/s][A

Batch 950: Training loss = 0.9178, Training accuracy = 0.4953, F1 = 0.4918



Epoch 1/10:  43%|████▎     | 958/2208 [00:52<01:09, 18.10it/s][A
Epoch 1/10:  44%|████▎     | 961/2208 [00:52<01:05, 19.07it/s][A
Epoch 1/10:  44%|████▎     | 964/2208 [00:52<01:03, 19.69it/s][A
Epoch 1/10:  44%|████▍     | 967/2208 [00:52<01:01, 20.06it/s][A
Epoch 1/10:  44%|████▍     | 970/2208 [00:52<01:00, 20.35it/s][A
Epoch 1/10:  44%|████▍     | 973/2208 [00:52<00:59, 20.78it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  44%|████▍     | 979/2208 [00:53<01:13, 16.65it/s][A

Batch 975: Training loss = 0.8161, Training accuracy = 0.5012, F1 = 0.4978



Epoch 1/10:  44%|████▍     | 982/2208 [00:53<01:08, 17.90it/s][A
Epoch 1/10:  45%|████▍     | 985/2208 [00:53<01:05, 18.70it/s][A
Epoch 1/10:  45%|████▍     | 988/2208 [00:53<01:02, 19.45it/s][A
Epoch 1/10:  45%|████▍     | 991/2208 [00:53<01:01, 19.88it/s][A
Epoch 1/10:  45%|████▌     | 994/2208 [00:53<00:59, 20.36it/s][A
Epoch 1/10:  45%|████▌     | 997/2208 [00:54<00:58, 20.64it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  45%|████▌     | 1003/2208 [00:54<01:24, 14.32it/s][A

Batch 1000: Training loss = 0.8432, Training accuracy = 0.5069, F1 = 0.5034



Epoch 1/10:  46%|████▌     | 1006/2208 [00:54<01:15, 15.93it/s][A
Epoch 1/10:  46%|████▌     | 1009/2208 [00:54<01:09, 17.27it/s][A
Epoch 1/10:  46%|████▌     | 1012/2208 [00:55<01:05, 18.38it/s][A
Epoch 1/10:  46%|████▌     | 1015/2208 [00:55<01:02, 19.13it/s][A
Epoch 1/10:  46%|████▌     | 1018/2208 [00:55<00:59, 19.90it/s][A
Epoch 1/10:  46%|████▌     | 1021/2208 [00:55<00:58, 20.30it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  47%|████▋     | 1027/2208 [00:55<01:20, 14.68it/s][A
Epoch 1/10:  47%|████▋     | 1030/2208 [00:56<01:12, 16.28it/s][A

Batch 1025: Training loss = 0.8746, Training accuracy = 0.5122, F1 = 0.5088



Epoch 1/10:  47%|████▋     | 1033/2208 [00:56<01:07, 17.39it/s][A
Epoch 1/10:  47%|████▋     | 1036/2208 [00:56<01:03, 18.41it/s][A
Epoch 1/10:  47%|████▋     | 1039/2208 [00:56<01:00, 19.27it/s][A
Epoch 1/10:  47%|████▋     | 1042/2208 [00:56<00:58, 19.89it/s][A
Epoch 1/10:  47%|████▋     | 1045/2208 [00:56<00:57, 20.18it/s][A
Epoch 1/10:  47%|████▋     | 1048/2208 [00:56<00:56, 20.49it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  48%|████▊     | 1054/2208 [00:57<01:10, 16.28it/s][A

Batch 1050: Training loss = 0.8614, Training accuracy = 0.5174, F1 = 0.5140



Epoch 1/10:  48%|████▊     | 1057/2208 [00:57<01:05, 17.53it/s][A
Epoch 1/10:  48%|████▊     | 1060/2208 [00:57<01:02, 18.44it/s][A
Epoch 1/10:  48%|████▊     | 1063/2208 [00:57<00:59, 19.22it/s][A
Epoch 1/10:  48%|████▊     | 1066/2208 [00:57<00:57, 19.77it/s][A
Epoch 1/10:  48%|████▊     | 1069/2208 [00:58<00:56, 20.12it/s][A
Epoch 1/10:  49%|████▊     | 1072/2208 [00:58<00:56, 20.27it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  49%|████▉     | 1078/2208 [00:58<01:22, 13.62it/s][A

Batch 1075: Training loss = 0.7135, Training accuracy = 0.5227, F1 = 0.5194



Epoch 1/10:  49%|████▉     | 1081/2208 [00:58<01:13, 15.33it/s][A
Epoch 1/10:  49%|████▉     | 1084/2208 [00:59<01:07, 16.73it/s][A
Epoch 1/10:  49%|████▉     | 1087/2208 [00:59<01:02, 17.97it/s][A
Epoch 1/10:  49%|████▉     | 1090/2208 [00:59<00:59, 18.85it/s][A
Epoch 1/10:  50%|████▉     | 1093/2208 [00:59<01:04, 17.39it/s][A
Epoch 1/10:  50%|████▉     | 1096/2208 [00:59<01:00, 18.43it/s][A
Epoch 1/10:  50%|████▉     | 1098/2208 [00:59<00:59, 18.71it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  50%|█████     | 1104/2208 [01:00<01:15, 14.64it/s][A

Batch 1100: Training loss = 0.8489, Training accuracy = 0.5278, F1 = 0.5245



Epoch 1/10:  50%|█████     | 1107/2208 [01:00<01:07, 16.23it/s][A
Epoch 1/10:  50%|█████     | 1110/2208 [01:00<01:02, 17.54it/s][A
Epoch 1/10:  50%|█████     | 1113/2208 [01:00<00:59, 18.50it/s][A
Epoch 1/10:  51%|█████     | 1116/2208 [01:00<00:56, 19.28it/s][A
Epoch 1/10:  51%|█████     | 1119/2208 [01:01<00:55, 19.77it/s][A
Epoch 1/10:  51%|█████     | 1122/2208 [01:01<00:53, 20.20it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  51%|█████     | 1128/2208 [01:01<01:21, 13.22it/s][A

Batch 1125: Training loss = 0.9369, Training accuracy = 0.5323, F1 = 0.5291



Epoch 1/10:  51%|█████     | 1131/2208 [01:01<01:12, 14.91it/s][A
Epoch 1/10:  51%|█████▏    | 1133/2208 [01:01<01:08, 15.70it/s][A
Epoch 1/10:  51%|█████▏    | 1136/2208 [01:02<01:02, 17.12it/s][A
Epoch 1/10:  52%|█████▏    | 1139/2208 [01:02<00:58, 18.29it/s][A
Epoch 1/10:  52%|█████▏    | 1142/2208 [01:02<00:55, 19.15it/s][A
Epoch 1/10:  52%|█████▏    | 1145/2208 [01:02<00:55, 19.30it/s][A
Epoch 1/10:  52%|█████▏    | 1148/2208 [01:02<00:56, 18.89it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  52%|█████▏    | 1154/2208 [01:03<01:09, 15.14it/s][A

Batch 1150: Training loss = 0.8414, Training accuracy = 0.5368, F1 = 0.5336



Epoch 1/10:  52%|█████▏    | 1157/2208 [01:03<01:03, 16.67it/s][A
Epoch 1/10:  53%|█████▎    | 1160/2208 [01:03<00:58, 17.83it/s][A
Epoch 1/10:  53%|█████▎    | 1163/2208 [01:03<00:55, 18.76it/s][A
Epoch 1/10:  53%|█████▎    | 1166/2208 [01:03<00:53, 19.46it/s][A
Epoch 1/10:  53%|█████▎    | 1169/2208 [01:03<00:52, 19.96it/s][A
Epoch 1/10:  53%|█████▎    | 1172/2208 [01:04<00:51, 20.29it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  53%|█████▎    | 1178/2208 [01:04<01:12, 14.30it/s][A

Batch 1175: Training loss = 0.8690, Training accuracy = 0.5413, F1 = 0.5381



Epoch 1/10:  53%|█████▎    | 1181/2208 [01:04<01:04, 15.87it/s][A
Epoch 1/10:  54%|█████▎    | 1184/2208 [01:04<00:59, 17.21it/s][A
Epoch 1/10:  54%|█████▍    | 1187/2208 [01:04<00:56, 18.22it/s][A
Epoch 1/10:  54%|█████▍    | 1190/2208 [01:05<00:53, 19.10it/s][A
Epoch 1/10:  54%|█████▍    | 1193/2208 [01:05<00:51, 19.77it/s][A
Epoch 1/10:  54%|█████▍    | 1196/2208 [01:05<00:50, 20.13it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  54%|█████▍    | 1202/2208 [01:05<01:12, 13.95it/s][A
Epoch 1/10:  55%|█████▍    | 1205/2208 [01:06<01:04, 15.61it/s][A

Batch 1200: Training loss = 0.8507, Training accuracy = 0.5455, F1 = 0.5424



Epoch 1/10:  55%|█████▍    | 1208/2208 [01:06<00:58, 17.02it/s][A
Epoch 1/10:  55%|█████▍    | 1211/2208 [01:06<00:54, 18.13it/s][A
Epoch 1/10:  55%|█████▍    | 1214/2208 [01:06<00:52, 18.94it/s][A
Epoch 1/10:  55%|█████▌    | 1217/2208 [01:06<00:50, 19.58it/s][A
Epoch 1/10:  55%|█████▌    | 1220/2208 [01:06<00:49, 20.08it/s][A
Epoch 1/10:  55%|█████▌    | 1223/2208 [01:06<00:48, 20.37it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  56%|█████▌    | 1229/2208 [01:07<01:02, 15.56it/s][A

Batch 1225: Training loss = 0.7172, Training accuracy = 0.5496, F1 = 0.5465



Epoch 1/10:  56%|█████▌    | 1232/2208 [01:07<00:57, 17.00it/s][A
Epoch 1/10:  56%|█████▌    | 1235/2208 [01:07<00:53, 18.15it/s][A
Epoch 1/10:  56%|█████▌    | 1238/2208 [01:07<00:51, 18.98it/s][A
Epoch 1/10:  56%|█████▌    | 1241/2208 [01:07<00:49, 19.55it/s][A
Epoch 1/10:  56%|█████▋    | 1244/2208 [01:08<00:48, 20.05it/s][A
Epoch 1/10:  56%|█████▋    | 1247/2208 [01:08<00:46, 20.51it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  57%|█████▋    | 1253/2208 [01:08<01:06, 14.30it/s][A

Batch 1250: Training loss = 0.6723, Training accuracy = 0.5536, F1 = 0.5506



Epoch 1/10:  57%|█████▋    | 1256/2208 [01:08<01:00, 15.86it/s][A
Epoch 1/10:  57%|█████▋    | 1259/2208 [01:09<00:55, 17.16it/s][A
Epoch 1/10:  57%|█████▋    | 1262/2208 [01:09<00:51, 18.31it/s][A
Epoch 1/10:  57%|█████▋    | 1265/2208 [01:09<00:49, 19.22it/s][A
Epoch 1/10:  57%|█████▋    | 1268/2208 [01:09<00:47, 19.81it/s][A
Epoch 1/10:  58%|█████▊    | 1271/2208 [01:09<00:46, 20.11it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  58%|█████▊    | 1277/2208 [01:10<01:07, 13.71it/s][A
Epoch 1/10:  58%|█████▊    | 1280/2208 [01:10<01:00, 15.46it/s][A

Batch 1275: Training loss = 0.7888, Training accuracy = 0.5575, F1 = 0.5544



Epoch 1/10:  58%|█████▊    | 1283/2208 [01:10<00:54, 16.87it/s][A
Epoch 1/10:  58%|█████▊    | 1286/2208 [01:10<00:51, 18.07it/s][A
Epoch 1/10:  58%|█████▊    | 1289/2208 [01:10<00:48, 19.00it/s][A
Epoch 1/10:  59%|█████▊    | 1292/2208 [01:10<00:46, 19.62it/s][A
Epoch 1/10:  59%|█████▊    | 1295/2208 [01:10<00:45, 20.16it/s][A
Epoch 1/10:  59%|█████▉    | 1298/2208 [01:11<00:44, 20.47it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  59%|█████▉    | 1304/2208 [01:11<00:58, 15.58it/s][A

Batch 1300: Training loss = 0.9216, Training accuracy = 0.5611, F1 = 0.5582



Epoch 1/10:  59%|█████▉    | 1307/2208 [01:11<00:53, 17.00it/s][A
Epoch 1/10:  59%|█████▉    | 1310/2208 [01:11<00:49, 18.09it/s][A
Epoch 1/10:  59%|█████▉    | 1313/2208 [01:12<00:47, 18.88it/s][A
Epoch 1/10:  60%|█████▉    | 1316/2208 [01:12<00:45, 19.53it/s][A
Epoch 1/10:  60%|█████▉    | 1319/2208 [01:12<00:44, 20.09it/s][A
Epoch 1/10:  60%|█████▉    | 1322/2208 [01:12<00:43, 20.26it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  60%|██████    | 1328/2208 [01:13<01:05, 13.48it/s][A

Batch 1325: Training loss = 0.7166, Training accuracy = 0.5649, F1 = 0.5619



Epoch 1/10:  60%|██████    | 1331/2208 [01:13<00:57, 15.24it/s][A
Epoch 1/10:  60%|██████    | 1334/2208 [01:13<00:52, 16.66it/s][A
Epoch 1/10:  61%|██████    | 1337/2208 [01:13<00:48, 17.80it/s][A
Epoch 1/10:  61%|██████    | 1340/2208 [01:13<00:46, 18.67it/s][A
Epoch 1/10:  61%|██████    | 1343/2208 [01:13<00:44, 19.39it/s][A
Epoch 1/10:  61%|██████    | 1346/2208 [01:13<00:43, 19.92it/s][A
Epoch 1/10:  61%|██████    | 1349/2208 [01:14<00:46, 18.63it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  61%|██████▏   | 1354/2208 [01:14<01:02, 13.65it/s][A

Batch 1350: Training loss = 0.9169, Training accuracy = 0.5685, F1 = 0.5656



Epoch 1/10:  61%|██████▏   | 1357/2208 [01:14<00:55, 15.45it/s][A
Epoch 1/10:  62%|██████▏   | 1360/2208 [01:14<00:50, 16.93it/s][A
Epoch 1/10:  62%|██████▏   | 1363/2208 [01:14<00:46, 18.12it/s][A
Epoch 1/10:  62%|██████▏   | 1366/2208 [01:15<00:44, 18.85it/s][A
Epoch 1/10:  62%|██████▏   | 1369/2208 [01:15<00:43, 19.33it/s][A
Epoch 1/10:  62%|██████▏   | 1372/2208 [01:15<00:42, 19.77it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  62%|██████▏   | 1378/2208 [01:16<01:10, 11.77it/s][A

Batch 1375: Training loss = 0.7157, Training accuracy = 0.5721, F1 = 0.5692



Epoch 1/10:  63%|██████▎   | 1381/2208 [01:16<01:00, 13.65it/s][A
Epoch 1/10:  63%|██████▎   | 1384/2208 [01:16<00:53, 15.27it/s][A
Epoch 1/10:  63%|██████▎   | 1387/2208 [01:16<00:49, 16.70it/s][A
Epoch 1/10:  63%|██████▎   | 1390/2208 [01:16<00:47, 17.06it/s][A
Epoch 1/10:  63%|██████▎   | 1393/2208 [01:16<00:44, 18.25it/s][A
Epoch 1/10:  63%|██████▎   | 1396/2208 [01:16<00:42, 19.04it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  63%|██████▎   | 1402/2208 [01:17<01:02, 12.86it/s][A
Epoch 1/10:  64%|██████▎   | 1405/2208 [01:17<00:54, 14.67it/s][A

Batch 1400: Training loss = 0.6935, Training accuracy = 0.5754, F1 = 0.5725



Epoch 1/10:  64%|██████▍   | 1408/2208 [01:17<00:49, 16.26it/s][A
Epoch 1/10:  64%|██████▍   | 1411/2208 [01:17<00:45, 17.46it/s][A
Epoch 1/10:  64%|██████▍   | 1414/2208 [01:18<00:43, 18.40it/s][A
Epoch 1/10:  64%|██████▍   | 1417/2208 [01:18<00:41, 19.13it/s][A
Epoch 1/10:  64%|██████▍   | 1420/2208 [01:18<00:40, 19.68it/s][A
Epoch 1/10:  64%|██████▍   | 1423/2208 [01:18<00:39, 20.11it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  65%|██████▍   | 1429/2208 [01:19<00:52, 14.74it/s][A

Batch 1425: Training loss = 0.7233, Training accuracy = 0.5787, F1 = 0.5758



Epoch 1/10:  65%|██████▍   | 1432/2208 [01:19<00:47, 16.31it/s][A
Epoch 1/10:  65%|██████▍   | 1435/2208 [01:19<00:44, 17.50it/s][A
Epoch 1/10:  65%|██████▌   | 1438/2208 [01:19<00:41, 18.49it/s][A
Epoch 1/10:  65%|██████▌   | 1441/2208 [01:19<00:39, 19.31it/s][A
Epoch 1/10:  65%|██████▌   | 1444/2208 [01:19<00:38, 19.87it/s][A
Epoch 1/10:  66%|██████▌   | 1447/2208 [01:19<00:37, 20.15it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  66%|██████▌   | 1453/2208 [01:20<00:59, 12.65it/s][A

Batch 1450: Training loss = 0.7733, Training accuracy = 0.5819, F1 = 0.5791



Epoch 1/10:  66%|██████▌   | 1456/2208 [01:20<00:51, 14.47it/s][A
Epoch 1/10:  66%|██████▌   | 1459/2208 [01:20<00:46, 16.04it/s][A
Epoch 1/10:  66%|██████▌   | 1462/2208 [01:20<00:43, 17.32it/s][A
Epoch 1/10:  66%|██████▋   | 1465/2208 [01:21<00:40, 18.35it/s][A
Epoch 1/10:  66%|██████▋   | 1468/2208 [01:21<00:38, 19.01it/s][A
Epoch 1/10:  67%|██████▋   | 1471/2208 [01:21<00:38, 19.39it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  67%|██████▋   | 1477/2208 [01:21<00:55, 13.06it/s][A
Epoch 1/10:  67%|██████▋   | 1480/2208 [01:22<00:48, 14.86it/s][A

Batch 1475: Training loss = 0.6569, Training accuracy = 0.5851, F1 = 0.5823



Epoch 1/10:  67%|██████▋   | 1483/2208 [01:22<00:44, 16.40it/s][A
Epoch 1/10:  67%|██████▋   | 1486/2208 [01:22<00:40, 17.69it/s][A
Epoch 1/10:  67%|██████▋   | 1489/2208 [01:22<00:38, 18.52it/s][A
Epoch 1/10:  68%|██████▊   | 1492/2208 [01:22<00:37, 19.14it/s][A
Epoch 1/10:  68%|██████▊   | 1495/2208 [01:22<00:36, 19.79it/s][A
Epoch 1/10:  68%|██████▊   | 1498/2208 [01:22<00:35, 20.28it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  68%|██████▊   | 1504/2208 [01:23<00:47, 14.90it/s][A

Batch 1500: Training loss = 0.8123, Training accuracy = 0.5885, F1 = 0.5857



Epoch 1/10:  68%|██████▊   | 1507/2208 [01:23<00:42, 16.39it/s][A
Epoch 1/10:  68%|██████▊   | 1510/2208 [01:23<00:39, 17.66it/s][A
Epoch 1/10:  69%|██████▊   | 1513/2208 [01:23<00:37, 18.67it/s][A
Epoch 1/10:  69%|██████▊   | 1516/2208 [01:23<00:35, 19.44it/s][A
Epoch 1/10:  69%|██████▉   | 1519/2208 [01:24<00:34, 20.03it/s][A
Epoch 1/10:  69%|██████▉   | 1522/2208 [01:24<00:33, 20.46it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  69%|██████▉   | 1528/2208 [01:24<00:52, 13.05it/s][A

Batch 1525: Training loss = 0.6128, Training accuracy = 0.5917, F1 = 0.5889



Epoch 1/10:  69%|██████▉   | 1531/2208 [01:24<00:45, 14.85it/s][A
Epoch 1/10:  69%|██████▉   | 1534/2208 [01:25<00:41, 16.38it/s][A
Epoch 1/10:  70%|██████▉   | 1537/2208 [01:25<00:38, 17.57it/s][A
Epoch 1/10:  70%|██████▉   | 1540/2208 [01:25<00:36, 18.52it/s][A
Epoch 1/10:  70%|██████▉   | 1543/2208 [01:25<00:34, 19.26it/s][A
Epoch 1/10:  70%|███████   | 1546/2208 [01:25<00:33, 19.79it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  70%|███████   | 1552/2208 [01:26<00:51, 12.66it/s][A
Epoch 1/10:  70%|███████   | 1555/2208 [01:26<00:45, 14.48it/s][A

Batch 1550: Training loss = 0.5408, Training accuracy = 0.5947, F1 = 0.5920



Epoch 1/10:  71%|███████   | 1558/2208 [01:26<00:40, 16.05it/s][A
Epoch 1/10:  71%|███████   | 1561/2208 [01:26<00:37, 17.35it/s][A
Epoch 1/10:  71%|███████   | 1564/2208 [01:26<00:35, 18.38it/s][A
Epoch 1/10:  71%|███████   | 1567/2208 [01:26<00:33, 19.03it/s][A
Epoch 1/10:  71%|███████   | 1570/2208 [01:27<00:32, 19.52it/s][A
Epoch 1/10:  71%|███████   | 1573/2208 [01:27<00:31, 20.01it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  72%|███████▏  | 1579/2208 [01:27<00:45, 13.92it/s][A

Batch 1575: Training loss = 0.4556, Training accuracy = 0.5978, F1 = 0.5950



Epoch 1/10:  72%|███████▏  | 1582/2208 [01:28<00:40, 15.57it/s][A
Epoch 1/10:  72%|███████▏  | 1585/2208 [01:28<00:36, 16.93it/s][A
Epoch 1/10:  72%|███████▏  | 1588/2208 [01:28<00:34, 17.99it/s][A
Epoch 1/10:  72%|███████▏  | 1591/2208 [01:28<00:32, 18.80it/s][A
Epoch 1/10:  72%|███████▏  | 1594/2208 [01:28<00:31, 19.45it/s][A
Epoch 1/10:  72%|███████▏  | 1597/2208 [01:28<00:30, 19.88it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  73%|███████▎  | 1603/2208 [01:29<00:49, 12.13it/s][A

Batch 1600: Training loss = 0.6040, Training accuracy = 0.6007, F1 = 0.5980



Epoch 1/10:  73%|███████▎  | 1606/2208 [01:29<00:43, 13.99it/s][A
Epoch 1/10:  73%|███████▎  | 1609/2208 [01:29<00:38, 15.50it/s][A
Epoch 1/10:  73%|███████▎  | 1612/2208 [01:29<00:35, 16.84it/s][A
Epoch 1/10:  73%|███████▎  | 1615/2208 [01:29<00:33, 17.88it/s][A
Epoch 1/10:  73%|███████▎  | 1617/2208 [01:30<00:33, 17.48it/s][A
Epoch 1/10:  73%|███████▎  | 1620/2208 [01:30<00:34, 17.28it/s][A
Epoch 1/10:  74%|███████▎  | 1623/2208 [01:30<00:31, 18.39it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  74%|███████▍  | 1629/2208 [01:30<00:44, 13.12it/s][A

Batch 1625: Training loss = 0.4952, Training accuracy = 0.6035, F1 = 0.6009



Epoch 1/10:  74%|███████▍  | 1632/2208 [01:31<00:38, 14.85it/s][A
Epoch 1/10:  74%|███████▍  | 1635/2208 [01:31<00:35, 16.26it/s][A
Epoch 1/10:  74%|███████▍  | 1638/2208 [01:31<00:32, 17.40it/s][A
Epoch 1/10:  74%|███████▍  | 1641/2208 [01:31<00:30, 18.37it/s][A
Epoch 1/10:  74%|███████▍  | 1644/2208 [01:31<00:29, 19.03it/s][A
Epoch 1/10:  75%|███████▍  | 1647/2208 [01:31<00:28, 19.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  75%|███████▍  | 1653/2208 [01:32<00:45, 12.32it/s][A

Batch 1650: Training loss = 0.5622, Training accuracy = 0.6060, F1 = 0.6034



Epoch 1/10:  75%|███████▌  | 1656/2208 [01:32<00:39, 14.11it/s][A
Epoch 1/10:  75%|███████▌  | 1659/2208 [01:32<00:34, 15.74it/s][A
Epoch 1/10:  75%|███████▌  | 1662/2208 [01:32<00:32, 17.04it/s][A
Epoch 1/10:  75%|███████▌  | 1665/2208 [01:33<00:30, 18.07it/s][A
Epoch 1/10:  76%|███████▌  | 1668/2208 [01:33<00:28, 18.94it/s][A
Epoch 1/10:  76%|███████▌  | 1671/2208 [01:33<00:27, 19.62it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  76%|███████▌  | 1677/2208 [01:33<00:42, 12.43it/s][A
Epoch 1/10:  76%|███████▌  | 1680/2208 [01:34<00:36, 14.28it/s][A

Batch 1675: Training loss = 0.6367, Training accuracy = 0.6089, F1 = 0.6063



Epoch 1/10:  76%|███████▌  | 1683/2208 [01:34<00:33, 15.85it/s][A
Epoch 1/10:  76%|███████▋  | 1686/2208 [01:34<00:30, 17.22it/s][A
Epoch 1/10:  76%|███████▋  | 1689/2208 [01:34<00:28, 18.22it/s][A
Epoch 1/10:  77%|███████▋  | 1692/2208 [01:34<00:27, 19.07it/s][A
Epoch 1/10:  77%|███████▋  | 1695/2208 [01:34<00:26, 19.73it/s][A
Epoch 1/10:  77%|███████▋  | 1698/2208 [01:34<00:25, 20.25it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  77%|███████▋  | 1704/2208 [01:35<00:36, 13.79it/s][A

Batch 1700: Training loss = 0.6517, Training accuracy = 0.6116, F1 = 0.6090



Epoch 1/10:  77%|███████▋  | 1707/2208 [01:35<00:32, 15.38it/s][A
Epoch 1/10:  77%|███████▋  | 1710/2208 [01:35<00:29, 16.83it/s][A
Epoch 1/10:  78%|███████▊  | 1713/2208 [01:35<00:27, 17.92it/s][A
Epoch 1/10:  78%|███████▊  | 1716/2208 [01:36<00:26, 18.86it/s][A
Epoch 1/10:  78%|███████▊  | 1719/2208 [01:36<00:25, 19.46it/s][A
Epoch 1/10:  78%|███████▊  | 1722/2208 [01:36<00:26, 18.62it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  78%|███████▊  | 1727/2208 [01:37<00:44, 10.76it/s][A
Epoch 1/10:  78%|███████▊  | 1730/2208 [01:37<00:37, 12.86it/s][A

Batch 1725: Training loss = 0.4750, Training accuracy = 0.6141, F1 = 0.6116



Epoch 1/10:  78%|███████▊  | 1733/2208 [01:37<00:32, 14.63it/s][A
Epoch 1/10:  79%|███████▊  | 1736/2208 [01:37<00:29, 16.20it/s][A
Epoch 1/10:  79%|███████▉  | 1739/2208 [01:37<00:26, 17.59it/s][A
Epoch 1/10:  79%|███████▉  | 1742/2208 [01:37<00:24, 18.65it/s][A
Epoch 1/10:  79%|███████▉  | 1745/2208 [01:37<00:23, 19.39it/s][A
Epoch 1/10:  79%|███████▉  | 1748/2208 [01:37<00:23, 19.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  79%|███████▉  | 1754/2208 [01:38<00:32, 14.13it/s][A

Batch 1750: Training loss = 0.7668, Training accuracy = 0.6168, F1 = 0.6142



Epoch 1/10:  80%|███████▉  | 1757/2208 [01:38<00:28, 15.83it/s][A
Epoch 1/10:  80%|███████▉  | 1760/2208 [01:38<00:26, 17.17it/s][A
Epoch 1/10:  80%|███████▉  | 1763/2208 [01:39<00:24, 18.17it/s][A
Epoch 1/10:  80%|███████▉  | 1766/2208 [01:39<00:23, 19.09it/s][A
Epoch 1/10:  80%|████████  | 1769/2208 [01:39<00:22, 19.68it/s][A
Epoch 1/10:  80%|████████  | 1772/2208 [01:39<00:21, 20.09it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  81%|████████  | 1778/2208 [01:40<00:37, 11.59it/s][A

Batch 1775: Training loss = 0.7495, Training accuracy = 0.6193, F1 = 0.6168



Epoch 1/10:  81%|████████  | 1781/2208 [01:40<00:31, 13.48it/s][A
Epoch 1/10:  81%|████████  | 1784/2208 [01:40<00:28, 15.14it/s][A
Epoch 1/10:  81%|████████  | 1787/2208 [01:40<00:25, 16.59it/s][A
Epoch 1/10:  81%|████████  | 1790/2208 [01:40<00:23, 17.86it/s][A
Epoch 1/10:  81%|████████  | 1793/2208 [01:40<00:22, 18.76it/s][A
Epoch 1/10:  81%|████████▏ | 1796/2208 [01:40<00:21, 19.45it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  82%|████████▏ | 1802/2208 [01:41<00:33, 12.10it/s][A
Epoch 1/10:  82%|████████▏ | 1805/2208 [01:41<00:28, 13.96it/s][A

Batch 1800: Training loss = 0.6155, Training accuracy = 0.6217, F1 = 0.6192



Epoch 1/10:  82%|████████▏ | 1808/2208 [01:41<00:25, 15.54it/s][A
Epoch 1/10:  82%|████████▏ | 1811/2208 [01:41<00:23, 16.89it/s][A
Epoch 1/10:  82%|████████▏ | 1814/2208 [01:42<00:22, 17.90it/s][A
Epoch 1/10:  82%|████████▏ | 1817/2208 [01:42<00:20, 18.73it/s][A
Epoch 1/10:  82%|████████▏ | 1820/2208 [01:42<00:20, 19.35it/s][A
Epoch 1/10:  83%|████████▎ | 1823/2208 [01:42<00:19, 19.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  83%|████████▎ | 1829/2208 [01:43<00:28, 13.39it/s][A

Batch 1825: Training loss = 0.5309, Training accuracy = 0.6239, F1 = 0.6214



Epoch 1/10:  83%|████████▎ | 1832/2208 [01:43<00:24, 15.10it/s][A
Epoch 1/10:  83%|████████▎ | 1835/2208 [01:43<00:22, 16.50it/s][A
Epoch 1/10:  83%|████████▎ | 1837/2208 [01:43<00:21, 17.15it/s][A
Epoch 1/10:  83%|████████▎ | 1840/2208 [01:43<00:20, 18.20it/s][A
Epoch 1/10:  83%|████████▎ | 1843/2208 [01:43<00:19, 19.06it/s][A
Epoch 1/10:  84%|████████▎ | 1846/2208 [01:44<00:18, 19.64it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  84%|████████▍ | 1852/2208 [01:44<00:33, 10.69it/s][A
Epoch 1/10:  84%|████████▍ | 1855/2208 [01:44<00:27, 12.62it/s][A

Batch 1850: Training loss = 0.4874, Training accuracy = 0.6263, F1 = 0.6238



Epoch 1/10:  84%|████████▍ | 1858/2208 [01:45<00:24, 14.34it/s][A
Epoch 1/10:  84%|████████▍ | 1861/2208 [01:45<00:21, 15.97it/s][A
Epoch 1/10:  84%|████████▍ | 1864/2208 [01:45<00:19, 17.32it/s][A
Epoch 1/10:  85%|████████▍ | 1867/2208 [01:45<00:18, 18.22it/s][A
Epoch 1/10:  85%|████████▍ | 1870/2208 [01:45<00:19, 17.44it/s][A
Epoch 1/10:  85%|████████▍ | 1873/2208 [01:45<00:18, 18.38it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  85%|████████▌ | 1877/2208 [01:46<00:33, 10.01it/s][A
Epoch 1/10:  85%|████████▌ | 1880/2208 [01:46<00:26, 12.27it/s][A

Batch 1875: Training loss = 0.7363, Training accuracy = 0.6284, F1 = 0.6260



Epoch 1/10:  85%|████████▌ | 1883/2208 [01:46<00:22, 14.25it/s][A
Epoch 1/10:  85%|████████▌ | 1886/2208 [01:46<00:20, 15.96it/s][A
Epoch 1/10:  86%|████████▌ | 1889/2208 [01:46<00:18, 17.30it/s][A
Epoch 1/10:  86%|████████▌ | 1892/2208 [01:47<00:17, 18.40it/s][A
Epoch 1/10:  86%|████████▌ | 1895/2208 [01:47<00:16, 19.21it/s][A
Epoch 1/10:  86%|████████▌ | 1898/2208 [01:47<00:15, 19.81it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  86%|████████▌ | 1904/2208 [01:47<00:22, 13.47it/s][A

Batch 1900: Training loss = 0.7020, Training accuracy = 0.6306, F1 = 0.6282



Epoch 1/10:  86%|████████▋ | 1907/2208 [01:48<00:19, 15.20it/s][A
Epoch 1/10:  87%|████████▋ | 1910/2208 [01:48<00:17, 16.71it/s][A
Epoch 1/10:  87%|████████▋ | 1913/2208 [01:48<00:16, 17.89it/s][A
Epoch 1/10:  87%|████████▋ | 1916/2208 [01:48<00:15, 18.73it/s][A
Epoch 1/10:  87%|████████▋ | 1919/2208 [01:48<00:14, 19.42it/s][A
Epoch 1/10:  87%|████████▋ | 1922/2208 [01:48<00:14, 19.95it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  87%|████████▋ | 1928/2208 [01:49<00:23, 11.81it/s][A

Batch 1925: Training loss = 0.5730, Training accuracy = 0.6330, F1 = 0.6306



Epoch 1/10:  87%|████████▋ | 1931/2208 [01:49<00:20, 13.68it/s][A
Epoch 1/10:  88%|████████▊ | 1934/2208 [01:49<00:17, 15.35it/s][A
Epoch 1/10:  88%|████████▊ | 1937/2208 [01:49<00:16, 16.75it/s][A
Epoch 1/10:  88%|████████▊ | 1940/2208 [01:50<00:14, 17.92it/s][A
Epoch 1/10:  88%|████████▊ | 1943/2208 [01:50<00:14, 18.80it/s][A
Epoch 1/10:  88%|████████▊ | 1946/2208 [01:50<00:13, 19.38it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  88%|████████▊ | 1952/2208 [01:51<00:23, 11.10it/s][A
Epoch 1/10:  89%|████████▊ | 1955/2208 [01:51<00:19, 13.00it/s][A

Batch 1950: Training loss = 0.8818, Training accuracy = 0.6352, F1 = 0.6328



Epoch 1/10:  89%|████████▊ | 1958/2208 [01:51<00:16, 14.76it/s][A
Epoch 1/10:  89%|████████▉ | 1961/2208 [01:51<00:15, 16.26it/s][A
Epoch 1/10:  89%|████████▉ | 1964/2208 [01:51<00:13, 17.54it/s][A
Epoch 1/10:  89%|████████▉ | 1967/2208 [01:51<00:13, 18.45it/s][A
Epoch 1/10:  89%|████████▉ | 1970/2208 [01:51<00:12, 19.27it/s][A
Epoch 1/10:  89%|████████▉ | 1973/2208 [01:51<00:11, 19.82it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  90%|████████▉ | 1979/2208 [01:52<00:17, 13.28it/s][A

Batch 1975: Training loss = 0.7422, Training accuracy = 0.6372, F1 = 0.6349



Epoch 1/10:  90%|████████▉ | 1982/2208 [01:52<00:15, 14.99it/s][A
Epoch 1/10:  90%|████████▉ | 1985/2208 [01:52<00:13, 16.49it/s][A
Epoch 1/10:  90%|█████████ | 1988/2208 [01:53<00:12, 17.73it/s][A
Epoch 1/10:  90%|█████████ | 1991/2208 [01:53<00:11, 18.61it/s][A
Epoch 1/10:  90%|█████████ | 1994/2208 [01:53<00:11, 19.28it/s][A
Epoch 1/10:  90%|█████████ | 1997/2208 [01:53<00:10, 19.95it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  91%|█████████ | 2003/2208 [01:54<00:18, 11.38it/s][A

Batch 2000: Training loss = 0.6093, Training accuracy = 0.6392, F1 = 0.6369



Epoch 1/10:  91%|█████████ | 2006/2208 [01:54<00:15, 13.25it/s][A
Epoch 1/10:  91%|█████████ | 2009/2208 [01:54<00:13, 14.96it/s][A
Epoch 1/10:  91%|█████████ | 2012/2208 [01:54<00:11, 16.45it/s][A
Epoch 1/10:  91%|█████████▏| 2015/2208 [01:54<00:10, 17.60it/s][A
Epoch 1/10:  91%|█████████▏| 2018/2208 [01:54<00:10, 18.67it/s][A
Epoch 1/10:  92%|█████████▏| 2021/2208 [01:55<00:09, 19.39it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  92%|█████████▏| 2027/2208 [01:55<00:15, 11.38it/s][A
Epoch 1/10:  92%|█████████▏| 2030/2208 [01:55<00:13, 13.24it/s][A

Batch 2025: Training loss = 0.7568, Training accuracy = 0.6412, F1 = 0.6389



Epoch 1/10:  92%|█████████▏| 2033/2208 [01:55<00:11, 14.95it/s][A
Epoch 1/10:  92%|█████████▏| 2036/2208 [01:56<00:10, 16.38it/s][A
Epoch 1/10:  92%|█████████▏| 2039/2208 [01:56<00:09, 17.47it/s][A
Epoch 1/10:  92%|█████████▏| 2042/2208 [01:56<00:09, 18.44it/s][A
Epoch 1/10:  93%|█████████▎| 2045/2208 [01:56<00:08, 19.16it/s][A
Epoch 1/10:  93%|█████████▎| 2048/2208 [01:56<00:08, 19.62it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  93%|█████████▎| 2054/2208 [01:57<00:12, 12.50it/s][A

Batch 2050: Training loss = 0.5714, Training accuracy = 0.6432, F1 = 0.6409



Epoch 1/10:  93%|█████████▎| 2057/2208 [01:57<00:10, 14.27it/s][A
Epoch 1/10:  93%|█████████▎| 2060/2208 [01:57<00:09, 15.76it/s][A
Epoch 1/10:  93%|█████████▎| 2063/2208 [01:57<00:08, 17.05it/s][A
Epoch 1/10:  94%|█████████▎| 2066/2208 [01:57<00:07, 18.10it/s][A
Epoch 1/10:  94%|█████████▎| 2069/2208 [01:58<00:07, 18.82it/s][A
Epoch 1/10:  94%|█████████▍| 2072/2208 [01:58<00:07, 19.42it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  94%|█████████▍| 2078/2208 [01:58<00:12, 10.82it/s][A

Batch 2075: Training loss = 0.4773, Training accuracy = 0.6453, F1 = 0.6430



Epoch 1/10:  94%|█████████▍| 2081/2208 [01:59<00:09, 12.73it/s][A
Epoch 1/10:  94%|█████████▍| 2084/2208 [01:59<00:08, 14.53it/s][A
Epoch 1/10:  95%|█████████▍| 2087/2208 [01:59<00:07, 16.00it/s][A
Epoch 1/10:  95%|█████████▍| 2090/2208 [01:59<00:06, 17.29it/s][A
Epoch 1/10:  95%|█████████▍| 2093/2208 [01:59<00:06, 18.32it/s][A
Epoch 1/10:  95%|█████████▍| 2096/2208 [01:59<00:06, 17.93it/s][A
Epoch 1/10:  95%|█████████▌| 2098/2208 [01:59<00:06, 16.72it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  95%|█████████▌| 2104/2208 [02:00<00:08, 11.64it/s][A

Batch 2100: Training loss = 0.5681, Training accuracy = 0.6473, F1 = 0.6450



Epoch 1/10:  95%|█████████▌| 2107/2208 [02:00<00:07, 13.58it/s][A
Epoch 1/10:  96%|█████████▌| 2110/2208 [02:01<00:06, 15.33it/s][A
Epoch 1/10:  96%|█████████▌| 2113/2208 [02:01<00:05, 16.87it/s][A
Epoch 1/10:  96%|█████████▌| 2116/2208 [02:01<00:05, 18.08it/s][A
Epoch 1/10:  96%|█████████▌| 2119/2208 [02:01<00:04, 18.92it/s][A
Epoch 1/10:  96%|█████████▌| 2122/2208 [02:01<00:04, 19.62it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  96%|█████████▋| 2128/2208 [02:02<00:07, 11.22it/s][A

Batch 2125: Training loss = 0.7047, Training accuracy = 0.6491, F1 = 0.6469



Epoch 1/10:  97%|█████████▋| 2131/2208 [02:02<00:05, 13.10it/s][A
Epoch 1/10:  97%|█████████▋| 2134/2208 [02:02<00:04, 14.84it/s][A
Epoch 1/10:  97%|█████████▋| 2137/2208 [02:02<00:04, 16.24it/s][A
Epoch 1/10:  97%|█████████▋| 2140/2208 [02:02<00:03, 17.43it/s][A
Epoch 1/10:  97%|█████████▋| 2143/2208 [02:02<00:03, 18.54it/s][A
Epoch 1/10:  97%|█████████▋| 2146/2208 [02:03<00:03, 19.35it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  97%|█████████▋| 2152/2208 [02:03<00:05, 10.81it/s][A
Epoch 1/10:  98%|█████████▊| 2155/2208 [02:03<00:04, 12.74it/s][A

Batch 2150: Training loss = 0.4348, Training accuracy = 0.6510, F1 = 0.6487



Epoch 1/10:  98%|█████████▊| 2158/2208 [02:04<00:03, 14.50it/s][A
Epoch 1/10:  98%|█████████▊| 2161/2208 [02:04<00:02, 16.05it/s][A
Epoch 1/10:  98%|█████████▊| 2164/2208 [02:04<00:02, 17.33it/s][A
Epoch 1/10:  98%|█████████▊| 2167/2208 [02:04<00:02, 18.36it/s][A
Epoch 1/10:  98%|█████████▊| 2170/2208 [02:04<00:01, 19.24it/s][A
Epoch 1/10:  98%|█████████▊| 2173/2208 [02:04<00:01, 19.92it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10:  99%|█████████▊| 2179/2208 [02:05<00:02, 13.00it/s][A

Batch 2175: Training loss = 0.5365, Training accuracy = 0.6527, F1 = 0.6505



Epoch 1/10:  99%|█████████▉| 2182/2208 [02:05<00:01, 14.75it/s][A
Epoch 1/10:  99%|█████████▉| 2184/2208 [02:05<00:01, 15.61it/s][A
Epoch 1/10:  99%|█████████▉| 2187/2208 [02:05<00:01, 17.14it/s][A
Epoch 1/10:  99%|█████████▉| 2190/2208 [02:05<00:00, 18.35it/s][A
Epoch 1/10:  99%|█████████▉| 2193/2208 [02:06<00:00, 19.15it/s][A
Epoch 1/10:  99%|█████████▉| 2196/2208 [02:06<00:00, 19.86it/s][A
  with torch.cuda.amp.autocast():

Epoch 1/10: 100%|█████████▉| 2202/2208 [02:06<00:00, 11.21it/s][A
Epoch 1/10: 100%|█████████▉| 2205/2208 [02:07<00:00, 13.17it/s][A

Batch 2200: Training loss = 0.6651, Training accuracy = 0.6545, F1 = 0.6522



Epoch 1/10: 100%|██████████| 2208/2208 [02:07<00:00, 14.99it/s][A
                                                               [A


Epoch 1 Training Metrics:
Loss: 1.2313
Accuracy: 0.6550
F1 Score: 0.6528
Precision: 0.6523
Recall: 0.6550

Starting validation...



Validation:   0%|          | 0/552 [00:00<?, ?it/s][A
Validation:   0%|          | 1/552 [00:01<16:11,  1.76s/it][A
Validation:   1%|          | 3/552 [00:01<04:33,  2.00it/s][A
Validation:   1%|          | 5/552 [00:01<02:27,  3.71it/s][A
Validation:   1%|▏         | 7/552 [00:02<01:36,  5.64it/s][A
Validation:   2%|▏         | 9/552 [00:02<01:10,  7.66it/s][A
Validation:   2%|▏         | 11/552 [00:02<00:55,  9.67it/s][A
Validation:   2%|▏         | 13/552 [00:02<00:46, 11.56it/s][A
Validation:   3%|▎         | 15/552 [00:02<00:40, 13.22it/s][A
Validation:   3%|▎         | 17/552 [00:02<00:36, 14.59it/s][A
Validation:   3%|▎         | 19/552 [00:02<00:33, 15.70it/s][A
Validation:   4%|▍         | 21/552 [00:02<00:32, 16.55it/s][A
Validation:   4%|▍         | 23/552 [00:02<00:30, 17.29it/s][A
Validation:   5%|▍         | 25/552 [00:03<00:29, 17.74it/s][A
Validation:   5%|▍         | 27/552 [00:03<00:29, 18.00it/s][A
Validation:   5%|▌         | 29/552 [00:03<00:28, 18.


Epoch 1 Validation Metrics:
Loss: 0.4053
Accuracy: 0.8612
F1 Score: 0.8570
Precision: 0.8704
Recall: 0.8612


Training epochs:  10%|█         | 1/10 [02:40<24:00, 160.02s/it]


Starting epoch 2/10



  with torch.cuda.amp.autocast():

  with torch.cuda.amp.autocast():

Epoch 2/10:   0%|          | 3/2208 [00:01<17:48,  2.06it/s]  [A

Batch 0: Training loss = 0.6028, Training accuracy = 0.7812, F1 = 0.7755



Epoch 2/10:   0%|          | 5/2208 [00:01<09:36,  3.82it/s][A
Epoch 2/10:   0%|          | 8/2208 [00:02<05:28,  6.70it/s][A
Epoch 2/10:   0%|          | 11/2208 [00:02<03:51,  9.47it/s][A
Epoch 2/10:   1%|          | 13/2208 [00:02<03:16, 11.17it/s][A
Epoch 2/10:   1%|          | 16/2208 [00:02<02:40, 13.65it/s][A
Epoch 2/10:   1%|          | 18/2208 [00:02<02:34, 14.21it/s][A
Epoch 2/10:   1%|          | 21/2208 [00:02<02:15, 16.16it/s][A
Epoch 2/10:   1%|          | 23/2208 [00:02<02:20, 15.54it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:   1%|▏         | 29/2208 [00:03<02:01, 17.89it/s][A

Batch 25: Training loss = 0.4302, Training accuracy = 0.8311, F1 = 0.8277



Epoch 2/10:   1%|▏         | 32/2208 [00:03<01:55, 18.79it/s][A
Epoch 2/10:   2%|▏         | 35/2208 [00:03<01:51, 19.54it/s][A
Epoch 2/10:   2%|▏         | 38/2208 [00:03<01:49, 19.90it/s][A
Epoch 2/10:   2%|▏         | 41/2208 [00:03<01:47, 20.25it/s][A
Epoch 2/10:   2%|▏         | 44/2208 [00:03<01:48, 19.93it/s][A
Epoch 2/10:   2%|▏         | 47/2208 [00:04<01:50, 19.47it/s][A
Epoch 2/10:   2%|▏         | 49/2208 [00:04<01:53, 18.95it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:   2%|▏         | 54/2208 [00:04<01:53, 19.02it/s][A

Batch 50: Training loss = 0.4773, Training accuracy = 0.8313, F1 = 0.8298



Epoch 2/10:   3%|▎         | 56/2208 [00:04<01:53, 18.98it/s][A
Epoch 2/10:   3%|▎         | 58/2208 [00:04<01:53, 18.86it/s][A
Epoch 2/10:   3%|▎         | 60/2208 [00:04<01:54, 18.82it/s][A
Epoch 2/10:   3%|▎         | 62/2208 [00:04<02:01, 17.62it/s][A
Epoch 2/10:   3%|▎         | 65/2208 [00:05<01:53, 18.80it/s][A
Epoch 2/10:   3%|▎         | 67/2208 [00:05<01:58, 18.05it/s][A
Epoch 2/10:   3%|▎         | 70/2208 [00:05<01:54, 18.63it/s][A
Epoch 2/10:   3%|▎         | 73/2208 [00:05<01:48, 19.60it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:   3%|▎         | 77/2208 [00:05<01:59, 17.85it/s][A
Epoch 2/10:   4%|▎         | 79/2208 [00:05<02:03, 17.21it/s][A

Batch 75: Training loss = 0.6270, Training accuracy = 0.8221, F1 = 0.8206



Epoch 2/10:   4%|▎         | 82/2208 [00:05<01:54, 18.53it/s][A
Epoch 2/10:   4%|▍         | 85/2208 [00:06<01:48, 19.53it/s][A
Epoch 2/10:   4%|▍         | 88/2208 [00:06<01:45, 20.17it/s][A
Epoch 2/10:   4%|▍         | 91/2208 [00:06<01:44, 20.19it/s][A
Epoch 2/10:   4%|▍         | 94/2208 [00:06<01:42, 20.55it/s][A
Epoch 2/10:   4%|▍         | 97/2208 [00:06<01:41, 20.81it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:   5%|▍         | 103/2208 [00:06<01:49, 19.27it/s][A

Batch 100: Training loss = 0.5158, Training accuracy = 0.8223, F1 = 0.8213



Epoch 2/10:   5%|▍         | 106/2208 [00:07<01:45, 19.84it/s][A
Epoch 2/10:   5%|▍         | 109/2208 [00:07<01:43, 20.33it/s][A
Epoch 2/10:   5%|▌         | 112/2208 [00:07<01:41, 20.61it/s][A
Epoch 2/10:   5%|▌         | 115/2208 [00:07<01:40, 20.73it/s][A
Epoch 2/10:   5%|▌         | 118/2208 [00:07<01:39, 20.90it/s][A
Epoch 2/10:   5%|▌         | 121/2208 [00:07<01:39, 21.04it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:   6%|▌         | 127/2208 [00:08<01:44, 19.88it/s][A
Epoch 2/10:   6%|▌         | 130/2208 [00:08<01:42, 20.31it/s][A

Batch 125: Training loss = 0.4263, Training accuracy = 0.8225, F1 = 0.8214



Epoch 2/10:   6%|▌         | 133/2208 [00:08<01:40, 20.59it/s][A
Epoch 2/10:   6%|▌         | 136/2208 [00:08<01:39, 20.85it/s][A
Epoch 2/10:   6%|▋         | 139/2208 [00:08<01:38, 21.07it/s][A
Epoch 2/10:   6%|▋         | 142/2208 [00:08<01:38, 21.00it/s][A
Epoch 2/10:   7%|▋         | 145/2208 [00:08<01:37, 21.06it/s][A
Epoch 2/10:   7%|▋         | 148/2208 [00:09<01:37, 21.17it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:   7%|▋         | 154/2208 [00:09<01:40, 20.35it/s][A

Batch 150: Training loss = 0.5494, Training accuracy = 0.8228, F1 = 0.8217



Epoch 2/10:   7%|▋         | 157/2208 [00:09<01:39, 20.64it/s][A
Epoch 2/10:   7%|▋         | 160/2208 [00:09<01:38, 20.80it/s][A
Epoch 2/10:   7%|▋         | 163/2208 [00:09<01:37, 20.90it/s][A
Epoch 2/10:   8%|▊         | 166/2208 [00:10<01:37, 20.93it/s][A
Epoch 2/10:   8%|▊         | 169/2208 [00:10<01:37, 20.97it/s][A
Epoch 2/10:   8%|▊         | 172/2208 [00:10<01:37, 20.96it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:   8%|▊         | 178/2208 [00:10<01:46, 19.14it/s][A

Batch 175: Training loss = 0.4995, Training accuracy = 0.8222, F1 = 0.8211



Epoch 2/10:   8%|▊         | 181/2208 [00:10<01:43, 19.58it/s][A
Epoch 2/10:   8%|▊         | 184/2208 [00:10<01:41, 19.98it/s][A
Epoch 2/10:   8%|▊         | 187/2208 [00:11<01:39, 20.36it/s][A
Epoch 2/10:   9%|▊         | 190/2208 [00:11<01:43, 19.43it/s][A
Epoch 2/10:   9%|▊         | 193/2208 [00:11<01:41, 19.91it/s][A
Epoch 2/10:   9%|▉         | 196/2208 [00:11<01:41, 19.87it/s][A
Epoch 2/10:   9%|▉         | 198/2208 [00:11<01:43, 19.33it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:   9%|▉         | 204/2208 [00:11<01:44, 19.27it/s][A

Batch 200: Training loss = 0.4999, Training accuracy = 0.8223, F1 = 0.8212



Epoch 2/10:   9%|▉         | 206/2208 [00:12<01:43, 19.35it/s][A
Epoch 2/10:   9%|▉         | 209/2208 [00:12<01:39, 20.01it/s][A
Epoch 2/10:  10%|▉         | 212/2208 [00:12<01:37, 20.55it/s][A
Epoch 2/10:  10%|▉         | 215/2208 [00:12<01:59, 16.67it/s][A
Epoch 2/10:  10%|▉         | 218/2208 [00:12<01:55, 17.20it/s][A
Epoch 2/10:  10%|█         | 221/2208 [00:12<01:48, 18.29it/s][A
Epoch 2/10:  10%|█         | 223/2208 [00:13<01:57, 16.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  10%|█         | 229/2208 [00:13<01:50, 17.84it/s][A

Batch 225: Training loss = 0.5782, Training accuracy = 0.8224, F1 = 0.8214



Epoch 2/10:  11%|█         | 232/2208 [00:13<01:44, 18.90it/s][A
Epoch 2/10:  11%|█         | 235/2208 [00:13<01:41, 19.49it/s][A
Epoch 2/10:  11%|█         | 238/2208 [00:13<01:46, 18.54it/s][A
Epoch 2/10:  11%|█         | 241/2208 [00:13<01:42, 19.26it/s][A
Epoch 2/10:  11%|█         | 244/2208 [00:14<01:39, 19.75it/s][A
Epoch 2/10:  11%|█         | 246/2208 [00:14<01:47, 18.21it/s][A
Epoch 2/10:  11%|█▏        | 249/2208 [00:14<01:42, 19.14it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  12%|█▏        | 254/2208 [00:14<01:45, 18.56it/s][A

Batch 250: Training loss = 0.7314, Training accuracy = 0.8231, F1 = 0.8220



Epoch 2/10:  12%|█▏        | 257/2208 [00:14<01:40, 19.43it/s][A
Epoch 2/10:  12%|█▏        | 259/2208 [00:14<01:42, 19.06it/s][A
Epoch 2/10:  12%|█▏        | 262/2208 [00:15<01:56, 16.66it/s][A
Epoch 2/10:  12%|█▏        | 265/2208 [00:15<01:48, 17.91it/s][A
Epoch 2/10:  12%|█▏        | 268/2208 [00:15<01:43, 18.78it/s][A
Epoch 2/10:  12%|█▏        | 271/2208 [00:15<01:39, 19.51it/s][A
Epoch 2/10:  12%|█▏        | 273/2208 [00:15<01:38, 19.59it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  13%|█▎        | 277/2208 [00:15<02:03, 15.66it/s][A
Epoch 2/10:  13%|█▎        | 280/2208 [00:16<01:52, 17.21it/s][A

Batch 275: Training loss = 0.4658, Training accuracy = 0.8235, F1 = 0.8224



Epoch 2/10:  13%|█▎        | 283/2208 [00:16<01:45, 18.33it/s][A
Epoch 2/10:  13%|█▎        | 286/2208 [00:16<01:40, 19.10it/s][A
Epoch 2/10:  13%|█▎        | 289/2208 [00:16<01:37, 19.65it/s][A
Epoch 2/10:  13%|█▎        | 291/2208 [00:16<01:44, 18.40it/s][A
Epoch 2/10:  13%|█▎        | 294/2208 [00:16<01:40, 19.03it/s][A
Epoch 2/10:  13%|█▎        | 297/2208 [00:16<01:36, 19.72it/s][A
Epoch 2/10:  14%|█▎        | 299/2208 [00:17<01:46, 17.88it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  14%|█▍        | 304/2208 [00:17<01:53, 16.77it/s][A

Batch 300: Training loss = 0.5619, Training accuracy = 0.8237, F1 = 0.8227



Epoch 2/10:  14%|█▍        | 307/2208 [00:17<01:45, 18.07it/s][A
Epoch 2/10:  14%|█▍        | 309/2208 [00:17<01:58, 15.96it/s][A
Epoch 2/10:  14%|█▍        | 312/2208 [00:17<01:48, 17.45it/s][A
Epoch 2/10:  14%|█▍        | 315/2208 [00:18<01:42, 18.52it/s][A
Epoch 2/10:  14%|█▍        | 318/2208 [00:18<01:37, 19.38it/s][A
Epoch 2/10:  15%|█▍        | 321/2208 [00:18<01:34, 19.90it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  15%|█▍        | 327/2208 [00:18<01:52, 16.65it/s][A
Epoch 2/10:  15%|█▍        | 330/2208 [00:18<01:45, 17.75it/s][A

Batch 325: Training loss = 0.5294, Training accuracy = 0.8239, F1 = 0.8230



Epoch 2/10:  15%|█▌        | 333/2208 [00:19<01:40, 18.64it/s][A
Epoch 2/10:  15%|█▌        | 335/2208 [00:19<01:39, 18.91it/s][A
Epoch 2/10:  15%|█▌        | 338/2208 [00:19<01:36, 19.46it/s][A
Epoch 2/10:  15%|█▌        | 341/2208 [00:19<01:48, 17.27it/s][A
Epoch 2/10:  16%|█▌        | 344/2208 [00:19<01:41, 18.28it/s][A
Epoch 2/10:  16%|█▌        | 346/2208 [00:19<01:40, 18.55it/s][A
Epoch 2/10:  16%|█▌        | 349/2208 [00:19<01:43, 17.97it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  16%|█▌        | 353/2208 [00:20<01:48, 17.04it/s][A

Batch 350: Training loss = 0.5928, Training accuracy = 0.8245, F1 = 0.8236



Epoch 2/10:  16%|█▌        | 356/2208 [00:20<01:40, 18.44it/s][A
Epoch 2/10:  16%|█▋        | 359/2208 [00:20<01:35, 19.42it/s][A
Epoch 2/10:  16%|█▋        | 361/2208 [00:20<01:35, 19.44it/s][A
Epoch 2/10:  16%|█▋        | 364/2208 [00:20<01:31, 20.06it/s][A
Epoch 2/10:  17%|█▋        | 367/2208 [00:20<01:30, 20.27it/s][A
Epoch 2/10:  17%|█▋        | 370/2208 [00:20<01:32, 19.94it/s][A
Epoch 2/10:  17%|█▋        | 373/2208 [00:21<01:30, 20.37it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  17%|█▋        | 379/2208 [00:21<01:36, 19.01it/s][A

Batch 375: Training loss = 0.6903, Training accuracy = 0.8255, F1 = 0.8246



Epoch 2/10:  17%|█▋        | 382/2208 [00:21<01:32, 19.70it/s][A
Epoch 2/10:  17%|█▋        | 385/2208 [00:21<01:30, 20.19it/s][A
Epoch 2/10:  18%|█▊        | 388/2208 [00:21<01:28, 20.54it/s][A
Epoch 2/10:  18%|█▊        | 391/2208 [00:22<01:28, 20.54it/s][A
Epoch 2/10:  18%|█▊        | 394/2208 [00:22<01:27, 20.74it/s][A
Epoch 2/10:  18%|█▊        | 397/2208 [00:22<01:35, 19.06it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  18%|█▊        | 403/2208 [00:22<01:45, 17.11it/s][A

Batch 400: Training loss = 0.3512, Training accuracy = 0.8262, F1 = 0.8253



Epoch 2/10:  18%|█▊        | 406/2208 [00:22<01:39, 18.17it/s][A
Epoch 2/10:  19%|█▊        | 409/2208 [00:23<01:34, 19.01it/s][A
Epoch 2/10:  19%|█▊        | 412/2208 [00:23<01:31, 19.72it/s][A
Epoch 2/10:  19%|█▉        | 415/2208 [00:23<01:28, 20.24it/s][A
Epoch 2/10:  19%|█▉        | 418/2208 [00:23<01:27, 20.44it/s][A
Epoch 2/10:  19%|█▉        | 421/2208 [00:23<01:26, 20.69it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  19%|█▉        | 427/2208 [00:23<01:39, 17.87it/s][A
Epoch 2/10:  19%|█▉        | 430/2208 [00:24<01:34, 18.83it/s][A

Batch 425: Training loss = 0.5716, Training accuracy = 0.8261, F1 = 0.8253



Epoch 2/10:  20%|█▉        | 433/2208 [00:24<01:30, 19.57it/s][A
Epoch 2/10:  20%|█▉        | 436/2208 [00:24<01:27, 20.17it/s][A
Epoch 2/10:  20%|█▉        | 439/2208 [00:24<01:26, 20.36it/s][A
Epoch 2/10:  20%|██        | 442/2208 [00:24<01:25, 20.63it/s][A
Epoch 2/10:  20%|██        | 445/2208 [00:24<01:24, 20.82it/s][A
Epoch 2/10:  20%|██        | 448/2208 [00:24<01:23, 21.00it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  21%|██        | 454/2208 [00:25<01:33, 18.85it/s][A

Batch 450: Training loss = 0.6625, Training accuracy = 0.8266, F1 = 0.8257



Epoch 2/10:  21%|██        | 457/2208 [00:25<01:29, 19.50it/s][A
Epoch 2/10:  21%|██        | 460/2208 [00:25<01:27, 20.09it/s][A
Epoch 2/10:  21%|██        | 463/2208 [00:25<01:25, 20.34it/s][A
Epoch 2/10:  21%|██        | 466/2208 [00:25<01:24, 20.71it/s][A
Epoch 2/10:  21%|██        | 469/2208 [00:26<01:24, 20.60it/s][A
Epoch 2/10:  21%|██▏       | 472/2208 [00:26<01:23, 20.89it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  22%|██▏       | 478/2208 [00:26<01:36, 17.91it/s][A

Batch 475: Training loss = 0.4668, Training accuracy = 0.8265, F1 = 0.8256



Epoch 2/10:  22%|██▏       | 481/2208 [00:26<01:31, 18.83it/s][A
Epoch 2/10:  22%|██▏       | 484/2208 [00:26<01:28, 19.57it/s][A
Epoch 2/10:  22%|██▏       | 487/2208 [00:26<01:25, 20.07it/s][A
Epoch 2/10:  22%|██▏       | 490/2208 [00:27<01:24, 20.44it/s][A
Epoch 2/10:  22%|██▏       | 493/2208 [00:27<01:23, 20.56it/s][A
Epoch 2/10:  22%|██▏       | 496/2208 [00:27<01:22, 20.85it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  23%|██▎       | 502/2208 [00:27<01:35, 17.85it/s][A
Epoch 2/10:  23%|██▎       | 505/2208 [00:27<01:30, 18.80it/s][A

Batch 500: Training loss = 0.3740, Training accuracy = 0.8271, F1 = 0.8262



Epoch 2/10:  23%|██▎       | 508/2208 [00:27<01:27, 19.51it/s][A
Epoch 2/10:  23%|██▎       | 511/2208 [00:28<01:24, 20.01it/s][A
Epoch 2/10:  23%|██▎       | 514/2208 [00:28<01:23, 20.26it/s][A
Epoch 2/10:  23%|██▎       | 517/2208 [00:28<01:22, 20.59it/s][A
Epoch 2/10:  24%|██▎       | 520/2208 [00:28<01:21, 20.81it/s][A
Epoch 2/10:  24%|██▎       | 523/2208 [00:28<01:20, 20.95it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  24%|██▍       | 529/2208 [00:29<01:30, 18.49it/s][A

Batch 525: Training loss = 0.3290, Training accuracy = 0.8281, F1 = 0.8272



Epoch 2/10:  24%|██▍       | 532/2208 [00:29<01:27, 19.23it/s][A
Epoch 2/10:  24%|██▍       | 535/2208 [00:29<01:24, 19.83it/s][A
Epoch 2/10:  24%|██▍       | 538/2208 [00:29<01:22, 20.34it/s][A
Epoch 2/10:  25%|██▍       | 541/2208 [00:29<01:21, 20.51it/s][A
Epoch 2/10:  25%|██▍       | 544/2208 [00:29<01:20, 20.61it/s][A
Epoch 2/10:  25%|██▍       | 547/2208 [00:29<01:20, 20.76it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  25%|██▌       | 553/2208 [00:30<01:34, 17.42it/s][A

Batch 550: Training loss = 0.6400, Training accuracy = 0.8288, F1 = 0.8280



Epoch 2/10:  25%|██▌       | 556/2208 [00:30<01:29, 18.46it/s][A
Epoch 2/10:  25%|██▌       | 559/2208 [00:30<01:25, 19.27it/s][A
Epoch 2/10:  25%|██▌       | 562/2208 [00:30<01:23, 19.78it/s][A
Epoch 2/10:  26%|██▌       | 565/2208 [00:30<01:23, 19.61it/s][A
Epoch 2/10:  26%|██▌       | 567/2208 [00:31<01:30, 18.05it/s][A
Epoch 2/10:  26%|██▌       | 570/2208 [00:31<01:27, 18.76it/s][A
Epoch 2/10:  26%|██▌       | 573/2208 [00:31<01:23, 19.57it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  26%|██▌       | 578/2208 [00:31<01:35, 17.11it/s][A

Batch 575: Training loss = 0.4527, Training accuracy = 0.8297, F1 = 0.8289



Epoch 2/10:  26%|██▋       | 581/2208 [00:31<01:29, 18.18it/s][A
Epoch 2/10:  26%|██▋       | 583/2208 [00:31<01:34, 17.12it/s][A
Epoch 2/10:  27%|██▋       | 586/2208 [00:32<01:28, 18.29it/s][A
Epoch 2/10:  27%|██▋       | 589/2208 [00:32<01:26, 18.80it/s][A
Epoch 2/10:  27%|██▋       | 591/2208 [00:32<01:36, 16.84it/s][A
Epoch 2/10:  27%|██▋       | 594/2208 [00:32<01:29, 17.99it/s][A
Epoch 2/10:  27%|██▋       | 596/2208 [00:32<01:27, 18.37it/s][A
Epoch 2/10:  27%|██▋       | 599/2208 [00:32<01:23, 19.32it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  27%|██▋       | 604/2208 [00:33<01:34, 17.00it/s][A

Batch 600: Training loss = 0.6484, Training accuracy = 0.8303, F1 = 0.8295



Epoch 2/10:  27%|██▋       | 607/2208 [00:33<01:27, 18.23it/s][A
Epoch 2/10:  28%|██▊       | 610/2208 [00:33<01:23, 19.14it/s][A
Epoch 2/10:  28%|██▊       | 613/2208 [00:33<01:20, 19.75it/s][A
Epoch 2/10:  28%|██▊       | 616/2208 [00:33<01:20, 19.82it/s][A
Epoch 2/10:  28%|██▊       | 619/2208 [00:33<01:20, 19.79it/s][A
Epoch 2/10:  28%|██▊       | 622/2208 [00:33<01:18, 20.22it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  28%|██▊       | 627/2208 [00:34<01:53, 13.98it/s][A
Epoch 2/10:  29%|██▊       | 630/2208 [00:34<01:39, 15.82it/s][A

Batch 625: Training loss = 0.5227, Training accuracy = 0.8300, F1 = 0.8292



Epoch 2/10:  29%|██▊       | 633/2208 [00:34<01:31, 17.28it/s][A
Epoch 2/10:  29%|██▉       | 636/2208 [00:34<01:25, 18.44it/s][A
Epoch 2/10:  29%|██▉       | 639/2208 [00:35<01:21, 19.25it/s][A
Epoch 2/10:  29%|██▉       | 642/2208 [00:35<01:18, 19.84it/s][A
Epoch 2/10:  29%|██▉       | 645/2208 [00:35<01:16, 20.30it/s][A
Epoch 2/10:  29%|██▉       | 648/2208 [00:35<01:15, 20.63it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  30%|██▉       | 654/2208 [00:35<01:25, 18.11it/s][A

Batch 650: Training loss = 0.3916, Training accuracy = 0.8303, F1 = 0.8295



Epoch 2/10:  30%|██▉       | 657/2208 [00:35<01:21, 19.07it/s][A
Epoch 2/10:  30%|██▉       | 660/2208 [00:36<01:18, 19.70it/s][A
Epoch 2/10:  30%|███       | 663/2208 [00:36<01:16, 20.22it/s][A
Epoch 2/10:  30%|███       | 666/2208 [00:36<01:15, 20.47it/s][A
Epoch 2/10:  30%|███       | 669/2208 [00:36<01:14, 20.68it/s][A
Epoch 2/10:  30%|███       | 672/2208 [00:36<01:13, 20.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  31%|███       | 678/2208 [00:37<01:35, 16.07it/s][A

Batch 675: Training loss = 0.4388, Training accuracy = 0.8311, F1 = 0.8303



Epoch 2/10:  31%|███       | 681/2208 [00:37<01:28, 17.34it/s][A
Epoch 2/10:  31%|███       | 684/2208 [00:37<01:22, 18.49it/s][A
Epoch 2/10:  31%|███       | 687/2208 [00:37<01:18, 19.30it/s][A
Epoch 2/10:  31%|███▏      | 690/2208 [00:37<01:16, 19.86it/s][A
Epoch 2/10:  31%|███▏      | 693/2208 [00:37<01:14, 20.27it/s][A
Epoch 2/10:  32%|███▏      | 696/2208 [00:37<01:13, 20.52it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  32%|███▏      | 702/2208 [00:38<01:31, 16.43it/s][A
Epoch 2/10:  32%|███▏      | 705/2208 [00:38<01:24, 17.74it/s][A

Batch 700: Training loss = 0.5568, Training accuracy = 0.8315, F1 = 0.8307



Epoch 2/10:  32%|███▏      | 708/2208 [00:38<01:20, 18.74it/s][A
Epoch 2/10:  32%|███▏      | 711/2208 [00:38<01:17, 19.32it/s][A
Epoch 2/10:  32%|███▏      | 714/2208 [00:38<01:15, 19.87it/s][A
Epoch 2/10:  32%|███▏      | 717/2208 [00:39<01:13, 20.22it/s][A
Epoch 2/10:  33%|███▎      | 720/2208 [00:39<01:12, 20.51it/s][A
Epoch 2/10:  33%|███▎      | 723/2208 [00:39<01:11, 20.90it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  33%|███▎      | 729/2208 [00:39<01:22, 17.93it/s][A

Batch 725: Training loss = 0.4829, Training accuracy = 0.8321, F1 = 0.8313



Epoch 2/10:  33%|███▎      | 732/2208 [00:39<01:17, 18.94it/s][A
Epoch 2/10:  33%|███▎      | 735/2208 [00:40<01:14, 19.65it/s][A
Epoch 2/10:  33%|███▎      | 738/2208 [00:40<01:12, 20.20it/s][A
Epoch 2/10:  34%|███▎      | 741/2208 [00:40<01:11, 20.59it/s][A
Epoch 2/10:  34%|███▎      | 744/2208 [00:40<01:09, 20.93it/s][A
Epoch 2/10:  34%|███▍      | 747/2208 [00:40<01:09, 20.99it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  34%|███▍      | 753/2208 [00:40<01:29, 16.24it/s][A

Batch 750: Training loss = 0.4724, Training accuracy = 0.8330, F1 = 0.8322



Epoch 2/10:  34%|███▍      | 756/2208 [00:41<01:22, 17.52it/s][A
Epoch 2/10:  34%|███▍      | 759/2208 [00:41<01:18, 18.46it/s][A
Epoch 2/10:  35%|███▍      | 762/2208 [00:41<01:15, 19.16it/s][A
Epoch 2/10:  35%|███▍      | 765/2208 [00:41<01:12, 19.77it/s][A
Epoch 2/10:  35%|███▍      | 768/2208 [00:41<01:10, 20.31it/s][A
Epoch 2/10:  35%|███▍      | 771/2208 [00:41<01:09, 20.67it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  35%|███▌      | 777/2208 [00:42<01:26, 16.63it/s][A
Epoch 2/10:  35%|███▌      | 780/2208 [00:42<01:19, 17.88it/s][A

Batch 775: Training loss = 0.4592, Training accuracy = 0.8336, F1 = 0.8328



Epoch 2/10:  35%|███▌      | 783/2208 [00:42<01:15, 18.75it/s][A
Epoch 2/10:  36%|███▌      | 786/2208 [00:42<01:13, 19.42it/s][A
Epoch 2/10:  36%|███▌      | 789/2208 [00:42<01:11, 19.90it/s][A
Epoch 2/10:  36%|███▌      | 792/2208 [00:42<01:09, 20.34it/s][A
Epoch 2/10:  36%|███▌      | 795/2208 [00:43<01:08, 20.60it/s][A
Epoch 2/10:  36%|███▌      | 798/2208 [00:43<01:07, 20.92it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  36%|███▋      | 804/2208 [00:43<01:20, 17.43it/s][A

Batch 800: Training loss = 0.3215, Training accuracy = 0.8340, F1 = 0.8332



Epoch 2/10:  37%|███▋      | 807/2208 [00:43<01:15, 18.51it/s][A
Epoch 2/10:  37%|███▋      | 810/2208 [00:43<01:12, 19.20it/s][A
Epoch 2/10:  37%|███▋      | 813/2208 [00:44<01:10, 19.67it/s][A
Epoch 2/10:  37%|███▋      | 816/2208 [00:44<01:09, 20.08it/s][A
Epoch 2/10:  37%|███▋      | 819/2208 [00:44<01:08, 20.36it/s][A
Epoch 2/10:  37%|███▋      | 822/2208 [00:44<01:07, 20.42it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  38%|███▊      | 828/2208 [00:44<01:26, 16.02it/s][A

Batch 825: Training loss = 0.4073, Training accuracy = 0.8344, F1 = 0.8336



Epoch 2/10:  38%|███▊      | 831/2208 [00:45<01:19, 17.39it/s][A
Epoch 2/10:  38%|███▊      | 834/2208 [00:45<01:14, 18.47it/s][A
Epoch 2/10:  38%|███▊      | 837/2208 [00:45<01:11, 19.21it/s][A
Epoch 2/10:  38%|███▊      | 840/2208 [00:45<01:09, 19.71it/s][A
Epoch 2/10:  38%|███▊      | 843/2208 [00:45<01:17, 17.70it/s][A
Epoch 2/10:  38%|███▊      | 845/2208 [00:45<01:25, 16.00it/s][A
Epoch 2/10:  38%|███▊      | 847/2208 [00:45<01:21, 16.79it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  39%|███▊      | 852/2208 [00:46<01:43, 13.08it/s][A
Epoch 2/10:  39%|███▊      | 855/2208 [00:46<01:29, 15.10it/s][A

Batch 850: Training loss = 0.5812, Training accuracy = 0.8347, F1 = 0.8339



Epoch 2/10:  39%|███▉      | 858/2208 [00:46<01:21, 16.64it/s][A
Epoch 2/10:  39%|███▉      | 860/2208 [00:46<01:18, 17.24it/s][A
Epoch 2/10:  39%|███▉      | 863/2208 [00:46<01:13, 18.31it/s][A
Epoch 2/10:  39%|███▉      | 866/2208 [00:47<01:09, 19.22it/s][A
Epoch 2/10:  39%|███▉      | 869/2208 [00:47<01:07, 19.84it/s][A
Epoch 2/10:  39%|███▉      | 872/2208 [00:47<01:12, 18.31it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  40%|███▉      | 877/2208 [00:47<01:32, 14.32it/s][A
Epoch 2/10:  40%|███▉      | 880/2208 [00:47<01:22, 16.13it/s][A

Batch 875: Training loss = 0.4265, Training accuracy = 0.8352, F1 = 0.8344



Epoch 2/10:  40%|███▉      | 883/2208 [00:48<01:16, 17.38it/s][A
Epoch 2/10:  40%|████      | 886/2208 [00:48<01:11, 18.38it/s][A
Epoch 2/10:  40%|████      | 889/2208 [00:48<01:09, 19.04it/s][A
Epoch 2/10:  40%|████      | 892/2208 [00:48<01:07, 19.50it/s][A
Epoch 2/10:  41%|████      | 895/2208 [00:48<01:05, 20.02it/s][A
Epoch 2/10:  41%|████      | 898/2208 [00:48<01:04, 20.26it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  41%|████      | 904/2208 [00:49<01:19, 16.38it/s][A

Batch 900: Training loss = 0.5891, Training accuracy = 0.8357, F1 = 0.8350



Epoch 2/10:  41%|████      | 907/2208 [00:49<01:13, 17.66it/s][A
Epoch 2/10:  41%|████      | 910/2208 [00:49<01:09, 18.61it/s][A
Epoch 2/10:  41%|████▏     | 913/2208 [00:49<01:07, 19.29it/s][A
Epoch 2/10:  41%|████▏     | 916/2208 [00:49<01:05, 19.63it/s][A
Epoch 2/10:  42%|████▏     | 919/2208 [00:49<01:03, 20.17it/s][A
Epoch 2/10:  42%|████▏     | 922/2208 [00:50<01:03, 20.38it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  42%|████▏     | 928/2208 [00:50<01:21, 15.75it/s][A

Batch 925: Training loss = 0.3818, Training accuracy = 0.8363, F1 = 0.8355



Epoch 2/10:  42%|████▏     | 931/2208 [00:50<01:14, 17.12it/s][A
Epoch 2/10:  42%|████▏     | 934/2208 [00:50<01:10, 18.15it/s][A
Epoch 2/10:  42%|████▏     | 937/2208 [00:51<01:06, 18.99it/s][A
Epoch 2/10:  43%|████▎     | 940/2208 [00:51<01:04, 19.58it/s][A
Epoch 2/10:  43%|████▎     | 943/2208 [00:51<01:03, 19.93it/s][A
Epoch 2/10:  43%|████▎     | 946/2208 [00:51<01:05, 19.13it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  43%|████▎     | 952/2208 [00:51<01:23, 15.00it/s][A
Epoch 2/10:  43%|████▎     | 955/2208 [00:52<01:15, 16.54it/s][A

Batch 950: Training loss = 0.3122, Training accuracy = 0.8370, F1 = 0.8362



Epoch 2/10:  43%|████▎     | 958/2208 [00:52<01:10, 17.76it/s][A
Epoch 2/10:  44%|████▎     | 961/2208 [00:52<01:06, 18.67it/s][A
Epoch 2/10:  44%|████▎     | 964/2208 [00:52<01:03, 19.49it/s][A
Epoch 2/10:  44%|████▍     | 967/2208 [00:52<01:02, 19.84it/s][A
Epoch 2/10:  44%|████▍     | 970/2208 [00:52<01:01, 20.24it/s][A
Epoch 2/10:  44%|████▍     | 973/2208 [00:52<01:00, 20.44it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  44%|████▍     | 979/2208 [00:53<01:14, 16.55it/s][A

Batch 975: Training loss = 0.4840, Training accuracy = 0.8373, F1 = 0.8365



Epoch 2/10:  44%|████▍     | 982/2208 [00:53<01:09, 17.74it/s][A
Epoch 2/10:  45%|████▍     | 985/2208 [00:53<01:05, 18.62it/s][A
Epoch 2/10:  45%|████▍     | 988/2208 [00:53<01:03, 19.35it/s][A
Epoch 2/10:  45%|████▍     | 991/2208 [00:53<01:01, 19.94it/s][A
Epoch 2/10:  45%|████▌     | 994/2208 [00:54<00:59, 20.33it/s][A
Epoch 2/10:  45%|████▌     | 997/2208 [00:54<00:58, 20.58it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  45%|████▌     | 1003/2208 [00:54<01:19, 15.19it/s][A

Batch 1000: Training loss = 0.4778, Training accuracy = 0.8377, F1 = 0.8370



Epoch 2/10:  46%|████▌     | 1006/2208 [00:54<01:12, 16.69it/s][A
Epoch 2/10:  46%|████▌     | 1009/2208 [00:54<01:06, 17.90it/s][A
Epoch 2/10:  46%|████▌     | 1012/2208 [00:55<01:03, 18.84it/s][A
Epoch 2/10:  46%|████▌     | 1015/2208 [00:55<01:00, 19.57it/s][A
Epoch 2/10:  46%|████▌     | 1018/2208 [00:55<01:01, 19.26it/s][A
Epoch 2/10:  46%|████▌     | 1021/2208 [00:55<00:59, 19.90it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  47%|████▋     | 1027/2208 [00:56<01:29, 13.15it/s][A
Epoch 2/10:  47%|████▋     | 1030/2208 [00:56<01:19, 14.91it/s][A

Batch 1025: Training loss = 0.4332, Training accuracy = 0.8382, F1 = 0.8375



Epoch 2/10:  47%|████▋     | 1033/2208 [00:56<01:11, 16.36it/s][A
Epoch 2/10:  47%|████▋     | 1036/2208 [00:56<01:07, 17.49it/s][A
Epoch 2/10:  47%|████▋     | 1039/2208 [00:56<01:03, 18.43it/s][A
Epoch 2/10:  47%|████▋     | 1042/2208 [00:56<01:00, 19.30it/s][A
Epoch 2/10:  47%|████▋     | 1045/2208 [00:56<00:58, 19.91it/s][A
Epoch 2/10:  47%|████▋     | 1048/2208 [00:57<00:57, 20.31it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  48%|████▊     | 1054/2208 [00:57<01:09, 16.59it/s][A

Batch 1050: Training loss = 0.3168, Training accuracy = 0.8387, F1 = 0.8379



Epoch 2/10:  48%|████▊     | 1057/2208 [00:57<01:04, 17.82it/s][A
Epoch 2/10:  48%|████▊     | 1060/2208 [00:57<01:01, 18.75it/s][A
Epoch 2/10:  48%|████▊     | 1063/2208 [00:57<00:58, 19.51it/s][A
Epoch 2/10:  48%|████▊     | 1066/2208 [00:58<00:56, 20.08it/s][A
Epoch 2/10:  48%|████▊     | 1069/2208 [00:58<00:55, 20.39it/s][A
Epoch 2/10:  49%|████▊     | 1072/2208 [00:58<00:54, 20.67it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  49%|████▉     | 1078/2208 [00:58<01:16, 14.77it/s][A

Batch 1075: Training loss = 0.3043, Training accuracy = 0.8391, F1 = 0.8384



Epoch 2/10:  49%|████▉     | 1081/2208 [00:58<01:09, 16.29it/s][A
Epoch 2/10:  49%|████▉     | 1084/2208 [00:59<01:04, 17.44it/s][A
Epoch 2/10:  49%|████▉     | 1087/2208 [00:59<01:01, 18.35it/s][A
Epoch 2/10:  49%|████▉     | 1090/2208 [00:59<00:58, 19.16it/s][A
Epoch 2/10:  50%|████▉     | 1093/2208 [00:59<00:56, 19.68it/s][A
Epoch 2/10:  50%|████▉     | 1096/2208 [00:59<00:55, 20.01it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  50%|████▉     | 1102/2208 [01:00<01:26, 12.80it/s][A
Epoch 2/10:  50%|█████     | 1105/2208 [01:00<01:15, 14.61it/s][A

Batch 1100: Training loss = 0.4391, Training accuracy = 0.8396, F1 = 0.8389



Epoch 2/10:  50%|█████     | 1108/2208 [01:00<01:08, 16.13it/s][A
Epoch 2/10:  50%|█████     | 1111/2208 [01:00<01:03, 17.40it/s][A
Epoch 2/10:  50%|█████     | 1113/2208 [01:00<01:01, 17.80it/s][A
Epoch 2/10:  51%|█████     | 1116/2208 [01:00<00:58, 18.69it/s][A
Epoch 2/10:  51%|█████     | 1119/2208 [01:01<00:56, 19.41it/s][A
Epoch 2/10:  51%|█████     | 1122/2208 [01:01<00:54, 19.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  51%|█████     | 1128/2208 [01:01<01:20, 13.42it/s][A

Batch 1125: Training loss = 0.4288, Training accuracy = 0.8399, F1 = 0.8392



Epoch 2/10:  51%|█████     | 1131/2208 [01:01<01:11, 15.02it/s][A
Epoch 2/10:  51%|█████▏    | 1134/2208 [01:02<01:05, 16.45it/s][A
Epoch 2/10:  51%|█████▏    | 1137/2208 [01:02<01:00, 17.59it/s][A
Epoch 2/10:  52%|█████▏    | 1140/2208 [01:02<00:57, 18.55it/s][A
Epoch 2/10:  52%|█████▏    | 1143/2208 [01:02<00:55, 19.16it/s][A
Epoch 2/10:  52%|█████▏    | 1146/2208 [01:02<00:53, 19.71it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  52%|█████▏    | 1152/2208 [01:03<01:18, 13.51it/s][A
Epoch 2/10:  52%|█████▏    | 1155/2208 [01:03<01:09, 15.22it/s][A

Batch 1150: Training loss = 0.4138, Training accuracy = 0.8403, F1 = 0.8396



Epoch 2/10:  52%|█████▏    | 1158/2208 [01:03<01:03, 16.59it/s][A
Epoch 2/10:  53%|█████▎    | 1161/2208 [01:03<00:58, 17.77it/s][A
Epoch 2/10:  53%|█████▎    | 1164/2208 [01:03<00:55, 18.71it/s][A
Epoch 2/10:  53%|█████▎    | 1167/2208 [01:03<00:54, 19.26it/s][A
Epoch 2/10:  53%|█████▎    | 1170/2208 [01:04<00:52, 19.79it/s][A
Epoch 2/10:  53%|█████▎    | 1173/2208 [01:04<00:51, 19.96it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  53%|█████▎    | 1179/2208 [01:04<01:08, 15.07it/s][A

Batch 1175: Training loss = 0.4185, Training accuracy = 0.8408, F1 = 0.8400



Epoch 2/10:  54%|█████▎    | 1182/2208 [01:04<01:01, 16.58it/s][A
Epoch 2/10:  54%|█████▎    | 1185/2208 [01:04<00:57, 17.77it/s][A
Epoch 2/10:  54%|█████▍    | 1188/2208 [01:05<00:54, 18.64it/s][A
Epoch 2/10:  54%|█████▍    | 1191/2208 [01:05<00:52, 19.33it/s][A
Epoch 2/10:  54%|█████▍    | 1194/2208 [01:05<00:51, 19.87it/s][A
Epoch 2/10:  54%|█████▍    | 1197/2208 [01:05<00:49, 20.37it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  54%|█████▍    | 1203/2208 [01:06<01:11, 14.01it/s][A

Batch 1200: Training loss = 0.5043, Training accuracy = 0.8410, F1 = 0.8403



Epoch 2/10:  55%|█████▍    | 1206/2208 [01:06<01:03, 15.70it/s][A
Epoch 2/10:  55%|█████▍    | 1209/2208 [01:06<00:58, 16.97it/s][A
Epoch 2/10:  55%|█████▍    | 1212/2208 [01:06<00:54, 18.13it/s][A
Epoch 2/10:  55%|█████▌    | 1215/2208 [01:06<00:52, 18.97it/s][A
Epoch 2/10:  55%|█████▌    | 1218/2208 [01:06<00:50, 19.74it/s][A
Epoch 2/10:  55%|█████▌    | 1221/2208 [01:06<00:48, 20.23it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  56%|█████▌    | 1227/2208 [01:07<01:10, 13.91it/s][A
Epoch 2/10:  56%|█████▌    | 1230/2208 [01:07<01:02, 15.63it/s][A

Batch 1225: Training loss = 0.3595, Training accuracy = 0.8413, F1 = 0.8406



Epoch 2/10:  56%|█████▌    | 1233/2208 [01:07<00:57, 17.00it/s][A
Epoch 2/10:  56%|█████▌    | 1236/2208 [01:07<00:53, 18.08it/s][A
Epoch 2/10:  56%|█████▌    | 1239/2208 [01:07<00:51, 18.99it/s][A
Epoch 2/10:  56%|█████▋    | 1242/2208 [01:08<00:49, 19.68it/s][A
Epoch 2/10:  56%|█████▋    | 1245/2208 [01:08<00:47, 20.07it/s][A
Epoch 2/10:  57%|█████▋    | 1248/2208 [01:08<00:47, 20.42it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  57%|█████▋    | 1254/2208 [01:08<01:01, 15.60it/s][A

Batch 1250: Training loss = 0.3559, Training accuracy = 0.8417, F1 = 0.8410



Epoch 2/10:  57%|█████▋    | 1257/2208 [01:09<00:56, 16.96it/s][A
Epoch 2/10:  57%|█████▋    | 1260/2208 [01:09<00:52, 18.03it/s][A
Epoch 2/10:  57%|█████▋    | 1263/2208 [01:09<00:49, 18.91it/s][A
Epoch 2/10:  57%|█████▋    | 1266/2208 [01:09<00:47, 19.65it/s][A
Epoch 2/10:  57%|█████▋    | 1269/2208 [01:09<00:46, 20.11it/s][A
Epoch 2/10:  58%|█████▊    | 1272/2208 [01:09<00:45, 20.55it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  58%|█████▊    | 1278/2208 [01:10<01:09, 13.30it/s][A

Batch 1275: Training loss = 0.5891, Training accuracy = 0.8420, F1 = 0.8413



Epoch 2/10:  58%|█████▊    | 1281/2208 [01:10<01:01, 15.05it/s][A
Epoch 2/10:  58%|█████▊    | 1284/2208 [01:10<00:55, 16.57it/s][A
Epoch 2/10:  58%|█████▊    | 1287/2208 [01:10<00:51, 17.83it/s][A
Epoch 2/10:  58%|█████▊    | 1290/2208 [01:10<00:48, 18.76it/s][A
Epoch 2/10:  59%|█████▊    | 1293/2208 [01:11<00:46, 19.57it/s][A
Epoch 2/10:  59%|█████▊    | 1296/2208 [01:11<00:45, 20.09it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  59%|█████▉    | 1302/2208 [01:11<01:04, 14.03it/s][A
Epoch 2/10:  59%|█████▉    | 1305/2208 [01:11<00:57, 15.72it/s][A

Batch 1300: Training loss = 0.5006, Training accuracy = 0.8423, F1 = 0.8416



Epoch 2/10:  59%|█████▉    | 1308/2208 [01:11<00:52, 17.12it/s][A
Epoch 2/10:  59%|█████▉    | 1311/2208 [01:12<00:49, 18.21it/s][A
Epoch 2/10:  60%|█████▉    | 1314/2208 [01:12<00:46, 19.06it/s][A
Epoch 2/10:  60%|█████▉    | 1317/2208 [01:12<00:45, 19.60it/s][A
Epoch 2/10:  60%|█████▉    | 1320/2208 [01:12<00:44, 20.17it/s][A
Epoch 2/10:  60%|█████▉    | 1323/2208 [01:12<00:43, 20.36it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  60%|██████    | 1329/2208 [01:13<00:58, 15.15it/s][A

Batch 1325: Training loss = 0.3761, Training accuracy = 0.8428, F1 = 0.8421



Epoch 2/10:  60%|██████    | 1332/2208 [01:13<00:52, 16.63it/s][A
Epoch 2/10:  60%|██████    | 1335/2208 [01:13<00:49, 17.78it/s][A
Epoch 2/10:  61%|██████    | 1338/2208 [01:13<00:46, 18.72it/s][A
Epoch 2/10:  61%|██████    | 1341/2208 [01:13<00:44, 19.40it/s][A
Epoch 2/10:  61%|██████    | 1344/2208 [01:13<00:43, 19.74it/s][A
Epoch 2/10:  61%|██████    | 1347/2208 [01:14<00:42, 20.16it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  61%|██████▏   | 1353/2208 [01:14<01:04, 13.28it/s][A

Batch 1350: Training loss = 0.4475, Training accuracy = 0.8431, F1 = 0.8425



Epoch 2/10:  61%|██████▏   | 1356/2208 [01:14<00:56, 15.03it/s][A
Epoch 2/10:  62%|██████▏   | 1359/2208 [01:14<00:51, 16.47it/s][A
Epoch 2/10:  62%|██████▏   | 1362/2208 [01:14<00:47, 17.71it/s][A
Epoch 2/10:  62%|██████▏   | 1365/2208 [01:15<00:45, 18.56it/s][A
Epoch 2/10:  62%|██████▏   | 1368/2208 [01:15<00:43, 19.34it/s][A
Epoch 2/10:  62%|██████▏   | 1371/2208 [01:15<00:42, 19.88it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  62%|██████▏   | 1377/2208 [01:16<01:06, 12.54it/s][A
Epoch 2/10:  62%|██████▎   | 1380/2208 [01:16<00:57, 14.35it/s][A

Batch 1375: Training loss = 0.3027, Training accuracy = 0.8434, F1 = 0.8427



Epoch 2/10:  63%|██████▎   | 1383/2208 [01:16<00:51, 15.93it/s][A
Epoch 2/10:  63%|██████▎   | 1386/2208 [01:16<00:47, 17.18it/s][A
Epoch 2/10:  63%|██████▎   | 1389/2208 [01:16<00:44, 18.24it/s][A
Epoch 2/10:  63%|██████▎   | 1392/2208 [01:16<00:42, 19.05it/s][A
Epoch 2/10:  63%|██████▎   | 1395/2208 [01:16<00:41, 19.40it/s][A
Epoch 2/10:  63%|██████▎   | 1398/2208 [01:17<00:40, 19.88it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  64%|██████▎   | 1404/2208 [01:17<00:56, 14.23it/s][A

Batch 1400: Training loss = 0.4348, Training accuracy = 0.8437, F1 = 0.8431



Epoch 2/10:  64%|██████▎   | 1407/2208 [01:17<00:50, 15.80it/s][A
Epoch 2/10:  64%|██████▍   | 1410/2208 [01:17<00:46, 17.01it/s][A
Epoch 2/10:  64%|██████▍   | 1413/2208 [01:18<00:44, 18.04it/s][A
Epoch 2/10:  64%|██████▍   | 1416/2208 [01:18<00:42, 18.77it/s][A
Epoch 2/10:  64%|██████▍   | 1419/2208 [01:18<00:40, 19.28it/s][A
Epoch 2/10:  64%|██████▍   | 1422/2208 [01:18<00:39, 19.78it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  65%|██████▍   | 1428/2208 [01:19<00:59, 13.04it/s][A

Batch 1425: Training loss = 0.3982, Training accuracy = 0.8439, F1 = 0.8433



Epoch 2/10:  65%|██████▍   | 1431/2208 [01:19<00:52, 14.79it/s][A
Epoch 2/10:  65%|██████▍   | 1434/2208 [01:19<00:47, 16.32it/s][A
Epoch 2/10:  65%|██████▌   | 1437/2208 [01:19<00:43, 17.54it/s][A
Epoch 2/10:  65%|██████▌   | 1440/2208 [01:19<00:41, 18.55it/s][A
Epoch 2/10:  65%|██████▌   | 1443/2208 [01:19<00:39, 19.32it/s][A
Epoch 2/10:  65%|██████▌   | 1446/2208 [01:19<00:38, 19.79it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  66%|██████▌   | 1452/2208 [01:20<00:57, 13.12it/s][A
Epoch 2/10:  66%|██████▌   | 1455/2208 [01:20<00:50, 14.93it/s][A

Batch 1450: Training loss = 0.4441, Training accuracy = 0.8443, F1 = 0.8436



Epoch 2/10:  66%|██████▌   | 1458/2208 [01:20<00:45, 16.42it/s][A
Epoch 2/10:  66%|██████▌   | 1461/2208 [01:20<00:42, 17.56it/s][A
Epoch 2/10:  66%|██████▋   | 1464/2208 [01:20<00:40, 18.57it/s][A
Epoch 2/10:  66%|██████▋   | 1467/2208 [01:21<00:38, 19.40it/s][A
Epoch 2/10:  67%|██████▋   | 1470/2208 [01:21<00:37, 19.79it/s][A
Epoch 2/10:  67%|██████▋   | 1473/2208 [01:21<00:36, 20.23it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  67%|██████▋   | 1479/2208 [01:21<00:49, 14.71it/s][A

Batch 1475: Training loss = 0.4217, Training accuracy = 0.8446, F1 = 0.8439



Epoch 2/10:  67%|██████▋   | 1482/2208 [01:22<00:44, 16.22it/s][A
Epoch 2/10:  67%|██████▋   | 1485/2208 [01:22<00:41, 17.50it/s][A
Epoch 2/10:  67%|██████▋   | 1488/2208 [01:22<00:38, 18.56it/s][A
Epoch 2/10:  68%|██████▊   | 1491/2208 [01:22<00:37, 19.20it/s][A
Epoch 2/10:  68%|██████▊   | 1494/2208 [01:22<00:35, 19.85it/s][A
Epoch 2/10:  68%|██████▊   | 1497/2208 [01:22<00:35, 20.29it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  68%|██████▊   | 1503/2208 [01:23<00:54, 12.99it/s][A

Batch 1500: Training loss = 0.5541, Training accuracy = 0.8451, F1 = 0.8444



Epoch 2/10:  68%|██████▊   | 1506/2208 [01:23<00:47, 14.80it/s][A
Epoch 2/10:  68%|██████▊   | 1509/2208 [01:23<00:42, 16.30it/s][A
Epoch 2/10:  68%|██████▊   | 1512/2208 [01:23<00:39, 17.50it/s][A
Epoch 2/10:  69%|██████▊   | 1515/2208 [01:23<00:37, 18.57it/s][A
Epoch 2/10:  69%|██████▉   | 1518/2208 [01:24<00:35, 19.24it/s][A
Epoch 2/10:  69%|██████▉   | 1521/2208 [01:24<00:34, 19.81it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  69%|██████▉   | 1527/2208 [01:24<00:52, 12.99it/s][A
Epoch 2/10:  69%|██████▉   | 1530/2208 [01:24<00:46, 14.74it/s][A

Batch 1525: Training loss = 0.4496, Training accuracy = 0.8456, F1 = 0.8449



Epoch 2/10:  69%|██████▉   | 1533/2208 [01:25<00:41, 16.24it/s][A
Epoch 2/10:  70%|██████▉   | 1536/2208 [01:25<00:38, 17.55it/s][A
Epoch 2/10:  70%|██████▉   | 1539/2208 [01:25<00:36, 18.53it/s][A
Epoch 2/10:  70%|██████▉   | 1542/2208 [01:25<00:34, 19.20it/s][A
Epoch 2/10:  70%|██████▉   | 1545/2208 [01:25<00:33, 19.68it/s][A
Epoch 2/10:  70%|███████   | 1548/2208 [01:25<00:32, 20.06it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  70%|███████   | 1554/2208 [01:26<00:47, 13.87it/s][A

Batch 1550: Training loss = 0.2328, Training accuracy = 0.8459, F1 = 0.8453



Epoch 2/10:  71%|███████   | 1557/2208 [01:26<00:41, 15.51it/s][A
Epoch 2/10:  71%|███████   | 1560/2208 [01:26<00:38, 16.93it/s][A
Epoch 2/10:  71%|███████   | 1563/2208 [01:26<00:35, 18.03it/s][A
Epoch 2/10:  71%|███████   | 1566/2208 [01:26<00:33, 18.92it/s][A
Epoch 2/10:  71%|███████   | 1569/2208 [01:27<00:32, 19.51it/s][A
Epoch 2/10:  71%|███████   | 1572/2208 [01:27<00:31, 19.89it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  71%|███████▏  | 1578/2208 [01:27<00:53, 11.82it/s][A

Batch 1575: Training loss = 0.2912, Training accuracy = 0.8463, F1 = 0.8456



Epoch 2/10:  72%|███████▏  | 1581/2208 [01:28<00:45, 13.65it/s][A
Epoch 2/10:  72%|███████▏  | 1584/2208 [01:28<00:40, 15.28it/s][A
Epoch 2/10:  72%|███████▏  | 1587/2208 [01:28<00:37, 16.69it/s][A
Epoch 2/10:  72%|███████▏  | 1590/2208 [01:28<00:34, 17.85it/s][A
Epoch 2/10:  72%|███████▏  | 1593/2208 [01:28<00:32, 18.76it/s][A
Epoch 2/10:  72%|███████▏  | 1596/2208 [01:28<00:31, 19.37it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  73%|███████▎  | 1602/2208 [01:29<00:51, 11.79it/s][A
Epoch 2/10:  73%|███████▎  | 1605/2208 [01:29<00:44, 13.63it/s][A

Batch 1600: Training loss = 0.4313, Training accuracy = 0.8467, F1 = 0.8460



Epoch 2/10:  73%|███████▎  | 1608/2208 [01:29<00:39, 15.21it/s][A
Epoch 2/10:  73%|███████▎  | 1611/2208 [01:29<00:36, 16.50it/s][A
Epoch 2/10:  73%|███████▎  | 1614/2208 [01:29<00:33, 17.65it/s][A
Epoch 2/10:  73%|███████▎  | 1617/2208 [01:30<00:31, 18.61it/s][A
Epoch 2/10:  73%|███████▎  | 1620/2208 [01:30<00:30, 19.15it/s][A
Epoch 2/10:  74%|███████▎  | 1623/2208 [01:30<00:29, 19.60it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  74%|███████▍  | 1629/2208 [01:31<00:42, 13.60it/s][A

Batch 1625: Training loss = 0.3990, Training accuracy = 0.8469, F1 = 0.8462



Epoch 2/10:  74%|███████▍  | 1632/2208 [01:31<00:37, 15.22it/s][A
Epoch 2/10:  74%|███████▍  | 1635/2208 [01:31<00:34, 16.65it/s][A
Epoch 2/10:  74%|███████▍  | 1638/2208 [01:31<00:32, 17.78it/s][A
Epoch 2/10:  74%|███████▍  | 1641/2208 [01:31<00:30, 18.66it/s][A
Epoch 2/10:  74%|███████▍  | 1644/2208 [01:31<00:31, 17.76it/s][A
Epoch 2/10:  75%|███████▍  | 1647/2208 [01:31<00:29, 18.74it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  75%|███████▍  | 1653/2208 [01:32<00:51, 10.76it/s][A

Batch 1650: Training loss = 0.4244, Training accuracy = 0.8472, F1 = 0.8466



Epoch 2/10:  75%|███████▌  | 1656/2208 [01:32<00:43, 12.69it/s][A
Epoch 2/10:  75%|███████▌  | 1659/2208 [01:32<00:38, 14.42it/s][A
Epoch 2/10:  75%|███████▌  | 1662/2208 [01:33<00:34, 15.97it/s][A
Epoch 2/10:  75%|███████▌  | 1665/2208 [01:33<00:31, 17.31it/s][A
Epoch 2/10:  76%|███████▌  | 1668/2208 [01:33<00:29, 18.40it/s][A
Epoch 2/10:  76%|███████▌  | 1671/2208 [01:33<00:27, 19.20it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  76%|███████▌  | 1677/2208 [01:34<00:46, 11.50it/s][A
Epoch 2/10:  76%|███████▌  | 1680/2208 [01:34<00:39, 13.39it/s][A

Batch 1675: Training loss = 0.3690, Training accuracy = 0.8477, F1 = 0.8470



Epoch 2/10:  76%|███████▌  | 1683/2208 [01:34<00:34, 15.13it/s][A
Epoch 2/10:  76%|███████▋  | 1686/2208 [01:34<00:31, 16.53it/s][A
Epoch 2/10:  76%|███████▋  | 1689/2208 [01:34<00:29, 17.76it/s][A
Epoch 2/10:  77%|███████▋  | 1692/2208 [01:34<00:27, 18.64it/s][A
Epoch 2/10:  77%|███████▋  | 1695/2208 [01:34<00:26, 19.35it/s][A
Epoch 2/10:  77%|███████▋  | 1698/2208 [01:35<00:25, 19.95it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  77%|███████▋  | 1704/2208 [01:35<00:36, 13.70it/s][A

Batch 1700: Training loss = 0.4731, Training accuracy = 0.8480, F1 = 0.8474



Epoch 2/10:  77%|███████▋  | 1707/2208 [01:35<00:32, 15.37it/s][A
Epoch 2/10:  77%|███████▋  | 1710/2208 [01:36<00:29, 16.76it/s][A
Epoch 2/10:  78%|███████▊  | 1713/2208 [01:36<00:27, 17.94it/s][A
Epoch 2/10:  78%|███████▊  | 1716/2208 [01:36<00:26, 18.75it/s][A
Epoch 2/10:  78%|███████▊  | 1719/2208 [01:36<00:25, 19.42it/s][A
Epoch 2/10:  78%|███████▊  | 1722/2208 [01:36<00:24, 19.96it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  78%|███████▊  | 1728/2208 [01:37<00:41, 11.70it/s][A

Batch 1725: Training loss = 0.2537, Training accuracy = 0.8485, F1 = 0.8478



Epoch 2/10:  78%|███████▊  | 1731/2208 [01:37<00:35, 13.57it/s][A
Epoch 2/10:  79%|███████▊  | 1734/2208 [01:37<00:30, 15.30it/s][A
Epoch 2/10:  79%|███████▊  | 1737/2208 [01:37<00:28, 16.72it/s][A
Epoch 2/10:  79%|███████▉  | 1740/2208 [01:37<00:26, 17.88it/s][A
Epoch 2/10:  79%|███████▉  | 1743/2208 [01:37<00:24, 18.79it/s][A
Epoch 2/10:  79%|███████▉  | 1746/2208 [01:38<00:23, 19.56it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  79%|███████▉  | 1752/2208 [01:38<00:40, 11.29it/s][A
Epoch 2/10:  79%|███████▉  | 1755/2208 [01:38<00:34, 13.20it/s][A

Batch 1750: Training loss = 0.5556, Training accuracy = 0.8487, F1 = 0.8481



Epoch 2/10:  80%|███████▉  | 1758/2208 [01:39<00:30, 14.94it/s][A
Epoch 2/10:  80%|███████▉  | 1761/2208 [01:39<00:27, 16.31it/s][A
Epoch 2/10:  80%|███████▉  | 1764/2208 [01:39<00:25, 17.53it/s][A
Epoch 2/10:  80%|████████  | 1767/2208 [01:39<00:23, 18.58it/s][A
Epoch 2/10:  80%|████████  | 1770/2208 [01:39<00:22, 19.21it/s][A
Epoch 2/10:  80%|████████  | 1773/2208 [01:39<00:22, 19.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  81%|████████  | 1779/2208 [01:40<00:31, 13.65it/s][A

Batch 1775: Training loss = 0.4884, Training accuracy = 0.8491, F1 = 0.8485



Epoch 2/10:  81%|████████  | 1782/2208 [01:40<00:27, 15.28it/s][A
Epoch 2/10:  81%|████████  | 1785/2208 [01:40<00:25, 16.69it/s][A
Epoch 2/10:  81%|████████  | 1788/2208 [01:40<00:23, 17.86it/s][A
Epoch 2/10:  81%|████████  | 1791/2208 [01:40<00:22, 18.65it/s][A
Epoch 2/10:  81%|████████▏ | 1794/2208 [01:41<00:21, 19.28it/s][A
Epoch 2/10:  81%|████████▏ | 1797/2208 [01:41<00:20, 19.72it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  82%|████████▏ | 1803/2208 [01:41<00:33, 12.03it/s][A

Batch 1800: Training loss = 0.2896, Training accuracy = 0.8495, F1 = 0.8489



Epoch 2/10:  82%|████████▏ | 1806/2208 [01:41<00:29, 13.85it/s][A
Epoch 2/10:  82%|████████▏ | 1809/2208 [01:42<00:25, 15.46it/s][A
Epoch 2/10:  82%|████████▏ | 1812/2208 [01:42<00:23, 16.81it/s][A
Epoch 2/10:  82%|████████▏ | 1815/2208 [01:42<00:21, 17.90it/s][A
Epoch 2/10:  82%|████████▏ | 1818/2208 [01:42<00:20, 18.79it/s][A
Epoch 2/10:  82%|████████▏ | 1821/2208 [01:42<00:19, 19.42it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  83%|████████▎ | 1827/2208 [01:43<00:33, 11.28it/s][A
Epoch 2/10:  83%|████████▎ | 1830/2208 [01:43<00:28, 13.19it/s][A

Batch 1825: Training loss = 0.2951, Training accuracy = 0.8497, F1 = 0.8490



Epoch 2/10:  83%|████████▎ | 1833/2208 [01:43<00:25, 14.87it/s][A
Epoch 2/10:  83%|████████▎ | 1836/2208 [01:43<00:22, 16.24it/s][A
Epoch 2/10:  83%|████████▎ | 1839/2208 [01:43<00:21, 17.52it/s][A
Epoch 2/10:  83%|████████▎ | 1842/2208 [01:44<00:21, 16.96it/s][A
Epoch 2/10:  84%|████████▎ | 1845/2208 [01:44<00:20, 18.10it/s][A
Epoch 2/10:  84%|████████▎ | 1848/2208 [01:44<00:18, 18.98it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  84%|████████▍ | 1854/2208 [01:45<00:27, 12.66it/s][A

Batch 1850: Training loss = 0.3155, Training accuracy = 0.8499, F1 = 0.8492



Epoch 2/10:  84%|████████▍ | 1857/2208 [01:45<00:24, 14.44it/s][A
Epoch 2/10:  84%|████████▍ | 1860/2208 [01:45<00:21, 15.99it/s][A
Epoch 2/10:  84%|████████▍ | 1863/2208 [01:45<00:20, 17.16it/s][A
Epoch 2/10:  85%|████████▍ | 1866/2208 [01:45<00:18, 18.19it/s][A
Epoch 2/10:  85%|████████▍ | 1869/2208 [01:45<00:17, 19.08it/s][A
Epoch 2/10:  85%|████████▍ | 1872/2208 [01:45<00:17, 19.61it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  85%|████████▌ | 1878/2208 [01:46<00:31, 10.51it/s][A

Batch 1875: Training loss = 0.2554, Training accuracy = 0.8503, F1 = 0.8496



Epoch 2/10:  85%|████████▌ | 1881/2208 [01:46<00:26, 12.38it/s][A
Epoch 2/10:  85%|████████▌ | 1884/2208 [01:46<00:23, 14.08it/s][A
Epoch 2/10:  85%|████████▌ | 1887/2208 [01:47<00:20, 15.58it/s][A
Epoch 2/10:  86%|████████▌ | 1890/2208 [01:47<00:18, 16.94it/s][A
Epoch 2/10:  86%|████████▌ | 1893/2208 [01:47<00:17, 18.09it/s][A
Epoch 2/10:  86%|████████▌ | 1896/2208 [01:47<00:16, 18.93it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  86%|████████▌ | 1902/2208 [01:48<00:26, 11.41it/s][A
Epoch 2/10:  86%|████████▋ | 1905/2208 [01:48<00:22, 13.28it/s][A

Batch 1900: Training loss = 0.3307, Training accuracy = 0.8506, F1 = 0.8499



Epoch 2/10:  86%|████████▋ | 1908/2208 [01:48<00:20, 15.00it/s][A
Epoch 2/10:  87%|████████▋ | 1911/2208 [01:48<00:18, 16.48it/s][A
Epoch 2/10:  87%|████████▋ | 1914/2208 [01:48<00:16, 17.63it/s][A
Epoch 2/10:  87%|████████▋ | 1917/2208 [01:48<00:15, 18.59it/s][A
Epoch 2/10:  87%|████████▋ | 1920/2208 [01:49<00:14, 19.46it/s][A
Epoch 2/10:  87%|████████▋ | 1923/2208 [01:49<00:14, 19.99it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  87%|████████▋ | 1929/2208 [01:49<00:21, 12.85it/s][A

Batch 1925: Training loss = 0.3567, Training accuracy = 0.8509, F1 = 0.8503



Epoch 2/10:  88%|████████▊ | 1932/2208 [01:50<00:18, 14.61it/s][A
Epoch 2/10:  88%|████████▊ | 1935/2208 [01:50<00:16, 16.13it/s][A
Epoch 2/10:  88%|████████▊ | 1938/2208 [01:50<00:15, 17.35it/s][A
Epoch 2/10:  88%|████████▊ | 1941/2208 [01:50<00:14, 18.45it/s][A
Epoch 2/10:  88%|████████▊ | 1944/2208 [01:50<00:13, 19.20it/s][A
Epoch 2/10:  88%|████████▊ | 1947/2208 [01:50<00:13, 19.72it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  88%|████████▊ | 1953/2208 [01:51<00:23, 10.87it/s][A

Batch 1950: Training loss = 0.4440, Training accuracy = 0.8512, F1 = 0.8505



Epoch 2/10:  89%|████████▊ | 1956/2208 [01:51<00:19, 12.77it/s][A
Epoch 2/10:  89%|████████▊ | 1959/2208 [01:51<00:17, 14.55it/s][A
Epoch 2/10:  89%|████████▉ | 1962/2208 [01:51<00:15, 16.11it/s][A
Epoch 2/10:  89%|████████▉ | 1965/2208 [01:52<00:14, 17.30it/s][A
Epoch 2/10:  89%|████████▉ | 1968/2208 [01:52<00:13, 18.28it/s][A
Epoch 2/10:  89%|████████▉ | 1971/2208 [01:52<00:12, 19.04it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  90%|████████▉ | 1977/2208 [01:53<00:22, 10.38it/s][A
Epoch 2/10:  90%|████████▉ | 1980/2208 [01:53<00:18, 12.32it/s][A

Batch 1975: Training loss = 0.3896, Training accuracy = 0.8514, F1 = 0.8508



Epoch 2/10:  90%|████████▉ | 1983/2208 [01:53<00:15, 14.11it/s][A
Epoch 2/10:  90%|████████▉ | 1986/2208 [01:53<00:14, 15.67it/s][A
Epoch 2/10:  90%|█████████ | 1989/2208 [01:53<00:12, 17.07it/s][A
Epoch 2/10:  90%|█████████ | 1992/2208 [01:53<00:11, 18.15it/s][A
Epoch 2/10:  90%|█████████ | 1995/2208 [01:53<00:11, 18.93it/s][A
Epoch 2/10:  90%|█████████ | 1998/2208 [01:54<00:10, 19.66it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  91%|█████████ | 2004/2208 [01:54<00:15, 12.82it/s][A

Batch 2000: Training loss = 0.3720, Training accuracy = 0.8517, F1 = 0.8511



Epoch 2/10:  91%|█████████ | 2007/2208 [01:54<00:13, 14.50it/s][A
Epoch 2/10:  91%|█████████ | 2010/2208 [01:55<00:12, 15.94it/s][A
Epoch 2/10:  91%|█████████ | 2013/2208 [01:55<00:11, 17.16it/s][A
Epoch 2/10:  91%|█████████▏| 2016/2208 [01:55<00:10, 18.20it/s][A
Epoch 2/10:  91%|█████████▏| 2019/2208 [01:55<00:09, 19.07it/s][A
Epoch 2/10:  92%|█████████▏| 2022/2208 [01:55<00:09, 19.59it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  92%|█████████▏| 2028/2208 [01:56<00:16, 11.08it/s][A

Batch 2025: Training loss = 0.4331, Training accuracy = 0.8521, F1 = 0.8515



Epoch 2/10:  92%|█████████▏| 2031/2208 [01:56<00:13, 12.99it/s][A
Epoch 2/10:  92%|█████████▏| 2034/2208 [01:56<00:11, 14.69it/s][A
Epoch 2/10:  92%|█████████▏| 2037/2208 [01:56<00:10, 16.16it/s][A
Epoch 2/10:  92%|█████████▏| 2040/2208 [01:56<00:09, 17.40it/s][A
Epoch 2/10:  93%|█████████▎| 2043/2208 [01:56<00:08, 18.39it/s][A
Epoch 2/10:  93%|█████████▎| 2046/2208 [01:57<00:08, 19.19it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  93%|█████████▎| 2052/2208 [01:57<00:14, 10.83it/s][A
Epoch 2/10:  93%|█████████▎| 2055/2208 [01:57<00:12, 12.75it/s][A

Batch 2050: Training loss = 0.3000, Training accuracy = 0.8524, F1 = 0.8518



Epoch 2/10:  93%|█████████▎| 2058/2208 [01:58<00:10, 14.50it/s][A
Epoch 2/10:  93%|█████████▎| 2061/2208 [01:58<00:09, 16.04it/s][A
Epoch 2/10:  93%|█████████▎| 2064/2208 [01:58<00:08, 17.29it/s][A
Epoch 2/10:  94%|█████████▎| 2067/2208 [01:58<00:08, 16.90it/s][A
Epoch 2/10:  94%|█████████▍| 2070/2208 [01:58<00:07, 17.91it/s][A
Epoch 2/10:  94%|█████████▍| 2073/2208 [01:58<00:07, 18.62it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  94%|█████████▍| 2079/2208 [01:59<00:11, 11.31it/s][A

Batch 2075: Training loss = 0.2639, Training accuracy = 0.8527, F1 = 0.8521



Epoch 2/10:  94%|█████████▍| 2082/2208 [01:59<00:09, 13.14it/s][A
Epoch 2/10:  94%|█████████▍| 2085/2208 [01:59<00:08, 14.77it/s][A
Epoch 2/10:  95%|█████████▍| 2088/2208 [02:00<00:07, 16.23it/s][A
Epoch 2/10:  95%|█████████▍| 2091/2208 [02:00<00:06, 17.07it/s][A
Epoch 2/10:  95%|█████████▍| 2094/2208 [02:00<00:06, 18.17it/s][A
Epoch 2/10:  95%|█████████▍| 2097/2208 [02:00<00:06, 18.35it/s][A
Epoch 2/10:  95%|█████████▌| 2099/2208 [02:00<00:05, 18.23it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  95%|█████████▌| 2104/2208 [02:01<00:09, 10.62it/s][A

Batch 2100: Training loss = 0.3418, Training accuracy = 0.8529, F1 = 0.8523



Epoch 2/10:  95%|█████████▌| 2107/2208 [02:01<00:07, 12.72it/s][A
Epoch 2/10:  96%|█████████▌| 2110/2208 [02:01<00:06, 14.60it/s][A
Epoch 2/10:  96%|█████████▌| 2113/2208 [02:01<00:05, 16.20it/s][A
Epoch 2/10:  96%|█████████▌| 2116/2208 [02:02<00:05, 17.35it/s][A
Epoch 2/10:  96%|█████████▌| 2119/2208 [02:02<00:04, 18.35it/s][A
Epoch 2/10:  96%|█████████▌| 2122/2208 [02:02<00:04, 19.00it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  96%|█████████▋| 2127/2208 [02:03<00:08,  9.47it/s][A
Epoch 2/10:  96%|█████████▋| 2130/2208 [02:03<00:06, 11.58it/s][A

Batch 2125: Training loss = 0.4283, Training accuracy = 0.8530, F1 = 0.8524



Epoch 2/10:  97%|█████████▋| 2133/2208 [02:03<00:05, 13.59it/s][A
Epoch 2/10:  97%|█████████▋| 2136/2208 [02:03<00:04, 15.27it/s][A
Epoch 2/10:  97%|█████████▋| 2139/2208 [02:03<00:04, 16.82it/s][A
Epoch 2/10:  97%|█████████▋| 2142/2208 [02:03<00:03, 17.96it/s][A
Epoch 2/10:  97%|█████████▋| 2145/2208 [02:03<00:03, 18.69it/s][A
Epoch 2/10:  97%|█████████▋| 2148/2208 [02:04<00:03, 19.30it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  98%|█████████▊| 2154/2208 [02:04<00:04, 12.41it/s][A

Batch 2150: Training loss = 0.3820, Training accuracy = 0.8534, F1 = 0.8527



Epoch 2/10:  98%|█████████▊| 2157/2208 [02:04<00:03, 14.22it/s][A
Epoch 2/10:  98%|█████████▊| 2160/2208 [02:05<00:03, 15.82it/s][A
Epoch 2/10:  98%|█████████▊| 2163/2208 [02:05<00:02, 17.20it/s][A
Epoch 2/10:  98%|█████████▊| 2166/2208 [02:05<00:02, 18.22it/s][A
Epoch 2/10:  98%|█████████▊| 2169/2208 [02:05<00:02, 19.00it/s][A
Epoch 2/10:  98%|█████████▊| 2172/2208 [02:05<00:01, 19.61it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10:  99%|█████████▊| 2178/2208 [02:06<00:02, 10.39it/s][A

Batch 2175: Training loss = 0.4259, Training accuracy = 0.8536, F1 = 0.8529



Epoch 2/10:  99%|█████████▉| 2181/2208 [02:06<00:02, 12.33it/s][A
Epoch 2/10:  99%|█████████▉| 2184/2208 [02:06<00:01, 14.14it/s][A
Epoch 2/10:  99%|█████████▉| 2187/2208 [02:06<00:01, 15.74it/s][A
Epoch 2/10:  99%|█████████▉| 2190/2208 [02:06<00:01, 17.03it/s][A
Epoch 2/10:  99%|█████████▉| 2193/2208 [02:07<00:00, 18.08it/s][A
Epoch 2/10:  99%|█████████▉| 2196/2208 [02:07<00:00, 18.91it/s][A
  with torch.cuda.amp.autocast():

Epoch 2/10: 100%|█████████▉| 2202/2208 [02:07<00:00, 11.12it/s][A
Epoch 2/10: 100%|█████████▉| 2205/2208 [02:08<00:00, 13.07it/s][A

Batch 2200: Training loss = 0.5879, Training accuracy = 0.8538, F1 = 0.8531



Epoch 2/10: 100%|██████████| 2208/2208 [02:08<00:00, 14.90it/s][A
                                                               [A


Epoch 2 Training Metrics:
Loss: 0.4354
Accuracy: 0.8538
F1 Score: 0.8532
Precision: 0.8528
Recall: 0.8538

Starting validation...



Validation:   0%|          | 0/552 [00:00<?, ?it/s][A
Validation:   0%|          | 1/552 [00:01<15:07,  1.65s/it][A
Validation:   1%|          | 3/552 [00:01<04:18,  2.12it/s][A
Validation:   1%|          | 5/552 [00:01<02:20,  3.88it/s][A
Validation:   1%|▏         | 7/552 [00:01<01:32,  5.86it/s][A
Validation:   2%|▏         | 9/552 [00:02<01:08,  7.89it/s][A
Validation:   2%|▏         | 11/552 [00:02<00:54,  9.92it/s][A
Validation:   2%|▏         | 13/552 [00:02<00:45, 11.75it/s][A
Validation:   3%|▎         | 15/552 [00:02<00:40, 13.37it/s][A
Validation:   3%|▎         | 17/552 [00:02<00:36, 14.68it/s][A
Validation:   3%|▎         | 19/552 [00:02<00:33, 15.83it/s][A
Validation:   4%|▍         | 21/552 [00:02<00:32, 16.58it/s][A
Validation:   4%|▍         | 23/552 [00:02<00:30, 17.10it/s][A
Validation:   5%|▍         | 25/552 [00:02<00:29, 17.62it/s][A
Validation:   5%|▍         | 27/552 [00:03<00:29, 17.96it/s][A
Validation:   5%|▌         | 29/552 [00:03<00:28, 18.


Epoch 2 Validation Metrics:
Loss: 0.2860
Accuracy: 0.9009
F1 Score: 0.9002
Precision: 0.9073
Recall: 0.9009


Training epochs:  20%|██        | 2/10 [05:21<21:25, 160.63s/it]


Starting epoch 3/10



  with torch.cuda.amp.autocast():

  with torch.cuda.amp.autocast():

Epoch 3/10:   0%|          | 3/2208 [00:01<17:16,  2.13it/s]  [A

Batch 0: Training loss = 0.5103, Training accuracy = 0.8828, F1 = 0.8737



Epoch 3/10:   0%|          | 6/2208 [00:01<07:44,  4.75it/s][A
Epoch 3/10:   0%|          | 9/2208 [00:02<04:55,  7.44it/s][A
Epoch 3/10:   1%|          | 12/2208 [00:02<03:39, 10.00it/s][A
Epoch 3/10:   1%|          | 14/2208 [00:02<03:23, 10.79it/s][A
Epoch 3/10:   1%|          | 17/2208 [00:02<02:56, 12.44it/s][A
Epoch 3/10:   1%|          | 20/2208 [00:02<02:30, 14.49it/s][A
Epoch 3/10:   1%|          | 23/2208 [00:02<02:14, 16.22it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:   1%|▏         | 29/2208 [00:03<02:00, 18.01it/s][A

Batch 25: Training loss = 0.2590, Training accuracy = 0.8762, F1 = 0.8749



Epoch 3/10:   1%|▏         | 32/2208 [00:03<01:55, 18.76it/s][A
Epoch 3/10:   2%|▏         | 35/2208 [00:03<01:52, 19.40it/s][A
Epoch 3/10:   2%|▏         | 38/2208 [00:03<01:59, 18.18it/s][A
Epoch 3/10:   2%|▏         | 41/2208 [00:03<01:53, 19.03it/s][A
Epoch 3/10:   2%|▏         | 43/2208 [00:03<01:52, 19.20it/s][A
Epoch 3/10:   2%|▏         | 46/2208 [00:03<01:51, 19.33it/s][A
Epoch 3/10:   2%|▏         | 48/2208 [00:04<01:51, 19.33it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:   2%|▏         | 52/2208 [00:04<01:55, 18.70it/s][A
Epoch 3/10:   2%|▏         | 55/2208 [00:04<01:49, 19.62it/s][A

Batch 50: Training loss = 0.2269, Training accuracy = 0.8822, F1 = 0.8814



Epoch 3/10:   3%|▎         | 58/2208 [00:04<01:48, 19.77it/s][A
Epoch 3/10:   3%|▎         | 61/2208 [00:04<01:46, 20.22it/s][A
Epoch 3/10:   3%|▎         | 64/2208 [00:04<01:50, 19.36it/s][A
Epoch 3/10:   3%|▎         | 66/2208 [00:05<01:52, 19.02it/s][A
Epoch 3/10:   3%|▎         | 69/2208 [00:05<01:48, 19.72it/s][A
Epoch 3/10:   3%|▎         | 71/2208 [00:05<01:53, 18.83it/s][A
Epoch 3/10:   3%|▎         | 74/2208 [00:05<01:49, 19.55it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:   4%|▎         | 79/2208 [00:05<01:47, 19.77it/s][A

Batch 75: Training loss = 0.4119, Training accuracy = 0.8817, F1 = 0.8806



Epoch 3/10:   4%|▎         | 82/2208 [00:05<01:45, 20.08it/s][A
Epoch 3/10:   4%|▍         | 85/2208 [00:05<01:44, 20.40it/s][A
Epoch 3/10:   4%|▍         | 88/2208 [00:06<01:42, 20.62it/s][A
Epoch 3/10:   4%|▍         | 91/2208 [00:06<01:44, 20.31it/s][A
Epoch 3/10:   4%|▍         | 94/2208 [00:06<02:03, 17.09it/s][A
Epoch 3/10:   4%|▍         | 97/2208 [00:06<01:55, 18.23it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:   5%|▍         | 102/2208 [00:06<01:56, 18.02it/s][A
Epoch 3/10:   5%|▍         | 105/2208 [00:07<01:50, 18.96it/s][A

Batch 100: Training loss = 0.2078, Training accuracy = 0.8817, F1 = 0.8812



Epoch 3/10:   5%|▍         | 108/2208 [00:07<01:46, 19.80it/s][A
Epoch 3/10:   5%|▌         | 111/2208 [00:07<01:43, 20.26it/s][A
Epoch 3/10:   5%|▌         | 114/2208 [00:07<01:41, 20.67it/s][A
Epoch 3/10:   5%|▌         | 117/2208 [00:07<01:40, 20.76it/s][A
Epoch 3/10:   5%|▌         | 120/2208 [00:07<01:39, 20.89it/s][A
Epoch 3/10:   6%|▌         | 123/2208 [00:07<01:38, 21.08it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:   6%|▌         | 129/2208 [00:08<01:41, 20.42it/s][A

Batch 125: Training loss = 0.3210, Training accuracy = 0.8819, F1 = 0.8812



Epoch 3/10:   6%|▌         | 132/2208 [00:08<01:40, 20.69it/s][A
Epoch 3/10:   6%|▌         | 135/2208 [00:08<01:39, 20.84it/s][A
Epoch 3/10:   6%|▋         | 138/2208 [00:08<01:38, 21.01it/s][A
Epoch 3/10:   6%|▋         | 141/2208 [00:08<01:38, 21.02it/s][A
Epoch 3/10:   7%|▋         | 144/2208 [00:08<01:37, 21.17it/s][A
Epoch 3/10:   7%|▋         | 147/2208 [00:09<01:37, 21.05it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:   7%|▋         | 153/2208 [00:09<01:47, 19.11it/s][A

Batch 150: Training loss = 0.3314, Training accuracy = 0.8836, F1 = 0.8828



Epoch 3/10:   7%|▋         | 156/2208 [00:09<01:44, 19.56it/s][A
Epoch 3/10:   7%|▋         | 159/2208 [00:09<01:42, 20.04it/s][A
Epoch 3/10:   7%|▋         | 162/2208 [00:09<01:39, 20.51it/s][A
Epoch 3/10:   7%|▋         | 165/2208 [00:09<01:38, 20.80it/s][A
Epoch 3/10:   8%|▊         | 168/2208 [00:10<01:37, 20.92it/s][A
Epoch 3/10:   8%|▊         | 171/2208 [00:10<01:37, 20.79it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:   8%|▊         | 177/2208 [00:10<01:44, 19.50it/s][A
Epoch 3/10:   8%|▊         | 180/2208 [00:10<01:42, 19.82it/s][A

Batch 175: Training loss = 0.2230, Training accuracy = 0.8834, F1 = 0.8827



Epoch 3/10:   8%|▊         | 183/2208 [00:10<01:40, 20.18it/s][A
Epoch 3/10:   8%|▊         | 186/2208 [00:10<01:40, 20.15it/s][A
Epoch 3/10:   9%|▊         | 189/2208 [00:11<01:43, 19.54it/s][A
Epoch 3/10:   9%|▊         | 191/2208 [00:11<01:54, 17.66it/s][A
Epoch 3/10:   9%|▊         | 193/2208 [00:11<01:52, 17.87it/s][A
Epoch 3/10:   9%|▉         | 196/2208 [00:11<01:46, 18.94it/s][A
Epoch 3/10:   9%|▉         | 198/2208 [00:11<01:47, 18.76it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:   9%|▉         | 203/2208 [00:11<01:58, 16.96it/s][A

Batch 200: Training loss = 0.3179, Training accuracy = 0.8832, F1 = 0.8826



Epoch 3/10:   9%|▉         | 206/2208 [00:12<01:51, 17.90it/s][A
Epoch 3/10:   9%|▉         | 209/2208 [00:12<01:45, 18.87it/s][A
Epoch 3/10:  10%|▉         | 211/2208 [00:12<01:58, 16.87it/s][A
Epoch 3/10:  10%|▉         | 214/2208 [00:12<01:50, 18.11it/s][A
Epoch 3/10:  10%|▉         | 217/2208 [00:12<01:45, 18.91it/s][A
Epoch 3/10:  10%|▉         | 219/2208 [00:12<01:46, 18.70it/s][A
Epoch 3/10:  10%|█         | 222/2208 [00:13<01:53, 17.47it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  10%|█         | 227/2208 [00:13<01:58, 16.75it/s][A
Epoch 3/10:  10%|█         | 230/2208 [00:13<01:49, 18.03it/s][A

Batch 225: Training loss = 0.3967, Training accuracy = 0.8839, F1 = 0.8833



Epoch 3/10:  11%|█         | 233/2208 [00:13<01:44, 18.94it/s][A
Epoch 3/10:  11%|█         | 236/2208 [00:13<01:40, 19.56it/s][A
Epoch 3/10:  11%|█         | 238/2208 [00:13<01:47, 18.30it/s][A
Epoch 3/10:  11%|█         | 241/2208 [00:14<01:42, 19.15it/s][A
Epoch 3/10:  11%|█         | 243/2208 [00:14<01:49, 17.94it/s][A
Epoch 3/10:  11%|█         | 245/2208 [00:14<01:49, 17.91it/s][A
Epoch 3/10:  11%|█         | 247/2208 [00:14<01:51, 17.63it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  11%|█▏        | 252/2208 [00:14<02:08, 15.21it/s][A
Epoch 3/10:  12%|█▏        | 254/2208 [00:14<02:05, 15.56it/s][A

Batch 250: Training loss = 0.5448, Training accuracy = 0.8831, F1 = 0.8826



Epoch 3/10:  12%|█▏        | 257/2208 [00:15<01:53, 17.19it/s][A
Epoch 3/10:  12%|█▏        | 260/2208 [00:15<01:46, 18.30it/s][A
Epoch 3/10:  12%|█▏        | 263/2208 [00:15<01:41, 19.11it/s][A
Epoch 3/10:  12%|█▏        | 266/2208 [00:15<01:39, 19.61it/s][A
Epoch 3/10:  12%|█▏        | 269/2208 [00:15<01:37, 19.93it/s][A
Epoch 3/10:  12%|█▏        | 272/2208 [00:15<01:36, 20.14it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  13%|█▎        | 277/2208 [00:16<01:48, 17.86it/s][A
Epoch 3/10:  13%|█▎        | 280/2208 [00:16<01:42, 18.83it/s][A

Batch 275: Training loss = 0.2512, Training accuracy = 0.8830, F1 = 0.8825



Epoch 3/10:  13%|█▎        | 283/2208 [00:16<01:44, 18.50it/s][A
Epoch 3/10:  13%|█▎        | 285/2208 [00:16<01:42, 18.82it/s][A
Epoch 3/10:  13%|█▎        | 287/2208 [00:16<01:42, 18.76it/s][A
Epoch 3/10:  13%|█▎        | 290/2208 [00:16<01:38, 19.46it/s][A
Epoch 3/10:  13%|█▎        | 292/2208 [00:16<01:47, 17.79it/s][A
Epoch 3/10:  13%|█▎        | 295/2208 [00:17<01:52, 17.06it/s][A
Epoch 3/10:  13%|█▎        | 298/2208 [00:17<01:44, 18.20it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  14%|█▎        | 302/2208 [00:17<01:59, 15.92it/s][A
Epoch 3/10:  14%|█▍        | 304/2208 [00:17<02:05, 15.11it/s][A

Batch 300: Training loss = 0.2417, Training accuracy = 0.8836, F1 = 0.8832



Epoch 3/10:  14%|█▍        | 307/2208 [00:17<01:52, 16.88it/s][A
Epoch 3/10:  14%|█▍        | 309/2208 [00:17<01:49, 17.27it/s][A
Epoch 3/10:  14%|█▍        | 312/2208 [00:18<01:51, 16.99it/s][A
Epoch 3/10:  14%|█▍        | 315/2208 [00:18<01:44, 18.18it/s][A
Epoch 3/10:  14%|█▍        | 317/2208 [00:18<01:43, 18.25it/s][A
Epoch 3/10:  14%|█▍        | 320/2208 [00:18<01:38, 19.18it/s][A
Epoch 3/10:  15%|█▍        | 322/2208 [00:18<01:42, 18.33it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  15%|█▍        | 327/2208 [00:18<01:51, 16.90it/s][A
Epoch 3/10:  15%|█▍        | 330/2208 [00:19<01:43, 18.16it/s][A

Batch 325: Training loss = 0.3472, Training accuracy = 0.8837, F1 = 0.8833



Epoch 3/10:  15%|█▌        | 333/2208 [00:19<01:38, 19.02it/s][A
Epoch 3/10:  15%|█▌        | 336/2208 [00:19<01:35, 19.69it/s][A
Epoch 3/10:  15%|█▌        | 339/2208 [00:19<01:32, 20.14it/s][A
Epoch 3/10:  15%|█▌        | 342/2208 [00:19<01:30, 20.52it/s][A
Epoch 3/10:  16%|█▌        | 345/2208 [00:19<01:29, 20.77it/s][A
Epoch 3/10:  16%|█▌        | 348/2208 [00:19<01:28, 20.93it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  16%|█▌        | 354/2208 [00:20<01:35, 19.37it/s][A

Batch 350: Training loss = 0.4278, Training accuracy = 0.8837, F1 = 0.8833



Epoch 3/10:  16%|█▌        | 357/2208 [00:20<01:33, 19.81it/s][A
Epoch 3/10:  16%|█▋        | 360/2208 [00:20<01:31, 20.29it/s][A
Epoch 3/10:  16%|█▋        | 363/2208 [00:20<01:30, 20.49it/s][A
Epoch 3/10:  17%|█▋        | 366/2208 [00:20<01:28, 20.72it/s][A
Epoch 3/10:  17%|█▋        | 369/2208 [00:20<01:27, 20.99it/s][A
Epoch 3/10:  17%|█▋        | 372/2208 [00:21<01:27, 21.00it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  17%|█▋        | 378/2208 [00:21<01:44, 17.56it/s][A

Batch 375: Training loss = 0.5070, Training accuracy = 0.8838, F1 = 0.8833



Epoch 3/10:  17%|█▋        | 381/2208 [00:21<01:39, 18.42it/s][A
Epoch 3/10:  17%|█▋        | 384/2208 [00:21<01:35, 19.17it/s][A
Epoch 3/10:  18%|█▊        | 387/2208 [00:21<01:32, 19.74it/s][A
Epoch 3/10:  18%|█▊        | 390/2208 [00:21<01:30, 20.11it/s][A
Epoch 3/10:  18%|█▊        | 393/2208 [00:22<01:28, 20.51it/s][A
Epoch 3/10:  18%|█▊        | 396/2208 [00:22<01:27, 20.82it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  18%|█▊        | 402/2208 [00:22<01:40, 18.04it/s][A
Epoch 3/10:  18%|█▊        | 405/2208 [00:22<01:35, 18.90it/s][A

Batch 400: Training loss = 0.3213, Training accuracy = 0.8836, F1 = 0.8832



Epoch 3/10:  18%|█▊        | 408/2208 [00:22<01:32, 19.55it/s][A
Epoch 3/10:  19%|█▊        | 411/2208 [00:23<01:29, 20.12it/s][A
Epoch 3/10:  19%|█▉        | 414/2208 [00:23<01:28, 20.31it/s][A
Epoch 3/10:  19%|█▉        | 417/2208 [00:23<01:26, 20.64it/s][A
Epoch 3/10:  19%|█▉        | 420/2208 [00:23<01:26, 20.72it/s][A
Epoch 3/10:  19%|█▉        | 423/2208 [00:23<01:25, 20.93it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  19%|█▉        | 429/2208 [00:24<01:36, 18.50it/s][A

Batch 425: Training loss = 0.3402, Training accuracy = 0.8832, F1 = 0.8828



Epoch 3/10:  20%|█▉        | 432/2208 [00:24<01:31, 19.33it/s][A
Epoch 3/10:  20%|█▉        | 435/2208 [00:24<01:28, 19.96it/s][A
Epoch 3/10:  20%|█▉        | 438/2208 [00:24<01:27, 20.31it/s][A
Epoch 3/10:  20%|█▉        | 441/2208 [00:24<01:26, 20.32it/s][A
Epoch 3/10:  20%|██        | 444/2208 [00:24<01:25, 20.52it/s][A
Epoch 3/10:  20%|██        | 447/2208 [00:24<01:25, 20.57it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  21%|██        | 453/2208 [00:25<01:41, 17.27it/s][A

Batch 450: Training loss = 0.3639, Training accuracy = 0.8834, F1 = 0.8830



Epoch 3/10:  21%|██        | 456/2208 [00:25<01:35, 18.35it/s][A
Epoch 3/10:  21%|██        | 459/2208 [00:25<01:31, 19.20it/s][A
Epoch 3/10:  21%|██        | 462/2208 [00:25<01:28, 19.71it/s][A
Epoch 3/10:  21%|██        | 465/2208 [00:25<01:26, 20.21it/s][A
Epoch 3/10:  21%|██        | 468/2208 [00:25<01:24, 20.53it/s][A
Epoch 3/10:  21%|██▏       | 471/2208 [00:26<01:23, 20.71it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  22%|██▏       | 477/2208 [00:26<01:40, 17.16it/s][A
Epoch 3/10:  22%|██▏       | 480/2208 [00:26<01:34, 18.24it/s][A

Batch 475: Training loss = 0.2787, Training accuracy = 0.8833, F1 = 0.8828



Epoch 3/10:  22%|██▏       | 483/2208 [00:26<01:30, 19.06it/s][A
Epoch 3/10:  22%|██▏       | 486/2208 [00:26<01:27, 19.66it/s][A
Epoch 3/10:  22%|██▏       | 489/2208 [00:27<01:24, 20.23it/s][A
Epoch 3/10:  22%|██▏       | 492/2208 [00:27<01:23, 20.52it/s][A
Epoch 3/10:  22%|██▏       | 495/2208 [00:27<01:22, 20.70it/s][A
Epoch 3/10:  23%|██▎       | 498/2208 [00:27<01:23, 20.48it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  23%|██▎       | 504/2208 [00:27<01:37, 17.51it/s][A

Batch 500: Training loss = 0.2375, Training accuracy = 0.8834, F1 = 0.8830



Epoch 3/10:  23%|██▎       | 507/2208 [00:28<01:31, 18.50it/s][A
Epoch 3/10:  23%|██▎       | 510/2208 [00:28<01:27, 19.30it/s][A
Epoch 3/10:  23%|██▎       | 513/2208 [00:28<01:25, 19.88it/s][A
Epoch 3/10:  23%|██▎       | 516/2208 [00:28<01:25, 19.91it/s][A
Epoch 3/10:  24%|██▎       | 519/2208 [00:28<01:29, 18.84it/s][A
Epoch 3/10:  24%|██▎       | 521/2208 [00:28<01:28, 18.98it/s][A
Epoch 3/10:  24%|██▎       | 523/2208 [00:28<01:37, 17.20it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  24%|██▍       | 529/2208 [00:29<01:42, 16.39it/s][A

Batch 525: Training loss = 0.2010, Training accuracy = 0.8832, F1 = 0.8828



Epoch 3/10:  24%|██▍       | 532/2208 [00:29<01:35, 17.62it/s][A
Epoch 3/10:  24%|██▍       | 535/2208 [00:29<01:30, 18.52it/s][A
Epoch 3/10:  24%|██▍       | 538/2208 [00:29<01:26, 19.31it/s][A
Epoch 3/10:  24%|██▍       | 540/2208 [00:29<01:25, 19.43it/s][A
Epoch 3/10:  25%|██▍       | 543/2208 [00:29<01:23, 19.89it/s][A
Epoch 3/10:  25%|██▍       | 546/2208 [00:30<01:21, 20.34it/s][A
Epoch 3/10:  25%|██▍       | 549/2208 [00:30<01:41, 16.42it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  25%|██▌       | 554/2208 [00:30<01:46, 15.49it/s][A

Batch 550: Training loss = 0.4860, Training accuracy = 0.8836, F1 = 0.8833



Epoch 3/10:  25%|██▌       | 557/2208 [00:30<01:37, 16.99it/s][A
Epoch 3/10:  25%|██▌       | 560/2208 [00:31<01:30, 18.11it/s][A
Epoch 3/10:  25%|██▌       | 562/2208 [00:31<01:31, 17.94it/s][A
Epoch 3/10:  26%|██▌       | 565/2208 [00:31<01:27, 18.85it/s][A
Epoch 3/10:  26%|██▌       | 568/2208 [00:31<01:23, 19.61it/s][A
Epoch 3/10:  26%|██▌       | 570/2208 [00:31<01:30, 18.19it/s][A
Epoch 3/10:  26%|██▌       | 573/2208 [00:31<01:25, 19.11it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  26%|██▌       | 577/2208 [00:32<01:52, 14.53it/s][A
Epoch 3/10:  26%|██▋       | 580/2208 [00:32<01:39, 16.37it/s][A

Batch 575: Training loss = 0.4705, Training accuracy = 0.8838, F1 = 0.8834



Epoch 3/10:  26%|██▋       | 582/2208 [00:32<01:34, 17.12it/s][A
Epoch 3/10:  26%|██▋       | 585/2208 [00:32<01:28, 18.35it/s][A
Epoch 3/10:  27%|██▋       | 588/2208 [00:32<01:24, 19.09it/s][A
Epoch 3/10:  27%|██▋       | 591/2208 [00:32<01:22, 19.64it/s][A
Epoch 3/10:  27%|██▋       | 594/2208 [00:32<01:20, 20.16it/s][A
Epoch 3/10:  27%|██▋       | 597/2208 [00:32<01:18, 20.44it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  27%|██▋       | 603/2208 [00:33<01:33, 17.21it/s][A

Batch 600: Training loss = 0.5209, Training accuracy = 0.8841, F1 = 0.8837



Epoch 3/10:  27%|██▋       | 606/2208 [00:33<01:27, 18.31it/s][A
Epoch 3/10:  28%|██▊       | 609/2208 [00:33<01:23, 19.20it/s][A
Epoch 3/10:  28%|██▊       | 612/2208 [00:33<01:20, 19.83it/s][A
Epoch 3/10:  28%|██▊       | 615/2208 [00:33<01:19, 20.16it/s][A
Epoch 3/10:  28%|██▊       | 618/2208 [00:34<01:17, 20.56it/s][A
Epoch 3/10:  28%|██▊       | 621/2208 [00:34<01:16, 20.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  28%|██▊       | 627/2208 [00:34<01:32, 17.17it/s][A
Epoch 3/10:  29%|██▊       | 630/2208 [00:34<01:26, 18.32it/s][A

Batch 625: Training loss = 0.3837, Training accuracy = 0.8841, F1 = 0.8837



Epoch 3/10:  29%|██▊       | 633/2208 [00:34<01:22, 19.07it/s][A
Epoch 3/10:  29%|██▉       | 636/2208 [00:35<01:20, 19.57it/s][A
Epoch 3/10:  29%|██▉       | 639/2208 [00:35<01:18, 19.94it/s][A
Epoch 3/10:  29%|██▉       | 642/2208 [00:35<01:17, 20.33it/s][A
Epoch 3/10:  29%|██▉       | 645/2208 [00:35<01:15, 20.68it/s][A
Epoch 3/10:  29%|██▉       | 648/2208 [00:35<01:15, 20.70it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  30%|██▉       | 654/2208 [00:35<01:27, 17.83it/s][A

Batch 650: Training loss = 0.3251, Training accuracy = 0.8845, F1 = 0.8841



Epoch 3/10:  30%|██▉       | 657/2208 [00:36<01:22, 18.76it/s][A
Epoch 3/10:  30%|██▉       | 660/2208 [00:36<01:19, 19.37it/s][A
Epoch 3/10:  30%|███       | 663/2208 [00:36<01:17, 19.94it/s][A
Epoch 3/10:  30%|███       | 666/2208 [00:36<01:16, 20.25it/s][A
Epoch 3/10:  30%|███       | 669/2208 [00:36<01:15, 20.43it/s][A
Epoch 3/10:  30%|███       | 672/2208 [00:36<01:14, 20.52it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  31%|███       | 678/2208 [00:37<01:31, 16.76it/s][A

Batch 675: Training loss = 0.3136, Training accuracy = 0.8849, F1 = 0.8846



Epoch 3/10:  31%|███       | 681/2208 [00:37<01:25, 17.95it/s][A
Epoch 3/10:  31%|███       | 684/2208 [00:37<01:20, 18.85it/s][A
Epoch 3/10:  31%|███       | 687/2208 [00:37<01:17, 19.51it/s][A
Epoch 3/10:  31%|███▏      | 690/2208 [00:37<01:15, 20.02it/s][A
Epoch 3/10:  31%|███▏      | 693/2208 [00:37<01:14, 20.33it/s][A
Epoch 3/10:  32%|███▏      | 696/2208 [00:38<01:13, 20.64it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  32%|███▏      | 702/2208 [00:38<01:30, 16.73it/s][A
Epoch 3/10:  32%|███▏      | 705/2208 [00:38<01:23, 17.96it/s][A

Batch 700: Training loss = 0.3781, Training accuracy = 0.8854, F1 = 0.8850



Epoch 3/10:  32%|███▏      | 708/2208 [00:38<01:19, 18.96it/s][A
Epoch 3/10:  32%|███▏      | 711/2208 [00:38<01:16, 19.59it/s][A
Epoch 3/10:  32%|███▏      | 714/2208 [00:39<01:14, 20.07it/s][A
Epoch 3/10:  32%|███▏      | 717/2208 [00:39<01:13, 20.33it/s][A
Epoch 3/10:  33%|███▎      | 720/2208 [00:39<01:14, 19.95it/s][A
Epoch 3/10:  33%|███▎      | 723/2208 [00:39<01:12, 20.40it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  33%|███▎      | 729/2208 [00:39<01:23, 17.67it/s][A

Batch 725: Training loss = 0.3715, Training accuracy = 0.8856, F1 = 0.8853



Epoch 3/10:  33%|███▎      | 732/2208 [00:40<01:19, 18.67it/s][A
Epoch 3/10:  33%|███▎      | 735/2208 [00:40<01:15, 19.42it/s][A
Epoch 3/10:  33%|███▎      | 738/2208 [00:40<01:13, 19.93it/s][A
Epoch 3/10:  34%|███▎      | 741/2208 [00:40<01:12, 20.34it/s][A
Epoch 3/10:  34%|███▎      | 744/2208 [00:40<01:10, 20.74it/s][A
Epoch 3/10:  34%|███▍      | 747/2208 [00:40<01:09, 20.91it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  34%|███▍      | 753/2208 [00:41<01:30, 16.12it/s][A

Batch 750: Training loss = 0.4625, Training accuracy = 0.8858, F1 = 0.8854



Epoch 3/10:  34%|███▍      | 756/2208 [00:41<01:23, 17.44it/s][A
Epoch 3/10:  34%|███▍      | 759/2208 [00:41<01:18, 18.44it/s][A
Epoch 3/10:  35%|███▍      | 762/2208 [00:41<01:15, 19.20it/s][A
Epoch 3/10:  35%|███▍      | 765/2208 [00:41<01:12, 19.85it/s][A
Epoch 3/10:  35%|███▍      | 768/2208 [00:41<01:10, 20.35it/s][A
Epoch 3/10:  35%|███▍      | 771/2208 [00:42<01:09, 20.56it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  35%|███▌      | 777/2208 [00:42<01:28, 16.26it/s][A
Epoch 3/10:  35%|███▌      | 780/2208 [00:42<01:21, 17.53it/s][A

Batch 775: Training loss = 0.3667, Training accuracy = 0.8860, F1 = 0.8856



Epoch 3/10:  35%|███▌      | 783/2208 [00:42<01:16, 18.59it/s][A
Epoch 3/10:  36%|███▌      | 786/2208 [00:42<01:14, 19.17it/s][A
Epoch 3/10:  36%|███▌      | 789/2208 [00:42<01:12, 19.56it/s][A
Epoch 3/10:  36%|███▌      | 792/2208 [00:43<01:10, 19.99it/s][A
Epoch 3/10:  36%|███▌      | 795/2208 [00:43<01:09, 20.37it/s][A
Epoch 3/10:  36%|███▌      | 798/2208 [00:43<01:11, 19.78it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  36%|███▋      | 804/2208 [00:44<01:38, 14.25it/s][A

Batch 800: Training loss = 0.1909, Training accuracy = 0.8859, F1 = 0.8856



Epoch 3/10:  37%|███▋      | 807/2208 [00:44<01:28, 15.83it/s][A
Epoch 3/10:  37%|███▋      | 810/2208 [00:44<01:21, 17.09it/s][A
Epoch 3/10:  37%|███▋      | 813/2208 [00:44<01:16, 18.13it/s][A
Epoch 3/10:  37%|███▋      | 816/2208 [00:44<01:13, 19.02it/s][A
Epoch 3/10:  37%|███▋      | 819/2208 [00:44<01:11, 19.46it/s][A
Epoch 3/10:  37%|███▋      | 822/2208 [00:44<01:09, 19.90it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  38%|███▊      | 828/2208 [00:45<01:37, 14.11it/s][A

Batch 825: Training loss = 0.3445, Training accuracy = 0.8859, F1 = 0.8855



Epoch 3/10:  38%|███▊      | 831/2208 [00:45<01:27, 15.74it/s][A
Epoch 3/10:  38%|███▊      | 834/2208 [00:45<01:20, 17.09it/s][A
Epoch 3/10:  38%|███▊      | 837/2208 [00:45<01:15, 18.12it/s][A
Epoch 3/10:  38%|███▊      | 840/2208 [00:45<01:12, 18.90it/s][A
Epoch 3/10:  38%|███▊      | 843/2208 [00:46<01:09, 19.50it/s][A
Epoch 3/10:  38%|███▊      | 846/2208 [00:46<01:09, 19.72it/s][A
Epoch 3/10:  38%|███▊      | 849/2208 [00:46<01:12, 18.63it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  39%|███▊      | 854/2208 [00:46<01:27, 15.40it/s][A

Batch 850: Training loss = 0.3770, Training accuracy = 0.8860, F1 = 0.8856



Epoch 3/10:  39%|███▉      | 857/2208 [00:46<01:19, 16.92it/s][A
Epoch 3/10:  39%|███▉      | 860/2208 [00:47<01:15, 17.96it/s][A
Epoch 3/10:  39%|███▉      | 863/2208 [00:47<01:12, 18.67it/s][A
Epoch 3/10:  39%|███▉      | 865/2208 [00:47<01:11, 18.90it/s][A
Epoch 3/10:  39%|███▉      | 868/2208 [00:47<01:08, 19.46it/s][A
Epoch 3/10:  39%|███▉      | 871/2208 [00:47<01:07, 19.82it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  40%|███▉      | 877/2208 [00:48<01:33, 14.31it/s][A
Epoch 3/10:  40%|███▉      | 880/2208 [00:48<01:23, 15.97it/s][A

Batch 875: Training loss = 0.3758, Training accuracy = 0.8860, F1 = 0.8857



Epoch 3/10:  40%|███▉      | 883/2208 [00:48<01:16, 17.36it/s][A
Epoch 3/10:  40%|████      | 886/2208 [00:48<01:11, 18.40it/s][A
Epoch 3/10:  40%|████      | 889/2208 [00:48<01:08, 19.21it/s][A
Epoch 3/10:  40%|████      | 892/2208 [00:48<01:06, 19.80it/s][A
Epoch 3/10:  41%|████      | 895/2208 [00:49<01:04, 20.33it/s][A
Epoch 3/10:  41%|████      | 898/2208 [00:49<01:03, 20.56it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  41%|████      | 904/2208 [00:49<01:17, 16.77it/s][A

Batch 900: Training loss = 0.3069, Training accuracy = 0.8864, F1 = 0.8860



Epoch 3/10:  41%|████      | 907/2208 [00:49<01:12, 17.88it/s][A
Epoch 3/10:  41%|████      | 910/2208 [00:49<01:09, 18.76it/s][A
Epoch 3/10:  41%|████▏     | 913/2208 [00:50<01:06, 19.48it/s][A
Epoch 3/10:  41%|████▏     | 916/2208 [00:50<01:04, 20.01it/s][A
Epoch 3/10:  42%|████▏     | 919/2208 [00:50<01:03, 20.43it/s][A
Epoch 3/10:  42%|████▏     | 922/2208 [00:50<01:02, 20.62it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  42%|████▏     | 928/2208 [00:50<01:24, 15.15it/s][A

Batch 925: Training loss = 0.3232, Training accuracy = 0.8864, F1 = 0.8860



Epoch 3/10:  42%|████▏     | 931/2208 [00:51<01:16, 16.65it/s][A
Epoch 3/10:  42%|████▏     | 934/2208 [00:51<01:11, 17.74it/s][A
Epoch 3/10:  42%|████▏     | 937/2208 [00:51<01:08, 18.66it/s][A
Epoch 3/10:  43%|████▎     | 940/2208 [00:51<01:05, 19.37it/s][A
Epoch 3/10:  43%|████▎     | 943/2208 [00:51<01:03, 19.90it/s][A
Epoch 3/10:  43%|████▎     | 946/2208 [00:51<01:02, 20.34it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  43%|████▎     | 952/2208 [00:52<01:23, 15.04it/s][A
Epoch 3/10:  43%|████▎     | 955/2208 [00:52<01:15, 16.57it/s][A

Batch 950: Training loss = 0.2057, Training accuracy = 0.8868, F1 = 0.8865



Epoch 3/10:  43%|████▎     | 958/2208 [00:52<01:10, 17.82it/s][A
Epoch 3/10:  44%|████▎     | 961/2208 [00:52<01:06, 18.76it/s][A
Epoch 3/10:  44%|████▎     | 964/2208 [00:52<01:03, 19.45it/s][A
Epoch 3/10:  44%|████▍     | 967/2208 [00:52<01:02, 19.97it/s][A
Epoch 3/10:  44%|████▍     | 970/2208 [00:53<01:00, 20.31it/s][A
Epoch 3/10:  44%|████▍     | 973/2208 [00:53<00:59, 20.60it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  44%|████▍     | 979/2208 [00:53<01:12, 16.85it/s][A

Batch 975: Training loss = 0.3980, Training accuracy = 0.8869, F1 = 0.8865



Epoch 3/10:  44%|████▍     | 982/2208 [00:53<01:08, 17.99it/s][A
Epoch 3/10:  45%|████▍     | 985/2208 [00:53<01:05, 18.70it/s][A
Epoch 3/10:  45%|████▍     | 988/2208 [00:54<01:03, 19.35it/s][A
Epoch 3/10:  45%|████▍     | 991/2208 [00:54<01:01, 19.80it/s][A
Epoch 3/10:  45%|████▌     | 994/2208 [00:54<01:00, 20.20it/s][A
Epoch 3/10:  45%|████▌     | 997/2208 [00:54<01:00, 20.00it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  45%|████▌     | 1003/2208 [00:54<01:21, 14.80it/s][A

Batch 1000: Training loss = 0.2995, Training accuracy = 0.8872, F1 = 0.8869



Epoch 3/10:  46%|████▌     | 1006/2208 [00:55<01:13, 16.34it/s][A
Epoch 3/10:  46%|████▌     | 1009/2208 [00:55<01:08, 17.62it/s][A
Epoch 3/10:  46%|████▌     | 1012/2208 [00:55<01:04, 18.65it/s][A
Epoch 3/10:  46%|████▌     | 1015/2208 [00:55<01:01, 19.43it/s][A
Epoch 3/10:  46%|████▌     | 1018/2208 [00:55<00:59, 19.92it/s][A
Epoch 3/10:  46%|████▌     | 1021/2208 [00:55<00:58, 20.23it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  47%|████▋     | 1027/2208 [00:56<01:20, 14.58it/s][A
Epoch 3/10:  47%|████▋     | 1030/2208 [00:56<01:13, 16.13it/s][A

Batch 1025: Training loss = 0.3060, Training accuracy = 0.8875, F1 = 0.8872



Epoch 3/10:  47%|████▋     | 1033/2208 [00:56<01:07, 17.51it/s][A
Epoch 3/10:  47%|████▋     | 1036/2208 [00:56<01:03, 18.36it/s][A
Epoch 3/10:  47%|████▋     | 1039/2208 [00:56<01:01, 19.05it/s][A
Epoch 3/10:  47%|████▋     | 1042/2208 [00:57<00:59, 19.57it/s][A
Epoch 3/10:  47%|████▋     | 1045/2208 [00:57<00:57, 20.09it/s][A
Epoch 3/10:  47%|████▋     | 1048/2208 [00:57<00:56, 20.47it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  48%|████▊     | 1054/2208 [00:57<01:12, 15.97it/s][A

Batch 1050: Training loss = 0.2491, Training accuracy = 0.8879, F1 = 0.8876



Epoch 3/10:  48%|████▊     | 1057/2208 [00:57<01:06, 17.25it/s][A
Epoch 3/10:  48%|████▊     | 1060/2208 [00:58<01:02, 18.30it/s][A
Epoch 3/10:  48%|████▊     | 1062/2208 [00:58<01:02, 18.30it/s][A
Epoch 3/10:  48%|████▊     | 1065/2208 [00:58<00:59, 19.22it/s][A
Epoch 3/10:  48%|████▊     | 1068/2208 [00:58<01:01, 18.65it/s][A
Epoch 3/10:  49%|████▊     | 1071/2208 [00:58<01:02, 18.21it/s][A
Epoch 3/10:  49%|████▊     | 1074/2208 [00:58<00:59, 19.05it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  49%|████▉     | 1079/2208 [00:59<01:14, 15.08it/s][A

Batch 1075: Training loss = 0.2604, Training accuracy = 0.8883, F1 = 0.8879



Epoch 3/10:  49%|████▉     | 1082/2208 [00:59<01:08, 16.56it/s][A
Epoch 3/10:  49%|████▉     | 1085/2208 [00:59<01:03, 17.69it/s][A
Epoch 3/10:  49%|████▉     | 1088/2208 [00:59<01:00, 18.56it/s][A
Epoch 3/10:  49%|████▉     | 1091/2208 [00:59<00:58, 19.24it/s][A
Epoch 3/10:  50%|████▉     | 1094/2208 [00:59<00:56, 19.57it/s][A
Epoch 3/10:  50%|████▉     | 1097/2208 [01:00<00:55, 19.98it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  50%|████▉     | 1103/2208 [01:00<01:19, 13.84it/s][A

Batch 1100: Training loss = 0.2723, Training accuracy = 0.8886, F1 = 0.8882



Epoch 3/10:  50%|█████     | 1106/2208 [01:00<01:10, 15.53it/s][A
Epoch 3/10:  50%|█████     | 1109/2208 [01:00<01:05, 16.90it/s][A
Epoch 3/10:  50%|█████     | 1112/2208 [01:01<01:01, 17.97it/s][A
Epoch 3/10:  50%|█████     | 1115/2208 [01:01<00:57, 18.85it/s][A
Epoch 3/10:  51%|█████     | 1118/2208 [01:01<00:55, 19.49it/s][A
Epoch 3/10:  51%|█████     | 1121/2208 [01:01<00:54, 19.89it/s][A
Epoch 3/10:  51%|█████     | 1124/2208 [01:01<01:04, 16.90it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  51%|█████     | 1129/2208 [01:02<01:16, 14.13it/s][A

Batch 1125: Training loss = 0.2285, Training accuracy = 0.8887, F1 = 0.8883



Epoch 3/10:  51%|█████▏    | 1132/2208 [01:02<01:07, 15.86it/s][A
Epoch 3/10:  51%|█████▏    | 1135/2208 [01:02<01:02, 17.15it/s][A
Epoch 3/10:  52%|█████▏    | 1138/2208 [01:02<00:58, 18.27it/s][A
Epoch 3/10:  52%|█████▏    | 1141/2208 [01:02<00:55, 19.17it/s][A
Epoch 3/10:  52%|█████▏    | 1144/2208 [01:02<00:53, 19.76it/s][A
Epoch 3/10:  52%|█████▏    | 1147/2208 [01:03<00:52, 20.13it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  52%|█████▏    | 1153/2208 [01:03<01:14, 14.19it/s][A

Batch 1150: Training loss = 0.2431, Training accuracy = 0.8888, F1 = 0.8885



Epoch 3/10:  52%|█████▏    | 1156/2208 [01:03<01:06, 15.81it/s][A
Epoch 3/10:  52%|█████▏    | 1159/2208 [01:03<01:01, 17.10it/s][A
Epoch 3/10:  53%|█████▎    | 1162/2208 [01:03<00:57, 18.13it/s][A
Epoch 3/10:  53%|█████▎    | 1165/2208 [01:04<00:54, 19.01it/s][A
Epoch 3/10:  53%|█████▎    | 1168/2208 [01:04<00:53, 19.57it/s][A
Epoch 3/10:  53%|█████▎    | 1171/2208 [01:04<00:51, 19.94it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  53%|█████▎    | 1177/2208 [01:04<01:13, 14.07it/s][A
Epoch 3/10:  53%|█████▎    | 1180/2208 [01:05<01:05, 15.79it/s][A

Batch 1175: Training loss = 0.2773, Training accuracy = 0.8890, F1 = 0.8887



Epoch 3/10:  54%|█████▎    | 1183/2208 [01:05<00:59, 17.19it/s][A
Epoch 3/10:  54%|█████▎    | 1186/2208 [01:05<00:55, 18.28it/s][A
Epoch 3/10:  54%|█████▍    | 1189/2208 [01:05<00:53, 19.07it/s][A
Epoch 3/10:  54%|█████▍    | 1192/2208 [01:05<00:53, 18.97it/s][A
Epoch 3/10:  54%|█████▍    | 1195/2208 [01:05<00:51, 19.62it/s][A
Epoch 3/10:  54%|█████▍    | 1198/2208 [01:05<00:50, 20.20it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  55%|█████▍    | 1204/2208 [01:06<01:04, 15.47it/s][A

Batch 1200: Training loss = 0.3002, Training accuracy = 0.8892, F1 = 0.8889



Epoch 3/10:  55%|█████▍    | 1207/2208 [01:06<00:59, 16.89it/s][A
Epoch 3/10:  55%|█████▍    | 1210/2208 [01:06<00:55, 18.01it/s][A
Epoch 3/10:  55%|█████▍    | 1213/2208 [01:06<00:52, 18.92it/s][A
Epoch 3/10:  55%|█████▌    | 1216/2208 [01:06<00:50, 19.62it/s][A
Epoch 3/10:  55%|█████▌    | 1219/2208 [01:07<00:50, 19.64it/s][A
Epoch 3/10:  55%|█████▌    | 1222/2208 [01:07<00:53, 18.40it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  56%|█████▌    | 1227/2208 [01:07<01:15, 12.95it/s][A
Epoch 3/10:  56%|█████▌    | 1230/2208 [01:07<01:05, 14.92it/s][A

Batch 1225: Training loss = 0.2329, Training accuracy = 0.8893, F1 = 0.8890



Epoch 3/10:  56%|█████▌    | 1233/2208 [01:08<00:59, 16.43it/s][A
Epoch 3/10:  56%|█████▌    | 1236/2208 [01:08<00:55, 17.57it/s][A
Epoch 3/10:  56%|█████▌    | 1238/2208 [01:08<00:53, 18.06it/s][A
Epoch 3/10:  56%|█████▌    | 1240/2208 [01:08<00:52, 18.47it/s][A
Epoch 3/10:  56%|█████▋    | 1243/2208 [01:08<00:50, 19.21it/s][A
Epoch 3/10:  56%|█████▋    | 1246/2208 [01:08<00:48, 19.76it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  57%|█████▋    | 1252/2208 [01:09<01:10, 13.64it/s][A
Epoch 3/10:  57%|█████▋    | 1255/2208 [01:09<01:01, 15.43it/s][A

Batch 1250: Training loss = 0.4611, Training accuracy = 0.8894, F1 = 0.8891



Epoch 3/10:  57%|█████▋    | 1258/2208 [01:09<00:56, 16.87it/s][A
Epoch 3/10:  57%|█████▋    | 1261/2208 [01:09<00:52, 17.95it/s][A
Epoch 3/10:  57%|█████▋    | 1264/2208 [01:09<00:50, 18.88it/s][A
Epoch 3/10:  57%|█████▋    | 1267/2208 [01:09<00:48, 19.50it/s][A
Epoch 3/10:  58%|█████▊    | 1270/2208 [01:10<00:46, 19.97it/s][A
Epoch 3/10:  58%|█████▊    | 1273/2208 [01:10<00:46, 20.26it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  58%|█████▊    | 1279/2208 [01:10<00:59, 15.66it/s][A

Batch 1275: Training loss = 0.4152, Training accuracy = 0.8896, F1 = 0.8892



Epoch 3/10:  58%|█████▊    | 1282/2208 [01:10<00:54, 17.09it/s][A
Epoch 3/10:  58%|█████▊    | 1285/2208 [01:10<00:50, 18.18it/s][A
Epoch 3/10:  58%|█████▊    | 1288/2208 [01:11<00:48, 19.02it/s][A
Epoch 3/10:  58%|█████▊    | 1291/2208 [01:11<00:46, 19.57it/s][A
Epoch 3/10:  59%|█████▊    | 1294/2208 [01:11<00:45, 20.00it/s][A
Epoch 3/10:  59%|█████▊    | 1297/2208 [01:11<00:44, 20.45it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  59%|█████▉    | 1303/2208 [01:12<01:07, 13.44it/s][A

Batch 1300: Training loss = 0.5134, Training accuracy = 0.8898, F1 = 0.8895



Epoch 3/10:  59%|█████▉    | 1306/2208 [01:12<00:59, 15.10it/s][A
Epoch 3/10:  59%|█████▉    | 1309/2208 [01:12<00:54, 16.50it/s][A
Epoch 3/10:  59%|█████▉    | 1312/2208 [01:12<00:50, 17.60it/s][A
Epoch 3/10:  60%|█████▉    | 1315/2208 [01:12<00:48, 18.51it/s][A
Epoch 3/10:  60%|█████▉    | 1318/2208 [01:12<00:48, 18.20it/s][A
Epoch 3/10:  60%|█████▉    | 1321/2208 [01:12<00:46, 19.06it/s][A
Epoch 3/10:  60%|█████▉    | 1323/2208 [01:13<00:52, 17.02it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  60%|██████    | 1329/2208 [01:13<01:04, 13.58it/s][A

Batch 1325: Training loss = 0.2735, Training accuracy = 0.8901, F1 = 0.8897



Epoch 3/10:  60%|██████    | 1332/2208 [01:13<00:57, 15.30it/s][A
Epoch 3/10:  60%|██████    | 1335/2208 [01:13<00:51, 16.81it/s][A
Epoch 3/10:  61%|██████    | 1338/2208 [01:14<00:48, 18.06it/s][A
Epoch 3/10:  61%|██████    | 1341/2208 [01:14<00:47, 18.35it/s][A
Epoch 3/10:  61%|██████    | 1343/2208 [01:14<00:46, 18.63it/s][A
Epoch 3/10:  61%|██████    | 1346/2208 [01:14<00:44, 19.37it/s][A
Epoch 3/10:  61%|██████    | 1349/2208 [01:14<00:45, 19.04it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  61%|██████▏   | 1354/2208 [01:15<01:01, 13.80it/s][A

Batch 1350: Training loss = 0.2514, Training accuracy = 0.8903, F1 = 0.8899



Epoch 3/10:  61%|██████▏   | 1357/2208 [01:15<00:54, 15.56it/s][A
Epoch 3/10:  62%|██████▏   | 1360/2208 [01:15<00:49, 17.01it/s][A
Epoch 3/10:  62%|██████▏   | 1363/2208 [01:15<00:46, 18.19it/s][A
Epoch 3/10:  62%|██████▏   | 1365/2208 [01:15<00:48, 17.53it/s][A
Epoch 3/10:  62%|██████▏   | 1368/2208 [01:15<00:51, 16.25it/s][A
Epoch 3/10:  62%|██████▏   | 1371/2208 [01:16<00:47, 17.57it/s][A
Epoch 3/10:  62%|██████▏   | 1374/2208 [01:16<00:45, 18.45it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  62%|██████▏   | 1379/2208 [01:16<01:06, 12.52it/s][A

Batch 1375: Training loss = 0.3185, Training accuracy = 0.8905, F1 = 0.8902



Epoch 3/10:  63%|██████▎   | 1382/2208 [01:17<00:57, 14.46it/s][A
Epoch 3/10:  63%|██████▎   | 1385/2208 [01:17<00:51, 16.10it/s][A
Epoch 3/10:  63%|██████▎   | 1388/2208 [01:17<00:47, 17.42it/s][A
Epoch 3/10:  63%|██████▎   | 1391/2208 [01:17<00:44, 18.39it/s][A
Epoch 3/10:  63%|██████▎   | 1394/2208 [01:17<00:42, 19.12it/s][A
Epoch 3/10:  63%|██████▎   | 1397/2208 [01:17<00:41, 19.78it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  64%|██████▎   | 1403/2208 [01:18<01:01, 13.05it/s][A

Batch 1400: Training loss = 0.2362, Training accuracy = 0.8906, F1 = 0.8903



Epoch 3/10:  64%|██████▎   | 1406/2208 [01:18<00:53, 14.86it/s][A
Epoch 3/10:  64%|██████▍   | 1409/2208 [01:18<00:49, 16.30it/s][A
Epoch 3/10:  64%|██████▍   | 1412/2208 [01:18<00:45, 17.60it/s][A
Epoch 3/10:  64%|██████▍   | 1415/2208 [01:18<00:42, 18.47it/s][A
Epoch 3/10:  64%|██████▍   | 1418/2208 [01:19<00:41, 19.17it/s][A
Epoch 3/10:  64%|██████▍   | 1421/2208 [01:19<00:40, 19.65it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  65%|██████▍   | 1427/2208 [01:19<01:00, 12.97it/s][A
Epoch 3/10:  65%|██████▍   | 1430/2208 [01:19<00:52, 14.76it/s][A

Batch 1425: Training loss = 0.3364, Training accuracy = 0.8907, F1 = 0.8904



Epoch 3/10:  65%|██████▍   | 1433/2208 [01:19<00:47, 16.28it/s][A
Epoch 3/10:  65%|██████▌   | 1436/2208 [01:20<00:43, 17.57it/s][A
Epoch 3/10:  65%|██████▌   | 1439/2208 [01:20<00:41, 18.63it/s][A
Epoch 3/10:  65%|██████▌   | 1442/2208 [01:20<00:39, 19.27it/s][A
Epoch 3/10:  65%|██████▌   | 1445/2208 [01:20<00:38, 19.76it/s][A
Epoch 3/10:  66%|██████▌   | 1448/2208 [01:20<00:37, 20.06it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  66%|██████▌   | 1454/2208 [01:21<00:50, 14.81it/s][A

Batch 1450: Training loss = 0.3517, Training accuracy = 0.8908, F1 = 0.8905



Epoch 3/10:  66%|██████▌   | 1457/2208 [01:21<00:45, 16.36it/s][A
Epoch 3/10:  66%|██████▌   | 1460/2208 [01:21<00:42, 17.64it/s][A
Epoch 3/10:  66%|██████▋   | 1463/2208 [01:21<00:40, 18.59it/s][A
Epoch 3/10:  66%|██████▋   | 1466/2208 [01:21<00:38, 19.29it/s][A
Epoch 3/10:  67%|██████▋   | 1469/2208 [01:21<00:37, 19.79it/s][A
Epoch 3/10:  67%|██████▋   | 1472/2208 [01:22<00:36, 20.14it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  67%|██████▋   | 1478/2208 [01:22<00:56, 12.86it/s][A

Batch 1475: Training loss = 0.2994, Training accuracy = 0.8911, F1 = 0.8908



Epoch 3/10:  67%|██████▋   | 1481/2208 [01:22<00:49, 14.65it/s][A
Epoch 3/10:  67%|██████▋   | 1484/2208 [01:22<00:44, 16.17it/s][A
Epoch 3/10:  67%|██████▋   | 1487/2208 [01:23<00:41, 17.42it/s][A
Epoch 3/10:  67%|██████▋   | 1490/2208 [01:23<00:39, 18.40it/s][A
Epoch 3/10:  68%|██████▊   | 1493/2208 [01:23<00:37, 19.02it/s][A
Epoch 3/10:  68%|██████▊   | 1496/2208 [01:23<00:36, 19.61it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  68%|██████▊   | 1502/2208 [01:24<00:54, 12.85it/s][A
Epoch 3/10:  68%|██████▊   | 1505/2208 [01:24<00:47, 14.65it/s][A

Batch 1500: Training loss = 0.3330, Training accuracy = 0.8913, F1 = 0.8910



Epoch 3/10:  68%|██████▊   | 1508/2208 [01:24<00:43, 16.13it/s][A
Epoch 3/10:  68%|██████▊   | 1511/2208 [01:24<00:40, 17.34it/s][A
Epoch 3/10:  69%|██████▊   | 1514/2208 [01:24<00:37, 18.40it/s][A
Epoch 3/10:  69%|██████▊   | 1517/2208 [01:24<00:36, 19.16it/s][A
Epoch 3/10:  69%|██████▉   | 1520/2208 [01:24<00:35, 19.60it/s][A
Epoch 3/10:  69%|██████▉   | 1523/2208 [01:25<00:34, 20.10it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  69%|██████▉   | 1529/2208 [01:25<00:45, 14.84it/s][A

Batch 1525: Training loss = 0.3750, Training accuracy = 0.8916, F1 = 0.8913



Epoch 3/10:  69%|██████▉   | 1532/2208 [01:25<00:41, 16.39it/s][A
Epoch 3/10:  70%|██████▉   | 1535/2208 [01:25<00:38, 17.61it/s][A
Epoch 3/10:  70%|██████▉   | 1538/2208 [01:26<00:36, 18.57it/s][A
Epoch 3/10:  70%|██████▉   | 1541/2208 [01:26<00:34, 19.30it/s][A
Epoch 3/10:  70%|██████▉   | 1544/2208 [01:26<00:33, 19.75it/s][A
Epoch 3/10:  70%|███████   | 1547/2208 [01:26<00:32, 20.04it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  70%|███████   | 1553/2208 [01:27<00:52, 12.50it/s][A

Batch 1550: Training loss = 0.2420, Training accuracy = 0.8917, F1 = 0.8913



Epoch 3/10:  70%|███████   | 1556/2208 [01:27<00:45, 14.29it/s][A
Epoch 3/10:  71%|███████   | 1559/2208 [01:27<00:40, 15.83it/s][A
Epoch 3/10:  71%|███████   | 1562/2208 [01:27<00:37, 17.03it/s][A
Epoch 3/10:  71%|███████   | 1564/2208 [01:27<00:36, 17.61it/s][A
Epoch 3/10:  71%|███████   | 1567/2208 [01:27<00:34, 18.55it/s][A
Epoch 3/10:  71%|███████   | 1570/2208 [01:27<00:33, 19.20it/s][A
Epoch 3/10:  71%|███████   | 1573/2208 [01:28<00:34, 18.56it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  72%|███████▏  | 1579/2208 [01:28<00:50, 12.47it/s][A

Batch 1575: Training loss = 0.1985, Training accuracy = 0.8919, F1 = 0.8916



Epoch 3/10:  72%|███████▏  | 1582/2208 [01:28<00:43, 14.32it/s][A
Epoch 3/10:  72%|███████▏  | 1585/2208 [01:29<00:39, 15.95it/s][A
Epoch 3/10:  72%|███████▏  | 1588/2208 [01:29<00:35, 17.30it/s][A
Epoch 3/10:  72%|███████▏  | 1591/2208 [01:29<00:33, 18.19it/s][A
Epoch 3/10:  72%|███████▏  | 1594/2208 [01:29<00:34, 17.61it/s][A
Epoch 3/10:  72%|███████▏  | 1596/2208 [01:29<00:36, 16.73it/s][A
Epoch 3/10:  72%|███████▏  | 1599/2208 [01:29<00:33, 17.99it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  73%|███████▎  | 1604/2208 [01:30<00:48, 12.48it/s][A

Batch 1600: Training loss = 0.3700, Training accuracy = 0.8920, F1 = 0.8917



Epoch 3/10:  73%|███████▎  | 1607/2208 [01:30<00:41, 14.41it/s][A
Epoch 3/10:  73%|███████▎  | 1610/2208 [01:30<00:37, 16.09it/s][A
Epoch 3/10:  73%|███████▎  | 1613/2208 [01:30<00:34, 17.37it/s][A
Epoch 3/10:  73%|███████▎  | 1616/2208 [01:30<00:32, 18.41it/s][A
Epoch 3/10:  73%|███████▎  | 1619/2208 [01:31<00:30, 19.25it/s][A
Epoch 3/10:  73%|███████▎  | 1622/2208 [01:31<00:29, 19.76it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  74%|███████▎  | 1628/2208 [01:31<00:46, 12.45it/s][A

Batch 1625: Training loss = 0.2281, Training accuracy = 0.8920, F1 = 0.8917



Epoch 3/10:  74%|███████▍  | 1631/2208 [01:31<00:40, 14.28it/s][A
Epoch 3/10:  74%|███████▍  | 1634/2208 [01:32<00:36, 15.88it/s][A
Epoch 3/10:  74%|███████▍  | 1637/2208 [01:32<00:33, 17.21it/s][A
Epoch 3/10:  74%|███████▍  | 1640/2208 [01:32<00:31, 18.22it/s][A
Epoch 3/10:  74%|███████▍  | 1643/2208 [01:32<00:30, 18.76it/s][A
Epoch 3/10:  75%|███████▍  | 1646/2208 [01:32<00:28, 19.45it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  75%|███████▍  | 1652/2208 [01:33<00:46, 11.84it/s][A
Epoch 3/10:  75%|███████▍  | 1655/2208 [01:33<00:40, 13.72it/s][A

Batch 1650: Training loss = 0.2131, Training accuracy = 0.8923, F1 = 0.8920



Epoch 3/10:  75%|███████▌  | 1658/2208 [01:33<00:35, 15.40it/s][A
Epoch 3/10:  75%|███████▌  | 1661/2208 [01:33<00:32, 16.87it/s][A
Epoch 3/10:  75%|███████▌  | 1664/2208 [01:33<00:30, 17.92it/s][A
Epoch 3/10:  75%|███████▌  | 1667/2208 [01:34<00:28, 18.91it/s][A
Epoch 3/10:  76%|███████▌  | 1670/2208 [01:34<00:27, 19.64it/s][A
Epoch 3/10:  76%|███████▌  | 1673/2208 [01:34<00:26, 19.99it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  76%|███████▌  | 1679/2208 [01:34<00:37, 14.16it/s][A

Batch 1675: Training loss = 0.2246, Training accuracy = 0.8925, F1 = 0.8922



Epoch 3/10:  76%|███████▌  | 1682/2208 [01:35<00:33, 15.80it/s][A
Epoch 3/10:  76%|███████▋  | 1685/2208 [01:35<00:30, 17.14it/s][A
Epoch 3/10:  76%|███████▋  | 1688/2208 [01:35<00:28, 18.28it/s][A
Epoch 3/10:  77%|███████▋  | 1691/2208 [01:35<00:27, 18.98it/s][A
Epoch 3/10:  77%|███████▋  | 1694/2208 [01:35<00:26, 19.64it/s][A
Epoch 3/10:  77%|███████▋  | 1697/2208 [01:35<00:25, 20.01it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  77%|███████▋  | 1703/2208 [01:36<00:41, 12.23it/s][A

Batch 1700: Training loss = 0.3005, Training accuracy = 0.8927, F1 = 0.8923



Epoch 3/10:  77%|███████▋  | 1706/2208 [01:36<00:35, 14.06it/s][A
Epoch 3/10:  77%|███████▋  | 1709/2208 [01:36<00:31, 15.71it/s][A
Epoch 3/10:  78%|███████▊  | 1712/2208 [01:36<00:29, 17.03it/s][A
Epoch 3/10:  78%|███████▊  | 1715/2208 [01:36<00:27, 18.04it/s][A
Epoch 3/10:  78%|███████▊  | 1718/2208 [01:37<00:25, 18.87it/s][A
Epoch 3/10:  78%|███████▊  | 1721/2208 [01:37<00:24, 19.54it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  78%|███████▊  | 1727/2208 [01:37<00:39, 12.23it/s][A
Epoch 3/10:  78%|███████▊  | 1730/2208 [01:37<00:33, 14.08it/s][A

Batch 1725: Training loss = 0.2575, Training accuracy = 0.8929, F1 = 0.8925



Epoch 3/10:  78%|███████▊  | 1733/2208 [01:38<00:30, 15.70it/s][A
Epoch 3/10:  79%|███████▊  | 1736/2208 [01:38<00:27, 16.99it/s][A
Epoch 3/10:  79%|███████▉  | 1739/2208 [01:38<00:26, 18.02it/s][A
Epoch 3/10:  79%|███████▉  | 1742/2208 [01:38<00:24, 18.82it/s][A
Epoch 3/10:  79%|███████▉  | 1745/2208 [01:38<00:23, 19.42it/s][A
Epoch 3/10:  79%|███████▉  | 1748/2208 [01:38<00:23, 19.93it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  79%|███████▉  | 1754/2208 [01:39<00:32, 13.98it/s][A

Batch 1750: Training loss = 0.3180, Training accuracy = 0.8931, F1 = 0.8927



Epoch 3/10:  80%|███████▉  | 1757/2208 [01:39<00:28, 15.61it/s][A
Epoch 3/10:  80%|███████▉  | 1760/2208 [01:39<00:26, 16.92it/s][A
Epoch 3/10:  80%|███████▉  | 1763/2208 [01:39<00:24, 18.00it/s][A
Epoch 3/10:  80%|███████▉  | 1766/2208 [01:39<00:23, 18.97it/s][A
Epoch 3/10:  80%|████████  | 1769/2208 [01:40<00:22, 19.67it/s][A
Epoch 3/10:  80%|████████  | 1772/2208 [01:40<00:21, 20.21it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  81%|████████  | 1778/2208 [01:40<00:36, 11.85it/s][A

Batch 1775: Training loss = 0.4649, Training accuracy = 0.8933, F1 = 0.8929



Epoch 3/10:  81%|████████  | 1781/2208 [01:41<00:31, 13.68it/s][A
Epoch 3/10:  81%|████████  | 1784/2208 [01:41<00:27, 15.25it/s][A
Epoch 3/10:  81%|████████  | 1787/2208 [01:41<00:25, 16.65it/s][A
Epoch 3/10:  81%|████████  | 1790/2208 [01:41<00:23, 17.73it/s][A
Epoch 3/10:  81%|████████  | 1793/2208 [01:41<00:23, 17.99it/s][A
Epoch 3/10:  81%|████████▏ | 1796/2208 [01:41<00:21, 18.94it/s][A
Epoch 3/10:  81%|████████▏ | 1799/2208 [01:41<00:21, 18.81it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  82%|████████▏ | 1804/2208 [01:42<00:31, 12.64it/s][A

Batch 1800: Training loss = 0.2159, Training accuracy = 0.8934, F1 = 0.8931



Epoch 3/10:  82%|████████▏ | 1807/2208 [01:42<00:27, 14.50it/s][A
Epoch 3/10:  82%|████████▏ | 1810/2208 [01:42<00:24, 16.04it/s][A
Epoch 3/10:  82%|████████▏ | 1813/2208 [01:42<00:22, 17.35it/s][A
Epoch 3/10:  82%|████████▏ | 1815/2208 [01:43<00:22, 17.79it/s][A
Epoch 3/10:  82%|████████▏ | 1817/2208 [01:43<00:21, 18.28it/s][A
Epoch 3/10:  82%|████████▏ | 1820/2208 [01:43<00:20, 19.18it/s][A
Epoch 3/10:  83%|████████▎ | 1823/2208 [01:43<00:19, 19.87it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  83%|████████▎ | 1829/2208 [01:44<00:30, 12.39it/s][A

Batch 1825: Training loss = 0.2339, Training accuracy = 0.8936, F1 = 0.8932



Epoch 3/10:  83%|████████▎ | 1832/2208 [01:44<00:26, 14.22it/s][A
Epoch 3/10:  83%|████████▎ | 1835/2208 [01:44<00:23, 15.79it/s][A
Epoch 3/10:  83%|████████▎ | 1838/2208 [01:44<00:21, 17.12it/s][A
Epoch 3/10:  83%|████████▎ | 1841/2208 [01:44<00:20, 18.11it/s][A
Epoch 3/10:  84%|████████▎ | 1844/2208 [01:44<00:19, 18.78it/s][A
Epoch 3/10:  84%|████████▎ | 1847/2208 [01:45<00:20, 17.99it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  84%|████████▍ | 1852/2208 [01:45<00:32, 10.82it/s][A
Epoch 3/10:  84%|████████▍ | 1855/2208 [01:45<00:27, 12.95it/s][A

Batch 1850: Training loss = 0.2004, Training accuracy = 0.8937, F1 = 0.8934



Epoch 3/10:  84%|████████▍ | 1858/2208 [01:45<00:23, 14.81it/s][A
Epoch 3/10:  84%|████████▍ | 1861/2208 [01:46<00:21, 16.32it/s][A
Epoch 3/10:  84%|████████▍ | 1864/2208 [01:46<00:19, 17.68it/s][A
Epoch 3/10:  85%|████████▍ | 1867/2208 [01:46<00:18, 18.72it/s][A
Epoch 3/10:  85%|████████▍ | 1870/2208 [01:46<00:17, 19.28it/s][A
Epoch 3/10:  85%|████████▍ | 1873/2208 [01:46<00:16, 19.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  85%|████████▌ | 1879/2208 [01:47<00:24, 13.23it/s][A

Batch 1875: Training loss = 0.3449, Training accuracy = 0.8939, F1 = 0.8936



Epoch 3/10:  85%|████████▌ | 1882/2208 [01:47<00:21, 14.88it/s][A
Epoch 3/10:  85%|████████▌ | 1885/2208 [01:47<00:19, 16.37it/s][A
Epoch 3/10:  86%|████████▌ | 1888/2208 [01:47<00:18, 17.69it/s][A
Epoch 3/10:  86%|████████▌ | 1891/2208 [01:47<00:16, 18.67it/s][A
Epoch 3/10:  86%|████████▌ | 1894/2208 [01:48<00:16, 19.29it/s][A
Epoch 3/10:  86%|████████▌ | 1897/2208 [01:48<00:15, 19.81it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  86%|████████▌ | 1903/2208 [01:48<00:26, 11.64it/s][A

Batch 1900: Training loss = 0.2503, Training accuracy = 0.8939, F1 = 0.8936



Epoch 3/10:  86%|████████▋ | 1906/2208 [01:48<00:22, 13.51it/s][A
Epoch 3/10:  86%|████████▋ | 1909/2208 [01:49<00:19, 15.20it/s][A
Epoch 3/10:  87%|████████▋ | 1912/2208 [01:49<00:17, 16.64it/s][A
Epoch 3/10:  87%|████████▋ | 1915/2208 [01:49<00:16, 17.71it/s][A
Epoch 3/10:  87%|████████▋ | 1918/2208 [01:49<00:15, 18.59it/s][A
Epoch 3/10:  87%|████████▋ | 1921/2208 [01:49<00:14, 19.30it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  87%|████████▋ | 1927/2208 [01:50<00:24, 11.52it/s][A
Epoch 3/10:  87%|████████▋ | 1930/2208 [01:50<00:20, 13.43it/s][A

Batch 1925: Training loss = 0.3386, Training accuracy = 0.8942, F1 = 0.8938



Epoch 3/10:  88%|████████▊ | 1933/2208 [01:50<00:18, 15.13it/s][A
Epoch 3/10:  88%|████████▊ | 1936/2208 [01:50<00:16, 16.66it/s][A
Epoch 3/10:  88%|████████▊ | 1939/2208 [01:50<00:15, 17.79it/s][A
Epoch 3/10:  88%|████████▊ | 1942/2208 [01:51<00:14, 18.70it/s][A
Epoch 3/10:  88%|████████▊ | 1945/2208 [01:51<00:13, 19.37it/s][A
Epoch 3/10:  88%|████████▊ | 1948/2208 [01:51<00:13, 19.85it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  88%|████████▊ | 1954/2208 [01:51<00:18, 13.49it/s][A

Batch 1950: Training loss = 0.3070, Training accuracy = 0.8942, F1 = 0.8939



Epoch 3/10:  89%|████████▊ | 1957/2208 [01:52<00:16, 15.19it/s][A
Epoch 3/10:  89%|████████▉ | 1960/2208 [01:52<00:14, 16.56it/s][A
Epoch 3/10:  89%|████████▉ | 1963/2208 [01:52<00:13, 17.82it/s][A
Epoch 3/10:  89%|████████▉ | 1966/2208 [01:52<00:12, 18.78it/s][A
Epoch 3/10:  89%|████████▉ | 1969/2208 [01:52<00:12, 19.45it/s][A
Epoch 3/10:  89%|████████▉ | 1972/2208 [01:52<00:11, 19.85it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  90%|████████▉ | 1978/2208 [01:53<00:19, 11.61it/s][A

Batch 1975: Training loss = 0.4202, Training accuracy = 0.8943, F1 = 0.8940



Epoch 3/10:  90%|████████▉ | 1981/2208 [01:53<00:16, 13.49it/s][A
Epoch 3/10:  90%|████████▉ | 1984/2208 [01:53<00:14, 15.21it/s][A
Epoch 3/10:  90%|████████▉ | 1987/2208 [01:53<00:13, 16.67it/s][A
Epoch 3/10:  90%|█████████ | 1990/2208 [01:54<00:12, 17.79it/s][A
Epoch 3/10:  90%|█████████ | 1993/2208 [01:54<00:11, 18.67it/s][A
Epoch 3/10:  90%|█████████ | 1996/2208 [01:54<00:10, 19.33it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  91%|█████████ | 2002/2208 [01:55<00:18, 11.28it/s][A
Epoch 3/10:  91%|█████████ | 2005/2208 [01:55<00:15, 13.17it/s][A

Batch 2000: Training loss = 0.2821, Training accuracy = 0.8945, F1 = 0.8942



Epoch 3/10:  91%|█████████ | 2008/2208 [01:55<00:13, 14.92it/s][A
Epoch 3/10:  91%|█████████ | 2011/2208 [01:55<00:12, 16.40it/s][A
Epoch 3/10:  91%|█████████ | 2014/2208 [01:55<00:11, 17.50it/s][A
Epoch 3/10:  91%|█████████▏| 2017/2208 [01:55<00:11, 16.88it/s][A
Epoch 3/10:  91%|█████████▏| 2019/2208 [01:55<00:11, 16.87it/s][A
Epoch 3/10:  92%|█████████▏| 2022/2208 [01:56<00:10, 18.07it/s][A
Epoch 3/10:  92%|█████████▏| 2024/2208 [01:56<00:10, 16.87it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  92%|█████████▏| 2029/2208 [01:56<00:16, 10.82it/s][A

Batch 2025: Training loss = 0.2363, Training accuracy = 0.8947, F1 = 0.8944



Epoch 3/10:  92%|█████████▏| 2032/2208 [01:57<00:13, 12.94it/s][A
Epoch 3/10:  92%|█████████▏| 2035/2208 [01:57<00:11, 14.84it/s][A
Epoch 3/10:  92%|█████████▏| 2038/2208 [01:57<00:10, 16.43it/s][A
Epoch 3/10:  92%|█████████▏| 2041/2208 [01:57<00:09, 16.92it/s][A
Epoch 3/10:  93%|█████████▎| 2044/2208 [01:57<00:09, 17.94it/s][A
Epoch 3/10:  93%|█████████▎| 2047/2208 [01:57<00:08, 18.78it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  93%|█████████▎| 2052/2208 [01:58<00:16,  9.27it/s][A
Epoch 3/10:  93%|█████████▎| 2055/2208 [01:58<00:13, 11.39it/s][A

Batch 2050: Training loss = 0.3833, Training accuracy = 0.8947, F1 = 0.8944



Epoch 3/10:  93%|█████████▎| 2058/2208 [01:58<00:11, 13.32it/s][A
Epoch 3/10:  93%|█████████▎| 2061/2208 [01:58<00:09, 14.99it/s][A
Epoch 3/10:  93%|█████████▎| 2064/2208 [01:59<00:08, 16.36it/s][A
Epoch 3/10:  94%|█████████▎| 2067/2208 [01:59<00:08, 17.54it/s][A
Epoch 3/10:  94%|█████████▍| 2070/2208 [01:59<00:07, 18.60it/s][A
Epoch 3/10:  94%|█████████▍| 2073/2208 [01:59<00:07, 18.53it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  94%|█████████▍| 2079/2208 [02:00<00:10, 12.38it/s][A

Batch 2075: Training loss = 0.1276, Training accuracy = 0.8950, F1 = 0.8947



Epoch 3/10:  94%|█████████▍| 2082/2208 [02:00<00:08, 14.22it/s][A
Epoch 3/10:  94%|█████████▍| 2085/2208 [02:00<00:07, 15.80it/s][A
Epoch 3/10:  95%|█████████▍| 2088/2208 [02:00<00:06, 17.21it/s][A
Epoch 3/10:  95%|█████████▍| 2091/2208 [02:00<00:06, 18.20it/s][A
Epoch 3/10:  95%|█████████▍| 2094/2208 [02:00<00:06, 18.98it/s][A
Epoch 3/10:  95%|█████████▍| 2097/2208 [02:01<00:05, 19.63it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  95%|█████████▌| 2103/2208 [02:01<00:09, 11.02it/s][A

Batch 2100: Training loss = 0.2895, Training accuracy = 0.8952, F1 = 0.8949



Epoch 3/10:  95%|█████████▌| 2106/2208 [02:01<00:07, 12.91it/s][A
Epoch 3/10:  96%|█████████▌| 2109/2208 [02:02<00:06, 14.62it/s][A
Epoch 3/10:  96%|█████████▌| 2112/2208 [02:02<00:05, 16.15it/s][A
Epoch 3/10:  96%|█████████▌| 2115/2208 [02:02<00:05, 17.42it/s][A
Epoch 3/10:  96%|█████████▌| 2118/2208 [02:02<00:04, 18.48it/s][A
Epoch 3/10:  96%|█████████▌| 2121/2208 [02:02<00:04, 19.19it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  96%|█████████▋| 2127/2208 [02:03<00:07, 11.01it/s][A
Epoch 3/10:  96%|█████████▋| 2130/2208 [02:03<00:06, 12.95it/s][A

Batch 2125: Training loss = 0.4633, Training accuracy = 0.8952, F1 = 0.8949



Epoch 3/10:  97%|█████████▋| 2133/2208 [02:03<00:05, 14.73it/s][A
Epoch 3/10:  97%|█████████▋| 2136/2208 [02:03<00:04, 16.17it/s][A
Epoch 3/10:  97%|█████████▋| 2139/2208 [02:03<00:03, 17.43it/s][A
Epoch 3/10:  97%|█████████▋| 2142/2208 [02:04<00:03, 18.37it/s][A
Epoch 3/10:  97%|█████████▋| 2145/2208 [02:04<00:03, 19.13it/s][A
Epoch 3/10:  97%|█████████▋| 2148/2208 [02:04<00:03, 19.65it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  98%|█████████▊| 2154/2208 [02:05<00:04, 12.94it/s][A

Batch 2150: Training loss = 0.2784, Training accuracy = 0.8954, F1 = 0.8951



Epoch 3/10:  98%|█████████▊| 2157/2208 [02:05<00:03, 14.75it/s][A
Epoch 3/10:  98%|█████████▊| 2160/2208 [02:05<00:02, 16.26it/s][A
Epoch 3/10:  98%|█████████▊| 2163/2208 [02:05<00:02, 17.56it/s][A
Epoch 3/10:  98%|█████████▊| 2166/2208 [02:05<00:02, 18.47it/s][A
Epoch 3/10:  98%|█████████▊| 2169/2208 [02:05<00:02, 19.28it/s][A
Epoch 3/10:  98%|█████████▊| 2172/2208 [02:05<00:01, 19.76it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10:  99%|█████████▊| 2178/2208 [02:06<00:02, 10.18it/s][A

Batch 2175: Training loss = 0.3275, Training accuracy = 0.8954, F1 = 0.8952



Epoch 3/10:  99%|█████████▉| 2181/2208 [02:06<00:02, 12.14it/s][A
Epoch 3/10:  99%|█████████▉| 2184/2208 [02:06<00:01, 13.99it/s][A
Epoch 3/10:  99%|█████████▉| 2187/2208 [02:07<00:01, 15.58it/s][A
Epoch 3/10:  99%|█████████▉| 2190/2208 [02:07<00:01, 16.84it/s][A
Epoch 3/10:  99%|█████████▉| 2193/2208 [02:07<00:00, 17.96it/s][A
Epoch 3/10:  99%|█████████▉| 2196/2208 [02:07<00:00, 18.80it/s][A
  with torch.cuda.amp.autocast():

Epoch 3/10: 100%|█████████▉| 2202/2208 [02:08<00:00, 10.77it/s][A
Epoch 3/10: 100%|█████████▉| 2205/2208 [02:08<00:00, 12.74it/s][A

Batch 2200: Training loss = 0.4000, Training accuracy = 0.8956, F1 = 0.8953



Epoch 3/10: 100%|██████████| 2208/2208 [02:08<00:00, 14.60it/s][A
                                                               [A


Epoch 3 Training Metrics:
Loss: 0.3096
Accuracy: 0.8957
F1 Score: 0.8954
Precision: 0.8952
Recall: 0.8957

Starting validation...



Validation:   0%|          | 0/552 [00:00<?, ?it/s][A
Validation:   0%|          | 1/552 [00:01<14:51,  1.62s/it][A
Validation:   1%|          | 3/552 [00:01<04:16,  2.14it/s][A
Validation:   1%|          | 5/552 [00:01<02:19,  3.91it/s][A
Validation:   1%|▏         | 7/552 [00:01<01:33,  5.83it/s][A
Validation:   2%|▏         | 9/552 [00:02<01:09,  7.85it/s][A
Validation:   2%|▏         | 11/552 [00:02<00:55,  9.84it/s][A
Validation:   2%|▏         | 13/552 [00:02<00:46, 11.64it/s][A
Validation:   3%|▎         | 15/552 [00:02<00:40, 13.22it/s][A
Validation:   3%|▎         | 17/552 [00:02<00:36, 14.55it/s][A
Validation:   3%|▎         | 19/552 [00:02<00:33, 15.68it/s][A
Validation:   4%|▍         | 21/552 [00:02<00:32, 16.54it/s][A
Validation:   4%|▍         | 23/552 [00:02<00:30, 17.16it/s][A
Validation:   5%|▍         | 25/552 [00:02<00:29, 17.57it/s][A
Validation:   5%|▍         | 27/552 [00:03<00:29, 17.92it/s][A
Validation:   5%|▌         | 29/552 [00:03<00:28, 18.


Epoch 3 Validation Metrics:
Loss: 0.2178
Accuracy: 0.9263
F1 Score: 0.9254
Precision: 0.9303
Recall: 0.9263


Training epochs:  30%|███       | 3/10 [08:02<18:46, 160.99s/it]


Starting epoch 4/10



  with torch.cuda.amp.autocast():

  with torch.cuda.amp.autocast():

Epoch 4/10:   0%|          | 3/2208 [00:01<18:30,  1.99it/s]  [A

Batch 0: Training loss = 0.2405, Training accuracy = 0.9141, F1 = 0.9115



Epoch 4/10:   0%|          | 5/2208 [00:02<09:56,  3.69it/s][A
Epoch 4/10:   0%|          | 8/2208 [00:02<05:38,  6.49it/s][A
Epoch 4/10:   0%|          | 11/2208 [00:02<03:57,  9.24it/s][A
Epoch 4/10:   1%|          | 14/2208 [00:02<03:06, 11.76it/s][A
Epoch 4/10:   1%|          | 17/2208 [00:02<02:37, 13.90it/s][A
Epoch 4/10:   1%|          | 20/2208 [00:02<02:18, 15.77it/s][A
Epoch 4/10:   1%|          | 23/2208 [00:02<02:07, 17.13it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:   1%|▏         | 29/2208 [00:03<01:54, 18.95it/s][A

Batch 25: Training loss = 0.2367, Training accuracy = 0.9053, F1 = 0.9051



Epoch 4/10:   1%|▏         | 32/2208 [00:03<01:50, 19.66it/s][A
Epoch 4/10:   2%|▏         | 35/2208 [00:03<01:47, 20.14it/s][A
Epoch 4/10:   2%|▏         | 38/2208 [00:03<01:45, 20.50it/s][A
Epoch 4/10:   2%|▏         | 41/2208 [00:03<01:44, 20.73it/s][A
Epoch 4/10:   2%|▏         | 44/2208 [00:03<01:44, 20.74it/s][A
Epoch 4/10:   2%|▏         | 47/2208 [00:04<01:51, 19.38it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:   2%|▏         | 53/2208 [00:04<01:49, 19.68it/s][A

Batch 50: Training loss = 0.1546, Training accuracy = 0.9079, F1 = 0.9078



Epoch 4/10:   3%|▎         | 56/2208 [00:04<01:47, 20.04it/s][A
Epoch 4/10:   3%|▎         | 59/2208 [00:04<01:52, 19.06it/s][A
Epoch 4/10:   3%|▎         | 62/2208 [00:04<01:49, 19.60it/s][A
Epoch 4/10:   3%|▎         | 65/2208 [00:04<01:47, 19.92it/s][A
Epoch 4/10:   3%|▎         | 68/2208 [00:05<01:45, 20.33it/s][A
Epoch 4/10:   3%|▎         | 71/2208 [00:05<01:43, 20.64it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:   3%|▎         | 77/2208 [00:05<01:48, 19.65it/s][A
Epoch 4/10:   4%|▎         | 80/2208 [00:05<01:46, 20.07it/s][A

Batch 75: Training loss = 0.3329, Training accuracy = 0.9064, F1 = 0.9061



Epoch 4/10:   4%|▍         | 83/2208 [00:05<01:43, 20.48it/s][A
Epoch 4/10:   4%|▍         | 86/2208 [00:05<01:45, 20.12it/s][A
Epoch 4/10:   4%|▍         | 89/2208 [00:06<01:47, 19.71it/s][A
Epoch 4/10:   4%|▍         | 92/2208 [00:06<01:45, 20.13it/s][A
Epoch 4/10:   4%|▍         | 95/2208 [00:06<01:49, 19.30it/s][A
Epoch 4/10:   4%|▍         | 98/2208 [00:06<01:46, 19.74it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:   5%|▍         | 104/2208 [00:06<01:49, 19.25it/s][A

Batch 100: Training loss = 0.1784, Training accuracy = 0.9066, F1 = 0.9064



Epoch 4/10:   5%|▍         | 107/2208 [00:07<01:45, 19.84it/s][A
Epoch 4/10:   5%|▍         | 110/2208 [00:07<01:43, 20.23it/s][A
Epoch 4/10:   5%|▌         | 113/2208 [00:07<01:45, 19.88it/s][A
Epoch 4/10:   5%|▌         | 116/2208 [00:07<01:42, 20.31it/s][A
Epoch 4/10:   5%|▌         | 119/2208 [00:07<01:47, 19.49it/s][A
Epoch 4/10:   6%|▌         | 122/2208 [00:07<01:44, 19.91it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:   6%|▌         | 128/2208 [00:08<01:46, 19.46it/s][A

Batch 125: Training loss = 0.2788, Training accuracy = 0.9063, F1 = 0.9060



Epoch 4/10:   6%|▌         | 131/2208 [00:08<01:44, 19.87it/s][A
Epoch 4/10:   6%|▌         | 134/2208 [00:08<01:42, 20.25it/s][A
Epoch 4/10:   6%|▌         | 137/2208 [00:08<01:42, 20.12it/s][A
Epoch 4/10:   6%|▋         | 140/2208 [00:08<01:41, 20.44it/s][A
Epoch 4/10:   6%|▋         | 143/2208 [00:08<01:40, 20.57it/s][A
Epoch 4/10:   7%|▋         | 146/2208 [00:08<01:38, 20.88it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:   7%|▋         | 152/2208 [00:09<01:46, 19.22it/s][A
Epoch 4/10:   7%|▋         | 155/2208 [00:09<01:43, 19.79it/s][A

Batch 150: Training loss = 0.2688, Training accuracy = 0.9072, F1 = 0.9070



Epoch 4/10:   7%|▋         | 158/2208 [00:09<01:41, 20.23it/s][A
Epoch 4/10:   7%|▋         | 161/2208 [00:09<01:39, 20.51it/s][A
Epoch 4/10:   7%|▋         | 164/2208 [00:09<01:38, 20.78it/s][A
Epoch 4/10:   8%|▊         | 167/2208 [00:10<01:37, 20.92it/s][A
Epoch 4/10:   8%|▊         | 170/2208 [00:10<01:36, 21.10it/s][A
Epoch 4/10:   8%|▊         | 173/2208 [00:10<01:45, 19.36it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:   8%|▊         | 179/2208 [00:10<01:53, 17.87it/s][A

Batch 175: Training loss = 0.3666, Training accuracy = 0.9073, F1 = 0.9070



Epoch 4/10:   8%|▊         | 182/2208 [00:10<01:48, 18.72it/s][A
Epoch 4/10:   8%|▊         | 185/2208 [00:10<01:44, 19.33it/s][A
Epoch 4/10:   9%|▊         | 188/2208 [00:11<01:42, 19.73it/s][A
Epoch 4/10:   9%|▊         | 191/2208 [00:11<01:53, 17.78it/s][A
Epoch 4/10:   9%|▊         | 193/2208 [00:11<01:55, 17.49it/s][A
Epoch 4/10:   9%|▉         | 195/2208 [00:11<01:51, 18.03it/s][A
Epoch 4/10:   9%|▉         | 197/2208 [00:11<01:50, 18.17it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:   9%|▉         | 202/2208 [00:12<02:09, 15.49it/s][A
Epoch 4/10:   9%|▉         | 205/2208 [00:12<01:57, 17.08it/s][A

Batch 200: Training loss = 0.2906, Training accuracy = 0.9071, F1 = 0.9070



Epoch 4/10:   9%|▉         | 207/2208 [00:12<01:53, 17.70it/s][A
Epoch 4/10:   9%|▉         | 209/2208 [00:12<01:49, 18.23it/s][A
Epoch 4/10:  10%|▉         | 211/2208 [00:12<01:54, 17.38it/s][A
Epoch 4/10:  10%|▉         | 213/2208 [00:12<02:08, 15.51it/s][A
Epoch 4/10:  10%|▉         | 215/2208 [00:12<02:07, 15.62it/s][A
Epoch 4/10:  10%|▉         | 217/2208 [00:12<02:09, 15.37it/s][A
Epoch 4/10:  10%|▉         | 220/2208 [00:13<01:55, 17.16it/s][A
Epoch 4/10:  10%|█         | 222/2208 [00:13<02:08, 15.42it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  10%|█         | 227/2208 [00:13<02:02, 16.23it/s][A
Epoch 4/10:  10%|█         | 230/2208 [00:13<01:52, 17.59it/s][A

Batch 225: Training loss = 0.2345, Training accuracy = 0.9084, F1 = 0.9082



Epoch 4/10:  11%|█         | 233/2208 [00:13<01:49, 18.12it/s][A
Epoch 4/10:  11%|█         | 235/2208 [00:13<01:46, 18.50it/s][A
Epoch 4/10:  11%|█         | 237/2208 [00:14<02:14, 14.65it/s][A
Epoch 4/10:  11%|█         | 240/2208 [00:14<01:59, 16.53it/s][A
Epoch 4/10:  11%|█         | 242/2208 [00:14<01:57, 16.76it/s][A
Epoch 4/10:  11%|█         | 245/2208 [00:14<02:07, 15.36it/s][A
Epoch 4/10:  11%|█         | 248/2208 [00:14<01:55, 16.92it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  11%|█▏        | 252/2208 [00:15<02:05, 15.58it/s][A
Epoch 4/10:  12%|█▏        | 254/2208 [00:15<01:58, 16.48it/s][A

Batch 250: Training loss = 0.3258, Training accuracy = 0.9090, F1 = 0.9088



Epoch 4/10:  12%|█▏        | 257/2208 [00:15<01:48, 17.97it/s][A
Epoch 4/10:  12%|█▏        | 260/2208 [00:15<01:42, 18.97it/s][A
Epoch 4/10:  12%|█▏        | 262/2208 [00:15<01:59, 16.25it/s][A
Epoch 4/10:  12%|█▏        | 265/2208 [00:15<01:56, 16.63it/s][A
Epoch 4/10:  12%|█▏        | 268/2208 [00:15<01:47, 18.01it/s][A
Epoch 4/10:  12%|█▏        | 271/2208 [00:16<01:42, 18.94it/s][A
Epoch 4/10:  12%|█▏        | 274/2208 [00:16<01:38, 19.57it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  13%|█▎        | 279/2208 [00:16<01:41, 19.03it/s][A

Batch 275: Training loss = 0.1934, Training accuracy = 0.9093, F1 = 0.9091



Epoch 4/10:  13%|█▎        | 282/2208 [00:16<01:37, 19.67it/s][A
Epoch 4/10:  13%|█▎        | 285/2208 [00:16<01:35, 20.08it/s][A
Epoch 4/10:  13%|█▎        | 288/2208 [00:16<01:34, 20.36it/s][A
Epoch 4/10:  13%|█▎        | 291/2208 [00:17<01:33, 20.54it/s][A
Epoch 4/10:  13%|█▎        | 294/2208 [00:17<01:32, 20.67it/s][A
Epoch 4/10:  13%|█▎        | 297/2208 [00:17<01:31, 20.93it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  14%|█▎        | 303/2208 [00:17<01:43, 18.45it/s][A

Batch 300: Training loss = 0.3021, Training accuracy = 0.9094, F1 = 0.9092



Epoch 4/10:  14%|█▍        | 306/2208 [00:17<01:38, 19.28it/s][A
Epoch 4/10:  14%|█▍        | 309/2208 [00:17<01:35, 19.94it/s][A
Epoch 4/10:  14%|█▍        | 312/2208 [00:18<01:33, 20.30it/s][A
Epoch 4/10:  14%|█▍        | 315/2208 [00:18<01:31, 20.59it/s][A
Epoch 4/10:  14%|█▍        | 318/2208 [00:18<01:30, 20.89it/s][A
Epoch 4/10:  15%|█▍        | 321/2208 [00:18<01:30, 20.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  15%|█▍        | 327/2208 [00:18<01:41, 18.47it/s][A
Epoch 4/10:  15%|█▍        | 330/2208 [00:18<01:38, 19.06it/s][A

Batch 325: Training loss = 0.2925, Training accuracy = 0.9096, F1 = 0.9094



Epoch 4/10:  15%|█▌        | 333/2208 [00:19<01:35, 19.69it/s][A
Epoch 4/10:  15%|█▌        | 336/2208 [00:19<01:34, 19.89it/s][A
Epoch 4/10:  15%|█▌        | 339/2208 [00:19<01:33, 20.00it/s][A
Epoch 4/10:  15%|█▌        | 342/2208 [00:19<01:31, 20.33it/s][A
Epoch 4/10:  16%|█▌        | 345/2208 [00:19<01:30, 20.64it/s][A
Epoch 4/10:  16%|█▌        | 348/2208 [00:19<01:30, 20.65it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  16%|█▌        | 354/2208 [00:20<01:36, 19.15it/s][A

Batch 350: Training loss = 0.2280, Training accuracy = 0.9095, F1 = 0.9094



Epoch 4/10:  16%|█▌        | 357/2208 [00:20<01:33, 19.75it/s][A
Epoch 4/10:  16%|█▋        | 360/2208 [00:20<01:31, 20.11it/s][A
Epoch 4/10:  16%|█▋        | 363/2208 [00:20<01:30, 20.29it/s][A
Epoch 4/10:  17%|█▋        | 366/2208 [00:20<01:29, 20.50it/s][A
Epoch 4/10:  17%|█▋        | 369/2208 [00:20<01:28, 20.81it/s][A
Epoch 4/10:  17%|█▋        | 372/2208 [00:21<01:27, 20.89it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  17%|█▋        | 378/2208 [00:21<01:40, 18.12it/s][A

Batch 375: Training loss = 0.4002, Training accuracy = 0.9092, F1 = 0.9091



Epoch 4/10:  17%|█▋        | 381/2208 [00:21<01:36, 18.92it/s][A
Epoch 4/10:  17%|█▋        | 384/2208 [00:21<01:33, 19.59it/s][A
Epoch 4/10:  18%|█▊        | 387/2208 [00:21<01:31, 19.92it/s][A
Epoch 4/10:  18%|█▊        | 390/2208 [00:21<01:29, 20.36it/s][A
Epoch 4/10:  18%|█▊        | 393/2208 [00:22<01:28, 20.55it/s][A
Epoch 4/10:  18%|█▊        | 396/2208 [00:22<01:27, 20.66it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  18%|█▊        | 402/2208 [00:22<01:39, 18.11it/s][A
Epoch 4/10:  18%|█▊        | 405/2208 [00:22<01:35, 18.92it/s][A

Batch 400: Training loss = 0.2603, Training accuracy = 0.9093, F1 = 0.9092



Epoch 4/10:  18%|█▊        | 408/2208 [00:22<01:31, 19.62it/s][A
Epoch 4/10:  19%|█▊        | 411/2208 [00:23<01:29, 20.04it/s][A
Epoch 4/10:  19%|█▉        | 414/2208 [00:23<01:28, 20.37it/s][A
Epoch 4/10:  19%|█▉        | 417/2208 [00:23<01:26, 20.65it/s][A
Epoch 4/10:  19%|█▉        | 420/2208 [00:23<01:26, 20.68it/s][A
Epoch 4/10:  19%|█▉        | 423/2208 [00:23<01:25, 20.89it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  19%|█▉        | 429/2208 [00:23<01:33, 18.96it/s][A

Batch 425: Training loss = 0.3134, Training accuracy = 0.9094, F1 = 0.9092



Epoch 4/10:  20%|█▉        | 432/2208 [00:24<01:30, 19.63it/s][A
Epoch 4/10:  20%|█▉        | 435/2208 [00:24<01:28, 20.04it/s][A
Epoch 4/10:  20%|█▉        | 438/2208 [00:24<01:26, 20.36it/s][A
Epoch 4/10:  20%|█▉        | 441/2208 [00:24<01:25, 20.60it/s][A
Epoch 4/10:  20%|██        | 444/2208 [00:24<01:24, 20.85it/s][A
Epoch 4/10:  20%|██        | 447/2208 [00:24<01:25, 20.71it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  21%|██        | 453/2208 [00:25<01:49, 16.02it/s][A

Batch 450: Training loss = 0.3654, Training accuracy = 0.9094, F1 = 0.9092



Epoch 4/10:  21%|██        | 456/2208 [00:25<01:41, 17.27it/s][A
Epoch 4/10:  21%|██        | 459/2208 [00:25<01:35, 18.40it/s][A
Epoch 4/10:  21%|██        | 462/2208 [00:25<01:31, 19.01it/s][A
Epoch 4/10:  21%|██        | 465/2208 [00:25<01:29, 19.52it/s][A
Epoch 4/10:  21%|██        | 468/2208 [00:25<01:27, 19.80it/s][A
Epoch 4/10:  21%|██▏       | 471/2208 [00:26<01:25, 20.22it/s][A
Epoch 4/10:  21%|██▏       | 474/2208 [00:26<01:29, 19.30it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  22%|██▏       | 479/2208 [00:26<01:40, 17.28it/s][A

Batch 475: Training loss = 0.2546, Training accuracy = 0.9096, F1 = 0.9094



Epoch 4/10:  22%|██▏       | 482/2208 [00:26<01:33, 18.36it/s][A
Epoch 4/10:  22%|██▏       | 485/2208 [00:26<01:29, 19.19it/s][A
Epoch 4/10:  22%|██▏       | 488/2208 [00:27<01:27, 19.68it/s][A
Epoch 4/10:  22%|██▏       | 491/2208 [00:27<01:25, 20.14it/s][A
Epoch 4/10:  22%|██▏       | 494/2208 [00:27<01:41, 16.82it/s][A
Epoch 4/10:  23%|██▎       | 497/2208 [00:27<01:42, 16.68it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  23%|██▎       | 502/2208 [00:27<01:48, 15.77it/s][A
Epoch 4/10:  23%|██▎       | 505/2208 [00:28<01:39, 17.12it/s][A

Batch 500: Training loss = 0.2098, Training accuracy = 0.9100, F1 = 0.9098



Epoch 4/10:  23%|██▎       | 508/2208 [00:28<01:33, 18.09it/s][A
Epoch 4/10:  23%|██▎       | 511/2208 [00:28<01:29, 18.96it/s][A
Epoch 4/10:  23%|██▎       | 514/2208 [00:28<01:27, 19.43it/s][A
Epoch 4/10:  23%|██▎       | 516/2208 [00:28<01:29, 18.95it/s][A
Epoch 4/10:  23%|██▎       | 518/2208 [00:28<01:32, 18.28it/s][A
Epoch 4/10:  24%|██▎       | 521/2208 [00:28<01:27, 19.20it/s][A
Epoch 4/10:  24%|██▎       | 523/2208 [00:29<01:29, 18.85it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  24%|██▍       | 529/2208 [00:29<01:46, 15.74it/s][A

Batch 525: Training loss = 0.2129, Training accuracy = 0.9101, F1 = 0.9099



Epoch 4/10:  24%|██▍       | 532/2208 [00:29<01:38, 17.04it/s][A
Epoch 4/10:  24%|██▍       | 535/2208 [00:29<01:31, 18.19it/s][A
Epoch 4/10:  24%|██▍       | 538/2208 [00:29<01:27, 19.01it/s][A
Epoch 4/10:  25%|██▍       | 541/2208 [00:30<01:24, 19.67it/s][A
Epoch 4/10:  25%|██▍       | 544/2208 [00:30<01:22, 20.20it/s][A
Epoch 4/10:  25%|██▍       | 547/2208 [00:30<01:29, 18.52it/s][A
Epoch 4/10:  25%|██▍       | 549/2208 [00:30<01:34, 17.62it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  25%|██▌       | 554/2208 [00:30<01:38, 16.74it/s][A

Batch 550: Training loss = 0.3102, Training accuracy = 0.9105, F1 = 0.9104



Epoch 4/10:  25%|██▌       | 557/2208 [00:30<01:31, 17.99it/s][A
Epoch 4/10:  25%|██▌       | 560/2208 [00:31<01:27, 18.91it/s][A
Epoch 4/10:  25%|██▌       | 563/2208 [00:31<01:23, 19.67it/s][A
Epoch 4/10:  26%|██▌       | 566/2208 [00:31<01:22, 20.02it/s][A
Epoch 4/10:  26%|██▌       | 569/2208 [00:31<01:20, 20.31it/s][A
Epoch 4/10:  26%|██▌       | 572/2208 [00:31<01:19, 20.60it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  26%|██▌       | 578/2208 [00:32<01:34, 17.33it/s][A

Batch 575: Training loss = 0.2711, Training accuracy = 0.9106, F1 = 0.9105



Epoch 4/10:  26%|██▋       | 581/2208 [00:32<01:28, 18.34it/s][A
Epoch 4/10:  26%|██▋       | 584/2208 [00:32<01:25, 19.08it/s][A
Epoch 4/10:  27%|██▋       | 587/2208 [00:32<01:21, 19.77it/s][A
Epoch 4/10:  27%|██▋       | 590/2208 [00:32<01:20, 20.21it/s][A
Epoch 4/10:  27%|██▋       | 593/2208 [00:32<01:18, 20.53it/s][A
Epoch 4/10:  27%|██▋       | 596/2208 [00:32<01:17, 20.70it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  27%|██▋       | 602/2208 [00:33<01:33, 17.09it/s][A
Epoch 4/10:  27%|██▋       | 605/2208 [00:33<01:28, 18.10it/s][A

Batch 600: Training loss = 0.3359, Training accuracy = 0.9108, F1 = 0.9107



Epoch 4/10:  28%|██▊       | 608/2208 [00:33<01:24, 18.99it/s][A
Epoch 4/10:  28%|██▊       | 611/2208 [00:33<01:21, 19.61it/s][A
Epoch 4/10:  28%|██▊       | 614/2208 [00:33<01:19, 20.02it/s][A
Epoch 4/10:  28%|██▊       | 617/2208 [00:34<01:18, 20.26it/s][A
Epoch 4/10:  28%|██▊       | 620/2208 [00:34<01:17, 20.49it/s][A
Epoch 4/10:  28%|██▊       | 623/2208 [00:34<01:16, 20.75it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  28%|██▊       | 629/2208 [00:34<01:27, 18.01it/s][A

Batch 625: Training loss = 0.2649, Training accuracy = 0.9107, F1 = 0.9105



Epoch 4/10:  29%|██▊       | 632/2208 [00:34<01:23, 18.88it/s][A
Epoch 4/10:  29%|██▉       | 635/2208 [00:34<01:19, 19.67it/s][A
Epoch 4/10:  29%|██▉       | 638/2208 [00:35<01:17, 20.15it/s][A
Epoch 4/10:  29%|██▉       | 641/2208 [00:35<01:16, 20.40it/s][A
Epoch 4/10:  29%|██▉       | 644/2208 [00:35<01:15, 20.65it/s][A
Epoch 4/10:  29%|██▉       | 647/2208 [00:35<01:15, 20.78it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  30%|██▉       | 653/2208 [00:35<01:39, 15.56it/s][A

Batch 650: Training loss = 0.2362, Training accuracy = 0.9109, F1 = 0.9107



Epoch 4/10:  30%|██▉       | 656/2208 [00:36<01:31, 17.00it/s][A
Epoch 4/10:  30%|██▉       | 659/2208 [00:36<01:25, 18.15it/s][A
Epoch 4/10:  30%|██▉       | 662/2208 [00:36<01:21, 19.05it/s][A
Epoch 4/10:  30%|███       | 665/2208 [00:36<01:18, 19.71it/s][A
Epoch 4/10:  30%|███       | 668/2208 [00:36<01:16, 20.24it/s][A
Epoch 4/10:  30%|███       | 671/2208 [00:36<01:15, 20.40it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  31%|███       | 677/2208 [00:37<01:31, 16.74it/s][A
Epoch 4/10:  31%|███       | 680/2208 [00:37<01:25, 17.93it/s][A

Batch 675: Training loss = 0.3431, Training accuracy = 0.9114, F1 = 0.9113



Epoch 4/10:  31%|███       | 683/2208 [00:37<01:20, 18.84it/s][A
Epoch 4/10:  31%|███       | 686/2208 [00:37<01:18, 19.35it/s][A
Epoch 4/10:  31%|███       | 689/2208 [00:37<01:16, 19.88it/s][A
Epoch 4/10:  31%|███▏      | 692/2208 [00:37<01:14, 20.27it/s][A
Epoch 4/10:  31%|███▏      | 695/2208 [00:38<01:13, 20.46it/s][A
Epoch 4/10:  32%|███▏      | 698/2208 [00:38<01:13, 20.61it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  32%|███▏      | 704/2208 [00:38<01:25, 17.69it/s][A

Batch 700: Training loss = 0.3537, Training accuracy = 0.9116, F1 = 0.9114



Epoch 4/10:  32%|███▏      | 707/2208 [00:38<01:20, 18.69it/s][A
Epoch 4/10:  32%|███▏      | 710/2208 [00:38<01:17, 19.38it/s][A
Epoch 4/10:  32%|███▏      | 713/2208 [00:39<01:15, 19.83it/s][A
Epoch 4/10:  32%|███▏      | 716/2208 [00:39<01:13, 20.21it/s][A
Epoch 4/10:  33%|███▎      | 719/2208 [00:39<01:12, 20.57it/s][A
Epoch 4/10:  33%|███▎      | 722/2208 [00:39<01:11, 20.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  33%|███▎      | 728/2208 [00:39<01:35, 15.46it/s][A

Batch 725: Training loss = 0.2876, Training accuracy = 0.9116, F1 = 0.9114



Epoch 4/10:  33%|███▎      | 731/2208 [00:40<01:27, 16.87it/s][A
Epoch 4/10:  33%|███▎      | 734/2208 [00:40<01:22, 17.83it/s][A
Epoch 4/10:  33%|███▎      | 737/2208 [00:40<01:18, 18.63it/s][A
Epoch 4/10:  34%|███▎      | 740/2208 [00:40<01:16, 19.31it/s][A
Epoch 4/10:  34%|███▎      | 743/2208 [00:40<01:14, 19.77it/s][A
Epoch 4/10:  34%|███▍      | 746/2208 [00:40<01:12, 20.19it/s][A
Epoch 4/10:  34%|███▍      | 749/2208 [00:41<01:32, 15.70it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  34%|███▍      | 754/2208 [00:41<01:35, 15.18it/s][A

Batch 750: Training loss = 0.3344, Training accuracy = 0.9117, F1 = 0.9115



Epoch 4/10:  34%|███▍      | 757/2208 [00:41<01:27, 16.65it/s][A
Epoch 4/10:  34%|███▍      | 760/2208 [00:41<01:21, 17.75it/s][A
Epoch 4/10:  35%|███▍      | 763/2208 [00:41<01:17, 18.66it/s][A
Epoch 4/10:  35%|███▍      | 766/2208 [00:42<01:14, 19.28it/s][A
Epoch 4/10:  35%|███▍      | 769/2208 [00:42<01:12, 19.80it/s][A
Epoch 4/10:  35%|███▍      | 772/2208 [00:42<01:11, 20.22it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  35%|███▌      | 778/2208 [00:42<01:33, 15.21it/s][A

Batch 775: Training loss = 0.2711, Training accuracy = 0.9118, F1 = 0.9117



Epoch 4/10:  35%|███▌      | 781/2208 [00:42<01:25, 16.61it/s][A
Epoch 4/10:  36%|███▌      | 784/2208 [00:43<01:20, 17.66it/s][A
Epoch 4/10:  36%|███▌      | 787/2208 [00:43<01:16, 18.55it/s][A
Epoch 4/10:  36%|███▌      | 790/2208 [00:43<01:14, 19.13it/s][A
Epoch 4/10:  36%|███▌      | 793/2208 [00:43<01:12, 19.61it/s][A
Epoch 4/10:  36%|███▌      | 796/2208 [00:43<01:11, 19.70it/s][A
Epoch 4/10:  36%|███▌      | 799/2208 [00:43<01:12, 19.52it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  36%|███▋      | 804/2208 [00:44<01:29, 15.67it/s][A

Batch 800: Training loss = 0.2013, Training accuracy = 0.9120, F1 = 0.9118



Epoch 4/10:  37%|███▋      | 807/2208 [00:44<01:21, 17.09it/s][A
Epoch 4/10:  37%|███▋      | 810/2208 [00:44<01:17, 18.08it/s][A
Epoch 4/10:  37%|███▋      | 813/2208 [00:44<01:13, 18.94it/s][A
Epoch 4/10:  37%|███▋      | 816/2208 [00:44<01:11, 19.50it/s][A
Epoch 4/10:  37%|███▋      | 819/2208 [00:44<01:09, 19.94it/s][A
Epoch 4/10:  37%|███▋      | 822/2208 [00:45<01:08, 20.30it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  38%|███▊      | 828/2208 [00:45<01:29, 15.50it/s][A

Batch 825: Training loss = 0.2957, Training accuracy = 0.9123, F1 = 0.9122



Epoch 4/10:  38%|███▊      | 831/2208 [00:45<01:21, 16.99it/s][A
Epoch 4/10:  38%|███▊      | 834/2208 [00:45<01:16, 18.05it/s][A
Epoch 4/10:  38%|███▊      | 837/2208 [00:45<01:12, 18.86it/s][A
Epoch 4/10:  38%|███▊      | 840/2208 [00:46<01:10, 19.50it/s][A
Epoch 4/10:  38%|███▊      | 843/2208 [00:46<01:08, 19.96it/s][A
Epoch 4/10:  38%|███▊      | 846/2208 [00:46<01:06, 20.36it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  39%|███▊      | 852/2208 [00:46<01:24, 16.06it/s][A
Epoch 4/10:  39%|███▊      | 855/2208 [00:46<01:17, 17.37it/s][A

Batch 850: Training loss = 0.3165, Training accuracy = 0.9125, F1 = 0.9123



Epoch 4/10:  39%|███▉      | 858/2208 [00:47<01:13, 18.35it/s][A
Epoch 4/10:  39%|███▉      | 861/2208 [00:47<01:10, 19.17it/s][A
Epoch 4/10:  39%|███▉      | 864/2208 [00:47<01:07, 19.77it/s][A
Epoch 4/10:  39%|███▉      | 867/2208 [00:47<01:06, 20.08it/s][A
Epoch 4/10:  39%|███▉      | 870/2208 [00:47<01:05, 20.36it/s][A
Epoch 4/10:  40%|███▉      | 873/2208 [00:47<01:05, 20.53it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  40%|███▉      | 879/2208 [00:48<01:17, 17.14it/s][A

Batch 875: Training loss = 0.2692, Training accuracy = 0.9125, F1 = 0.9123



Epoch 4/10:  40%|███▉      | 882/2208 [00:48<01:13, 18.16it/s][A
Epoch 4/10:  40%|████      | 885/2208 [00:48<01:09, 18.96it/s][A
Epoch 4/10:  40%|████      | 888/2208 [00:48<01:07, 19.57it/s][A
Epoch 4/10:  40%|████      | 891/2208 [00:48<01:05, 20.12it/s][A
Epoch 4/10:  40%|████      | 894/2208 [00:48<01:04, 20.29it/s][A
Epoch 4/10:  41%|████      | 897/2208 [00:49<01:03, 20.59it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  41%|████      | 903/2208 [00:49<01:26, 15.14it/s][A

Batch 900: Training loss = 0.2911, Training accuracy = 0.9126, F1 = 0.9125



Epoch 4/10:  41%|████      | 906/2208 [00:49<01:18, 16.57it/s][A
Epoch 4/10:  41%|████      | 909/2208 [00:49<01:13, 17.69it/s][A
Epoch 4/10:  41%|████▏     | 912/2208 [00:49<01:09, 18.63it/s][A
Epoch 4/10:  41%|████▏     | 915/2208 [00:50<01:06, 19.31it/s][A
Epoch 4/10:  42%|████▏     | 918/2208 [00:50<01:05, 19.85it/s][A
Epoch 4/10:  42%|████▏     | 921/2208 [00:50<01:03, 20.19it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  42%|████▏     | 927/2208 [00:50<01:22, 15.50it/s][A
Epoch 4/10:  42%|████▏     | 930/2208 [00:50<01:15, 16.94it/s][A

Batch 925: Training loss = 0.2405, Training accuracy = 0.9127, F1 = 0.9126



Epoch 4/10:  42%|████▏     | 933/2208 [00:51<01:10, 17.97it/s][A
Epoch 4/10:  42%|████▏     | 936/2208 [00:51<01:07, 18.80it/s][A
Epoch 4/10:  43%|████▎     | 939/2208 [00:51<01:05, 19.46it/s][A
Epoch 4/10:  43%|████▎     | 942/2208 [00:51<01:03, 19.98it/s][A
Epoch 4/10:  43%|████▎     | 945/2208 [00:51<01:01, 20.39it/s][A
Epoch 4/10:  43%|████▎     | 948/2208 [00:51<01:01, 20.55it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  43%|████▎     | 954/2208 [00:52<01:14, 16.91it/s][A

Batch 950: Training loss = 0.3288, Training accuracy = 0.9129, F1 = 0.9127



Epoch 4/10:  43%|████▎     | 957/2208 [00:52<01:09, 18.01it/s][A
Epoch 4/10:  43%|████▎     | 960/2208 [00:52<01:06, 18.76it/s][A
Epoch 4/10:  44%|████▎     | 963/2208 [00:52<01:04, 19.32it/s][A
Epoch 4/10:  44%|████▍     | 966/2208 [00:52<01:02, 19.90it/s][A
Epoch 4/10:  44%|████▍     | 969/2208 [00:52<01:01, 20.27it/s][A
Epoch 4/10:  44%|████▍     | 972/2208 [00:53<01:00, 20.53it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  44%|████▍     | 978/2208 [00:53<01:22, 14.94it/s][A

Batch 975: Training loss = 0.3234, Training accuracy = 0.9129, F1 = 0.9127



Epoch 4/10:  44%|████▍     | 981/2208 [00:53<01:14, 16.48it/s][A
Epoch 4/10:  45%|████▍     | 984/2208 [00:53<01:09, 17.69it/s][A
Epoch 4/10:  45%|████▍     | 987/2208 [00:54<01:05, 18.59it/s][A
Epoch 4/10:  45%|████▍     | 990/2208 [00:54<01:02, 19.39it/s][A
Epoch 4/10:  45%|████▍     | 993/2208 [00:54<01:01, 19.91it/s][A
Epoch 4/10:  45%|████▌     | 996/2208 [00:54<00:59, 20.24it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  45%|████▌     | 1002/2208 [00:54<01:25, 14.15it/s][A
Epoch 4/10:  46%|████▌     | 1005/2208 [00:55<01:15, 15.85it/s][A

Batch 1000: Training loss = 0.2188, Training accuracy = 0.9131, F1 = 0.9129



Epoch 4/10:  46%|████▌     | 1008/2208 [00:55<01:09, 17.17it/s][A
Epoch 4/10:  46%|████▌     | 1011/2208 [00:55<01:05, 18.19it/s][A
Epoch 4/10:  46%|████▌     | 1014/2208 [00:55<01:03, 18.87it/s][A
Epoch 4/10:  46%|████▌     | 1017/2208 [00:55<01:01, 19.48it/s][A
Epoch 4/10:  46%|████▌     | 1020/2208 [00:55<01:03, 18.71it/s][A
Epoch 4/10:  46%|████▋     | 1022/2208 [00:55<01:07, 17.50it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  47%|████▋     | 1027/2208 [00:56<01:34, 12.53it/s][A
Epoch 4/10:  47%|████▋     | 1030/2208 [00:56<01:20, 14.54it/s][A

Batch 1025: Training loss = 0.1310, Training accuracy = 0.9131, F1 = 0.9129



Epoch 4/10:  47%|████▋     | 1033/2208 [00:56<01:12, 16.28it/s][A
Epoch 4/10:  47%|████▋     | 1036/2208 [00:56<01:07, 17.47it/s][A
Epoch 4/10:  47%|████▋     | 1039/2208 [00:57<01:03, 18.38it/s][A
Epoch 4/10:  47%|████▋     | 1042/2208 [00:57<01:00, 19.20it/s][A
Epoch 4/10:  47%|████▋     | 1045/2208 [00:57<01:07, 17.32it/s][A
Epoch 4/10:  47%|████▋     | 1048/2208 [00:57<01:02, 18.45it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  48%|████▊     | 1054/2208 [00:58<01:23, 13.86it/s][A

Batch 1050: Training loss = 0.2935, Training accuracy = 0.9134, F1 = 0.9132



Epoch 4/10:  48%|████▊     | 1057/2208 [00:58<01:14, 15.50it/s][A
Epoch 4/10:  48%|████▊     | 1059/2208 [00:58<01:10, 16.29it/s][A
Epoch 4/10:  48%|████▊     | 1062/2208 [00:58<01:05, 17.58it/s][A
Epoch 4/10:  48%|████▊     | 1065/2208 [00:58<01:01, 18.49it/s][A
Epoch 4/10:  48%|████▊     | 1067/2208 [00:58<01:03, 18.02it/s][A
Epoch 4/10:  48%|████▊     | 1070/2208 [00:58<01:02, 18.15it/s][A
Epoch 4/10:  49%|████▊     | 1073/2208 [00:59<00:59, 19.04it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  49%|████▉     | 1077/2208 [00:59<01:26, 13.14it/s][A
Epoch 4/10:  49%|████▉     | 1080/2208 [00:59<01:14, 15.18it/s][A

Batch 1075: Training loss = 0.1520, Training accuracy = 0.9135, F1 = 0.9133



Epoch 4/10:  49%|████▉     | 1083/2208 [00:59<01:07, 16.78it/s][A
Epoch 4/10:  49%|████▉     | 1086/2208 [00:59<01:02, 17.94it/s][A
Epoch 4/10:  49%|████▉     | 1088/2208 [00:59<01:01, 18.35it/s][A
Epoch 4/10:  49%|████▉     | 1091/2208 [01:00<00:58, 19.25it/s][A
Epoch 4/10:  50%|████▉     | 1094/2208 [01:00<00:56, 19.87it/s][A
Epoch 4/10:  50%|████▉     | 1097/2208 [01:00<00:54, 20.36it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  50%|████▉     | 1103/2208 [01:00<01:15, 14.61it/s][A

Batch 1100: Training loss = 0.2852, Training accuracy = 0.9135, F1 = 0.9133



Epoch 4/10:  50%|█████     | 1106/2208 [01:00<01:07, 16.23it/s][A
Epoch 4/10:  50%|█████     | 1109/2208 [01:01<01:02, 17.51it/s][A
Epoch 4/10:  50%|█████     | 1111/2208 [01:01<01:00, 18.01it/s][A
Epoch 4/10:  50%|█████     | 1114/2208 [01:01<00:57, 18.95it/s][A
Epoch 4/10:  51%|█████     | 1117/2208 [01:01<00:56, 19.42it/s][A
Epoch 4/10:  51%|█████     | 1120/2208 [01:01<00:54, 20.09it/s][A
Epoch 4/10:  51%|█████     | 1123/2208 [01:01<00:53, 20.42it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  51%|█████     | 1129/2208 [01:02<01:06, 16.29it/s][A

Batch 1125: Training loss = 0.2453, Training accuracy = 0.9137, F1 = 0.9135



Epoch 4/10:  51%|█████▏    | 1132/2208 [01:02<01:01, 17.48it/s][A
Epoch 4/10:  51%|█████▏    | 1135/2208 [01:02<00:57, 18.51it/s][A
Epoch 4/10:  52%|█████▏    | 1138/2208 [01:02<00:55, 19.21it/s][A
Epoch 4/10:  52%|█████▏    | 1141/2208 [01:02<00:53, 19.76it/s][A
Epoch 4/10:  52%|█████▏    | 1144/2208 [01:02<00:52, 20.24it/s][A
Epoch 4/10:  52%|█████▏    | 1147/2208 [01:03<00:51, 20.50it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  52%|█████▏    | 1153/2208 [01:03<01:16, 13.77it/s][A

Batch 1150: Training loss = 0.2331, Training accuracy = 0.9139, F1 = 0.9138



Epoch 4/10:  52%|█████▏    | 1156/2208 [01:03<01:07, 15.48it/s][A
Epoch 4/10:  52%|█████▏    | 1159/2208 [01:03<01:02, 16.84it/s][A
Epoch 4/10:  53%|█████▎    | 1161/2208 [01:04<01:00, 17.38it/s][A
Epoch 4/10:  53%|█████▎    | 1164/2208 [01:04<00:56, 18.37it/s][A
Epoch 4/10:  53%|█████▎    | 1167/2208 [01:04<00:54, 19.12it/s][A
Epoch 4/10:  53%|█████▎    | 1170/2208 [01:04<00:52, 19.64it/s][A
Epoch 4/10:  53%|█████▎    | 1173/2208 [01:04<00:51, 20.19it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  53%|█████▎    | 1179/2208 [01:05<01:05, 15.77it/s][A

Batch 1175: Training loss = 0.2630, Training accuracy = 0.9140, F1 = 0.9139



Epoch 4/10:  54%|█████▎    | 1182/2208 [01:05<00:59, 17.17it/s][A
Epoch 4/10:  54%|█████▎    | 1185/2208 [01:05<00:56, 18.17it/s][A
Epoch 4/10:  54%|█████▍    | 1188/2208 [01:05<00:53, 19.08it/s][A
Epoch 4/10:  54%|█████▍    | 1191/2208 [01:05<00:51, 19.69it/s][A
Epoch 4/10:  54%|█████▍    | 1194/2208 [01:05<00:50, 20.04it/s][A
Epoch 4/10:  54%|█████▍    | 1197/2208 [01:05<00:49, 20.45it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  54%|█████▍    | 1203/2208 [01:06<01:12, 13.78it/s][A

Batch 1200: Training loss = 0.2632, Training accuracy = 0.9140, F1 = 0.9139



Epoch 4/10:  55%|█████▍    | 1206/2208 [01:06<01:04, 15.48it/s][A
Epoch 4/10:  55%|█████▍    | 1209/2208 [01:06<00:59, 16.91it/s][A
Epoch 4/10:  55%|█████▍    | 1212/2208 [01:06<00:55, 18.05it/s][A
Epoch 4/10:  55%|█████▌    | 1215/2208 [01:07<00:52, 18.89it/s][A
Epoch 4/10:  55%|█████▌    | 1218/2208 [01:07<00:50, 19.51it/s][A
Epoch 4/10:  55%|█████▌    | 1221/2208 [01:07<00:49, 20.02it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  56%|█████▌    | 1227/2208 [01:07<01:11, 13.79it/s][A
Epoch 4/10:  56%|█████▌    | 1230/2208 [01:07<01:02, 15.55it/s][A

Batch 1225: Training loss = 0.2110, Training accuracy = 0.9142, F1 = 0.9141



Epoch 4/10:  56%|█████▌    | 1233/2208 [01:08<00:57, 16.95it/s][A
Epoch 4/10:  56%|█████▌    | 1236/2208 [01:08<00:53, 18.09it/s][A
Epoch 4/10:  56%|█████▌    | 1239/2208 [01:08<00:51, 18.96it/s][A
Epoch 4/10:  56%|█████▋    | 1242/2208 [01:08<00:49, 19.54it/s][A
Epoch 4/10:  56%|█████▋    | 1245/2208 [01:08<00:47, 20.09it/s][A
Epoch 4/10:  57%|█████▋    | 1248/2208 [01:08<00:47, 20.18it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  57%|█████▋    | 1254/2208 [01:09<01:04, 14.69it/s][A

Batch 1250: Training loss = 0.2125, Training accuracy = 0.9144, F1 = 0.9142



Epoch 4/10:  57%|█████▋    | 1257/2208 [01:09<00:58, 16.15it/s][A
Epoch 4/10:  57%|█████▋    | 1260/2208 [01:09<00:54, 17.26it/s][A
Epoch 4/10:  57%|█████▋    | 1263/2208 [01:09<00:51, 18.28it/s][A
Epoch 4/10:  57%|█████▋    | 1266/2208 [01:09<00:49, 19.04it/s][A
Epoch 4/10:  57%|█████▋    | 1269/2208 [01:10<00:47, 19.71it/s][A
Epoch 4/10:  58%|█████▊    | 1272/2208 [01:10<00:46, 20.14it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  58%|█████▊    | 1277/2208 [01:10<01:18, 11.84it/s][A
Epoch 4/10:  58%|█████▊    | 1280/2208 [01:10<01:06, 13.88it/s][A

Batch 1275: Training loss = 0.3011, Training accuracy = 0.9147, F1 = 0.9145



Epoch 4/10:  58%|█████▊    | 1283/2208 [01:11<00:59, 15.58it/s][A
Epoch 4/10:  58%|█████▊    | 1286/2208 [01:11<00:54, 16.95it/s][A
Epoch 4/10:  58%|█████▊    | 1289/2208 [01:11<00:50, 18.12it/s][A
Epoch 4/10:  59%|█████▊    | 1292/2208 [01:11<00:48, 18.96it/s][A
Epoch 4/10:  59%|█████▊    | 1295/2208 [01:11<00:50, 18.16it/s][A
Epoch 4/10:  59%|█████▊    | 1297/2208 [01:11<00:54, 16.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  59%|█████▉    | 1302/2208 [01:12<01:18, 11.48it/s][A
Epoch 4/10:  59%|█████▉    | 1305/2208 [01:12<01:06, 13.59it/s][A

Batch 1300: Training loss = 0.2385, Training accuracy = 0.9147, F1 = 0.9146



Epoch 4/10:  59%|█████▉    | 1308/2208 [01:12<00:58, 15.39it/s][A
Epoch 4/10:  59%|█████▉    | 1311/2208 [01:12<00:53, 16.77it/s][A
Epoch 4/10:  60%|█████▉    | 1314/2208 [01:12<00:50, 17.83it/s][A
Epoch 4/10:  60%|█████▉    | 1317/2208 [01:13<00:47, 18.73it/s][A
Epoch 4/10:  60%|█████▉    | 1320/2208 [01:13<00:45, 19.44it/s][A
Epoch 4/10:  60%|█████▉    | 1323/2208 [01:13<00:44, 19.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  60%|██████    | 1329/2208 [01:13<01:00, 14.54it/s][A

Batch 1325: Training loss = 0.1280, Training accuracy = 0.9148, F1 = 0.9147



Epoch 4/10:  60%|██████    | 1332/2208 [01:14<00:54, 16.09it/s][A
Epoch 4/10:  60%|██████    | 1335/2208 [01:14<00:50, 17.36it/s][A
Epoch 4/10:  61%|██████    | 1338/2208 [01:14<00:47, 18.45it/s][A
Epoch 4/10:  61%|██████    | 1341/2208 [01:14<00:45, 19.13it/s][A
Epoch 4/10:  61%|██████    | 1344/2208 [01:14<00:43, 19.70it/s][A
Epoch 4/10:  61%|██████    | 1347/2208 [01:14<00:42, 20.08it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  61%|██████▏   | 1353/2208 [01:15<01:03, 13.38it/s][A

Batch 1350: Training loss = 0.1917, Training accuracy = 0.9151, F1 = 0.9149



Epoch 4/10:  61%|██████▏   | 1356/2208 [01:15<00:56, 15.10it/s][A
Epoch 4/10:  62%|██████▏   | 1359/2208 [01:15<00:51, 16.54it/s][A
Epoch 4/10:  62%|██████▏   | 1362/2208 [01:15<00:47, 17.65it/s][A
Epoch 4/10:  62%|██████▏   | 1365/2208 [01:15<00:45, 18.62it/s][A
Epoch 4/10:  62%|██████▏   | 1368/2208 [01:16<00:43, 19.28it/s][A
Epoch 4/10:  62%|██████▏   | 1371/2208 [01:16<00:42, 19.85it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  62%|██████▏   | 1377/2208 [01:16<01:01, 13.41it/s][A
Epoch 4/10:  62%|██████▎   | 1380/2208 [01:16<00:54, 15.20it/s][A

Batch 1375: Training loss = 0.2419, Training accuracy = 0.9151, F1 = 0.9150



Epoch 4/10:  63%|██████▎   | 1383/2208 [01:17<00:49, 16.66it/s][A
Epoch 4/10:  63%|██████▎   | 1386/2208 [01:17<00:46, 17.83it/s][A
Epoch 4/10:  63%|██████▎   | 1389/2208 [01:17<00:43, 18.69it/s][A
Epoch 4/10:  63%|██████▎   | 1392/2208 [01:17<00:42, 19.41it/s][A
Epoch 4/10:  63%|██████▎   | 1395/2208 [01:17<00:41, 19.75it/s][A
Epoch 4/10:  63%|██████▎   | 1398/2208 [01:17<00:40, 20.08it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  64%|██████▎   | 1404/2208 [01:18<00:53, 15.10it/s][A

Batch 1400: Training loss = 0.2153, Training accuracy = 0.9151, F1 = 0.9150



Epoch 4/10:  64%|██████▎   | 1407/2208 [01:18<00:48, 16.57it/s][A
Epoch 4/10:  64%|██████▍   | 1410/2208 [01:18<00:45, 17.66it/s][A
Epoch 4/10:  64%|██████▍   | 1413/2208 [01:18<00:42, 18.66it/s][A
Epoch 4/10:  64%|██████▍   | 1416/2208 [01:18<00:40, 19.47it/s][A
Epoch 4/10:  64%|██████▍   | 1419/2208 [01:18<00:39, 20.03it/s][A
Epoch 4/10:  64%|██████▍   | 1422/2208 [01:19<00:38, 20.30it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  65%|██████▍   | 1428/2208 [01:19<01:00, 12.95it/s][A

Batch 1425: Training loss = 0.1915, Training accuracy = 0.9152, F1 = 0.9151



Epoch 4/10:  65%|██████▍   | 1431/2208 [01:19<00:52, 14.73it/s][A
Epoch 4/10:  65%|██████▍   | 1434/2208 [01:19<00:47, 16.33it/s][A
Epoch 4/10:  65%|██████▌   | 1437/2208 [01:20<00:43, 17.60it/s][A
Epoch 4/10:  65%|██████▌   | 1440/2208 [01:20<00:41, 18.48it/s][A
Epoch 4/10:  65%|██████▌   | 1443/2208 [01:20<00:40, 19.02it/s][A
Epoch 4/10:  65%|██████▌   | 1446/2208 [01:20<00:38, 19.69it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  66%|██████▌   | 1452/2208 [01:21<00:59, 12.74it/s][A
Epoch 4/10:  66%|██████▌   | 1455/2208 [01:21<00:51, 14.56it/s][A

Batch 1450: Training loss = 0.3643, Training accuracy = 0.9152, F1 = 0.9150



Epoch 4/10:  66%|██████▌   | 1458/2208 [01:21<00:46, 16.12it/s][A
Epoch 4/10:  66%|██████▌   | 1461/2208 [01:21<00:42, 17.42it/s][A
Epoch 4/10:  66%|██████▋   | 1464/2208 [01:21<00:40, 18.33it/s][A
Epoch 4/10:  66%|██████▋   | 1467/2208 [01:21<00:38, 19.07it/s][A
Epoch 4/10:  67%|██████▋   | 1470/2208 [01:21<00:37, 19.73it/s][A
Epoch 4/10:  67%|██████▋   | 1473/2208 [01:22<00:36, 20.07it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  67%|██████▋   | 1479/2208 [01:22<00:50, 14.53it/s][A

Batch 1475: Training loss = 0.2085, Training accuracy = 0.9153, F1 = 0.9152



Epoch 4/10:  67%|██████▋   | 1482/2208 [01:22<00:45, 16.07it/s][A
Epoch 4/10:  67%|██████▋   | 1485/2208 [01:22<00:41, 17.25it/s][A
Epoch 4/10:  67%|██████▋   | 1488/2208 [01:23<00:39, 18.34it/s][A
Epoch 4/10:  68%|██████▊   | 1491/2208 [01:23<00:37, 19.16it/s][A
Epoch 4/10:  68%|██████▊   | 1494/2208 [01:23<00:36, 19.62it/s][A
Epoch 4/10:  68%|██████▊   | 1497/2208 [01:23<00:36, 19.40it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  68%|██████▊   | 1502/2208 [01:24<01:04, 10.99it/s][A
Epoch 4/10:  68%|██████▊   | 1505/2208 [01:24<00:53, 13.09it/s][A

Batch 1500: Training loss = 0.2033, Training accuracy = 0.9154, F1 = 0.9152



Epoch 4/10:  68%|██████▊   | 1508/2208 [01:24<00:47, 14.87it/s][A
Epoch 4/10:  68%|██████▊   | 1511/2208 [01:24<00:42, 16.32it/s][A
Epoch 4/10:  69%|██████▊   | 1514/2208 [01:24<00:39, 17.51it/s][A
Epoch 4/10:  69%|██████▊   | 1517/2208 [01:24<00:37, 18.58it/s][A
Epoch 4/10:  69%|██████▉   | 1520/2208 [01:25<00:35, 19.19it/s][A
Epoch 4/10:  69%|██████▉   | 1523/2208 [01:25<00:35, 19.56it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  69%|██████▉   | 1529/2208 [01:25<00:51, 13.30it/s][A

Batch 1525: Training loss = 0.3409, Training accuracy = 0.9154, F1 = 0.9153



Epoch 4/10:  69%|██████▉   | 1532/2208 [01:25<00:45, 15.01it/s][A
Epoch 4/10:  70%|██████▉   | 1535/2208 [01:26<00:40, 16.45it/s][A
Epoch 4/10:  70%|██████▉   | 1538/2208 [01:26<00:38, 17.53it/s][A
Epoch 4/10:  70%|██████▉   | 1540/2208 [01:26<00:37, 18.00it/s][A
Epoch 4/10:  70%|██████▉   | 1543/2208 [01:26<00:35, 18.79it/s][A
Epoch 4/10:  70%|███████   | 1546/2208 [01:26<00:36, 17.96it/s][A
Epoch 4/10:  70%|███████   | 1549/2208 [01:26<00:35, 18.81it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  70%|███████   | 1554/2208 [01:27<00:49, 13.23it/s][A

Batch 1550: Training loss = 0.1673, Training accuracy = 0.9155, F1 = 0.9153



Epoch 4/10:  71%|███████   | 1557/2208 [01:27<00:43, 15.01it/s][A
Epoch 4/10:  71%|███████   | 1560/2208 [01:27<00:39, 16.49it/s][A
Epoch 4/10:  71%|███████   | 1563/2208 [01:27<00:36, 17.56it/s][A
Epoch 4/10:  71%|███████   | 1566/2208 [01:27<00:34, 18.57it/s][A
Epoch 4/10:  71%|███████   | 1569/2208 [01:28<00:32, 19.42it/s][A
Epoch 4/10:  71%|███████   | 1572/2208 [01:28<00:31, 20.03it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  71%|███████▏  | 1578/2208 [01:28<00:49, 12.66it/s][A

Batch 1575: Training loss = 0.2049, Training accuracy = 0.9155, F1 = 0.9154



Epoch 4/10:  72%|███████▏  | 1581/2208 [01:28<00:43, 14.47it/s][A
Epoch 4/10:  72%|███████▏  | 1584/2208 [01:29<00:39, 16.00it/s][A
Epoch 4/10:  72%|███████▏  | 1587/2208 [01:29<00:36, 17.25it/s][A
Epoch 4/10:  72%|███████▏  | 1590/2208 [01:29<00:34, 18.09it/s][A
Epoch 4/10:  72%|███████▏  | 1593/2208 [01:29<00:32, 18.81it/s][A
Epoch 4/10:  72%|███████▏  | 1596/2208 [01:29<00:31, 19.35it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  73%|███████▎  | 1602/2208 [01:30<00:50, 11.92it/s][A
Epoch 4/10:  73%|███████▎  | 1605/2208 [01:30<00:43, 13.80it/s][A

Batch 1600: Training loss = 0.2515, Training accuracy = 0.9156, F1 = 0.9155



Epoch 4/10:  73%|███████▎  | 1608/2208 [01:30<00:38, 15.46it/s][A
Epoch 4/10:  73%|███████▎  | 1611/2208 [01:30<00:35, 16.80it/s][A
Epoch 4/10:  73%|███████▎  | 1614/2208 [01:30<00:33, 17.85it/s][A
Epoch 4/10:  73%|███████▎  | 1617/2208 [01:31<00:31, 18.73it/s][A
Epoch 4/10:  73%|███████▎  | 1620/2208 [01:31<00:30, 19.50it/s][A
Epoch 4/10:  74%|███████▎  | 1623/2208 [01:31<00:29, 19.86it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  74%|███████▍  | 1629/2208 [01:31<00:40, 14.21it/s][A

Batch 1625: Training loss = 0.1070, Training accuracy = 0.9157, F1 = 0.9156



Epoch 4/10:  74%|███████▍  | 1632/2208 [01:32<00:36, 15.76it/s][A
Epoch 4/10:  74%|███████▍  | 1635/2208 [01:32<00:33, 17.07it/s][A
Epoch 4/10:  74%|███████▍  | 1638/2208 [01:32<00:31, 18.09it/s][A
Epoch 4/10:  74%|███████▍  | 1641/2208 [01:32<00:29, 18.95it/s][A
Epoch 4/10:  74%|███████▍  | 1644/2208 [01:32<00:28, 19.62it/s][A
Epoch 4/10:  75%|███████▍  | 1647/2208 [01:32<00:27, 20.05it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  75%|███████▍  | 1653/2208 [01:33<00:44, 12.39it/s][A

Batch 1650: Training loss = 0.2372, Training accuracy = 0.9158, F1 = 0.9157



Epoch 4/10:  75%|███████▌  | 1656/2208 [01:33<00:38, 14.23it/s][A
Epoch 4/10:  75%|███████▌  | 1659/2208 [01:33<00:34, 15.76it/s][A
Epoch 4/10:  75%|███████▌  | 1662/2208 [01:33<00:31, 17.07it/s][A
Epoch 4/10:  75%|███████▌  | 1665/2208 [01:33<00:29, 18.13it/s][A
Epoch 4/10:  76%|███████▌  | 1668/2208 [01:34<00:28, 18.89it/s][A
Epoch 4/10:  76%|███████▌  | 1671/2208 [01:34<00:27, 19.50it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  76%|███████▌  | 1677/2208 [01:34<00:44, 11.91it/s][A
Epoch 4/10:  76%|███████▌  | 1680/2208 [01:34<00:38, 13.78it/s][A

Batch 1675: Training loss = 0.2240, Training accuracy = 0.9160, F1 = 0.9159



Epoch 4/10:  76%|███████▌  | 1683/2208 [01:35<00:33, 15.45it/s][A
Epoch 4/10:  76%|███████▋  | 1686/2208 [01:35<00:31, 16.82it/s][A
Epoch 4/10:  76%|███████▋  | 1689/2208 [01:35<00:28, 18.00it/s][A
Epoch 4/10:  77%|███████▋  | 1692/2208 [01:35<00:27, 18.86it/s][A
Epoch 4/10:  77%|███████▋  | 1695/2208 [01:35<00:26, 19.46it/s][A
Epoch 4/10:  77%|███████▋  | 1698/2208 [01:35<00:25, 19.80it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  77%|███████▋  | 1704/2208 [01:36<00:35, 14.09it/s][A

Batch 1700: Training loss = 0.3597, Training accuracy = 0.9161, F1 = 0.9159



Epoch 4/10:  77%|███████▋  | 1707/2208 [01:36<00:31, 15.70it/s][A
Epoch 4/10:  77%|███████▋  | 1710/2208 [01:36<00:29, 17.15it/s][A
Epoch 4/10:  78%|███████▊  | 1713/2208 [01:36<00:27, 18.18it/s][A
Epoch 4/10:  78%|███████▊  | 1716/2208 [01:36<00:25, 19.03it/s][A
Epoch 4/10:  78%|███████▊  | 1719/2208 [01:37<00:25, 19.55it/s][A
Epoch 4/10:  78%|███████▊  | 1722/2208 [01:37<00:24, 20.11it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  78%|███████▊  | 1728/2208 [01:37<00:39, 12.26it/s][A

Batch 1725: Training loss = 0.1387, Training accuracy = 0.9162, F1 = 0.9160



Epoch 4/10:  78%|███████▊  | 1731/2208 [01:38<00:33, 14.11it/s][A
Epoch 4/10:  79%|███████▊  | 1734/2208 [01:38<00:30, 15.62it/s][A
Epoch 4/10:  79%|███████▊  | 1737/2208 [01:38<00:27, 17.00it/s][A
Epoch 4/10:  79%|███████▉  | 1740/2208 [01:38<00:25, 18.17it/s][A
Epoch 4/10:  79%|███████▉  | 1743/2208 [01:38<00:24, 19.02it/s][A
Epoch 4/10:  79%|███████▉  | 1746/2208 [01:38<00:23, 19.66it/s][A
Epoch 4/10:  79%|███████▉  | 1749/2208 [01:38<00:25, 18.27it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  79%|███████▉  | 1754/2208 [01:39<00:36, 12.38it/s][A

Batch 1750: Training loss = 0.2845, Training accuracy = 0.9163, F1 = 0.9161



Epoch 4/10:  80%|███████▉  | 1757/2208 [01:39<00:31, 14.29it/s][A
Epoch 4/10:  80%|███████▉  | 1760/2208 [01:39<00:27, 16.01it/s][A
Epoch 4/10:  80%|███████▉  | 1763/2208 [01:39<00:25, 17.34it/s][A
Epoch 4/10:  80%|███████▉  | 1765/2208 [01:40<00:27, 16.36it/s][A
Epoch 4/10:  80%|████████  | 1768/2208 [01:40<00:24, 17.71it/s][A
Epoch 4/10:  80%|████████  | 1771/2208 [01:40<00:23, 18.72it/s][A
Epoch 4/10:  80%|████████  | 1773/2208 [01:40<00:24, 17.58it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  81%|████████  | 1779/2208 [01:41<00:33, 12.63it/s][A

Batch 1775: Training loss = 0.3890, Training accuracy = 0.9164, F1 = 0.9162



Epoch 4/10:  81%|████████  | 1782/2208 [01:41<00:29, 14.44it/s][A
Epoch 4/10:  81%|████████  | 1785/2208 [01:41<00:26, 16.12it/s][A
Epoch 4/10:  81%|████████  | 1788/2208 [01:41<00:24, 17.42it/s][A
Epoch 4/10:  81%|████████  | 1791/2208 [01:41<00:22, 18.23it/s][A
Epoch 4/10:  81%|████████  | 1793/2208 [01:41<00:25, 16.49it/s][A
Epoch 4/10:  81%|████████▏ | 1796/2208 [01:42<00:23, 17.78it/s][A
Epoch 4/10:  81%|████████▏ | 1799/2208 [01:42<00:21, 18.74it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  82%|████████▏ | 1804/2208 [01:42<00:32, 12.36it/s][A

Batch 1800: Training loss = 0.1967, Training accuracy = 0.9165, F1 = 0.9164



Epoch 4/10:  82%|████████▏ | 1807/2208 [01:42<00:28, 14.28it/s][A
Epoch 4/10:  82%|████████▏ | 1810/2208 [01:43<00:24, 15.93it/s][A
Epoch 4/10:  82%|████████▏ | 1813/2208 [01:43<00:22, 17.30it/s][A
Epoch 4/10:  82%|████████▏ | 1816/2208 [01:43<00:21, 18.27it/s][A
Epoch 4/10:  82%|████████▏ | 1819/2208 [01:43<00:20, 19.14it/s][A
Epoch 4/10:  83%|████████▎ | 1822/2208 [01:43<00:19, 19.71it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  83%|████████▎ | 1828/2208 [01:44<00:31, 12.03it/s][A

Batch 1825: Training loss = 0.1193, Training accuracy = 0.9165, F1 = 0.9164



Epoch 4/10:  83%|████████▎ | 1831/2208 [01:44<00:27, 13.93it/s][A
Epoch 4/10:  83%|████████▎ | 1834/2208 [01:44<00:23, 15.59it/s][A
Epoch 4/10:  83%|████████▎ | 1837/2208 [01:44<00:21, 16.97it/s][A
Epoch 4/10:  83%|████████▎ | 1840/2208 [01:44<00:20, 18.09it/s][A
Epoch 4/10:  83%|████████▎ | 1843/2208 [01:44<00:19, 19.03it/s][A
Epoch 4/10:  84%|████████▎ | 1846/2208 [01:45<00:18, 19.62it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  84%|████████▍ | 1852/2208 [01:45<00:31, 11.40it/s][A
Epoch 4/10:  84%|████████▍ | 1855/2208 [01:45<00:26, 13.31it/s][A

Batch 1850: Training loss = 0.1870, Training accuracy = 0.9167, F1 = 0.9165



Epoch 4/10:  84%|████████▍ | 1858/2208 [01:46<00:23, 15.03it/s][A
Epoch 4/10:  84%|████████▍ | 1861/2208 [01:46<00:21, 16.50it/s][A
Epoch 4/10:  84%|████████▍ | 1864/2208 [01:46<00:19, 17.72it/s][A
Epoch 4/10:  85%|████████▍ | 1867/2208 [01:46<00:18, 18.71it/s][A
Epoch 4/10:  85%|████████▍ | 1870/2208 [01:46<00:17, 19.48it/s][A
Epoch 4/10:  85%|████████▍ | 1873/2208 [01:46<00:16, 19.90it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  85%|████████▌ | 1879/2208 [01:47<00:24, 13.57it/s][A

Batch 1875: Training loss = 0.1953, Training accuracy = 0.9168, F1 = 0.9166



Epoch 4/10:  85%|████████▌ | 1882/2208 [01:47<00:21, 15.26it/s][A
Epoch 4/10:  85%|████████▌ | 1885/2208 [01:47<00:19, 16.62it/s][A
Epoch 4/10:  86%|████████▌ | 1888/2208 [01:47<00:17, 17.78it/s][A
Epoch 4/10:  86%|████████▌ | 1891/2208 [01:47<00:16, 18.71it/s][A
Epoch 4/10:  86%|████████▌ | 1894/2208 [01:48<00:16, 19.27it/s][A
Epoch 4/10:  86%|████████▌ | 1897/2208 [01:48<00:15, 19.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  86%|████████▌ | 1903/2208 [01:48<00:26, 11.73it/s][A

Batch 1900: Training loss = 0.2206, Training accuracy = 0.9169, F1 = 0.9167



Epoch 4/10:  86%|████████▋ | 1906/2208 [01:49<00:22, 13.59it/s][A
Epoch 4/10:  86%|████████▋ | 1909/2208 [01:49<00:19, 15.29it/s][A
Epoch 4/10:  87%|████████▋ | 1912/2208 [01:49<00:17, 16.76it/s][A
Epoch 4/10:  87%|████████▋ | 1915/2208 [01:49<00:16, 17.92it/s][A
Epoch 4/10:  87%|████████▋ | 1918/2208 [01:49<00:15, 18.70it/s][A
Epoch 4/10:  87%|████████▋ | 1921/2208 [01:49<00:14, 19.57it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  87%|████████▋ | 1927/2208 [01:50<00:23, 11.78it/s][A
Epoch 4/10:  87%|████████▋ | 1930/2208 [01:50<00:20, 13.67it/s][A

Batch 1925: Training loss = 0.2563, Training accuracy = 0.9171, F1 = 0.9169



Epoch 4/10:  88%|████████▊ | 1933/2208 [01:50<00:17, 15.36it/s][A
Epoch 4/10:  88%|████████▊ | 1936/2208 [01:50<00:16, 16.70it/s][A
Epoch 4/10:  88%|████████▊ | 1939/2208 [01:50<00:15, 17.88it/s][A
Epoch 4/10:  88%|████████▊ | 1942/2208 [01:51<00:14, 18.72it/s][A
Epoch 4/10:  88%|████████▊ | 1945/2208 [01:51<00:13, 19.45it/s][A
Epoch 4/10:  88%|████████▊ | 1948/2208 [01:51<00:13, 19.88it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  88%|████████▊ | 1954/2208 [01:52<00:19, 13.29it/s][A

Batch 1950: Training loss = 0.2885, Training accuracy = 0.9172, F1 = 0.9170



Epoch 4/10:  89%|████████▊ | 1957/2208 [01:52<00:16, 15.00it/s][A
Epoch 4/10:  89%|████████▉ | 1960/2208 [01:52<00:15, 16.46it/s][A
Epoch 4/10:  89%|████████▉ | 1963/2208 [01:52<00:13, 17.53it/s][A
Epoch 4/10:  89%|████████▉ | 1966/2208 [01:52<00:13, 18.46it/s][A
Epoch 4/10:  89%|████████▉ | 1969/2208 [01:52<00:12, 19.23it/s][A
Epoch 4/10:  89%|████████▉ | 1972/2208 [01:52<00:13, 17.63it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  90%|████████▉ | 1977/2208 [01:53<00:22, 10.23it/s][A
Epoch 4/10:  90%|████████▉ | 1980/2208 [01:53<00:18, 12.34it/s][A

Batch 1975: Training loss = 0.3247, Training accuracy = 0.9173, F1 = 0.9172



Epoch 4/10:  90%|████████▉ | 1983/2208 [01:53<00:15, 14.26it/s][A
Epoch 4/10:  90%|████████▉ | 1986/2208 [01:54<00:13, 15.95it/s][A
Epoch 4/10:  90%|█████████ | 1989/2208 [01:54<00:13, 16.33it/s][A
Epoch 4/10:  90%|█████████ | 1991/2208 [01:54<00:13, 16.27it/s][A
Epoch 4/10:  90%|█████████ | 1994/2208 [01:54<00:12, 17.61it/s][A
Epoch 4/10:  90%|█████████ | 1997/2208 [01:54<00:11, 18.65it/s][A
Epoch 4/10:  91%|█████████ | 1999/2208 [01:54<00:11, 18.29it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  91%|█████████ | 2004/2208 [01:55<00:18, 11.32it/s][A

Batch 2000: Training loss = 0.1860, Training accuracy = 0.9174, F1 = 0.9173



Epoch 4/10:  91%|█████████ | 2007/2208 [01:55<00:14, 13.40it/s][A
Epoch 4/10:  91%|█████████ | 2010/2208 [01:55<00:13, 15.15it/s][A
Epoch 4/10:  91%|█████████ | 2013/2208 [01:55<00:11, 16.56it/s][A
Epoch 4/10:  91%|█████████▏| 2016/2208 [01:55<00:10, 17.62it/s][A
Epoch 4/10:  91%|█████████▏| 2019/2208 [01:56<00:10, 18.53it/s][A
Epoch 4/10:  92%|█████████▏| 2022/2208 [01:56<00:09, 19.29it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  92%|█████████▏| 2028/2208 [01:56<00:16, 10.98it/s][A

Batch 2025: Training loss = 0.4633, Training accuracy = 0.9176, F1 = 0.9174



Epoch 4/10:  92%|█████████▏| 2031/2208 [01:57<00:13, 12.87it/s][A
Epoch 4/10:  92%|█████████▏| 2034/2208 [01:57<00:11, 14.64it/s][A
Epoch 4/10:  92%|█████████▏| 2037/2208 [01:57<00:10, 16.16it/s][A
Epoch 4/10:  92%|█████████▏| 2040/2208 [01:57<00:09, 17.38it/s][A
Epoch 4/10:  93%|█████████▎| 2043/2208 [01:57<00:08, 18.47it/s][A
Epoch 4/10:  93%|█████████▎| 2046/2208 [01:57<00:08, 19.16it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  93%|█████████▎| 2052/2208 [01:58<00:14, 11.06it/s][A
Epoch 4/10:  93%|█████████▎| 2055/2208 [01:58<00:11, 12.98it/s][A

Batch 2050: Training loss = 0.2405, Training accuracy = 0.9177, F1 = 0.9175



Epoch 4/10:  93%|█████████▎| 2058/2208 [01:58<00:10, 14.67it/s][A
Epoch 4/10:  93%|█████████▎| 2061/2208 [01:58<00:09, 16.22it/s][A
Epoch 4/10:  93%|█████████▎| 2064/2208 [01:59<00:08, 17.46it/s][A
Epoch 4/10:  94%|█████████▎| 2067/2208 [01:59<00:07, 18.54it/s][A
Epoch 4/10:  94%|█████████▍| 2070/2208 [01:59<00:07, 19.29it/s][A
Epoch 4/10:  94%|█████████▍| 2073/2208 [01:59<00:06, 19.85it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  94%|█████████▍| 2079/2208 [02:00<00:10, 12.84it/s][A

Batch 2075: Training loss = 0.1349, Training accuracy = 0.9178, F1 = 0.9176



Epoch 4/10:  94%|█████████▍| 2082/2208 [02:00<00:08, 14.53it/s][A
Epoch 4/10:  94%|█████████▍| 2085/2208 [02:00<00:07, 16.06it/s][A
Epoch 4/10:  95%|█████████▍| 2088/2208 [02:00<00:06, 17.32it/s][A
Epoch 4/10:  95%|█████████▍| 2091/2208 [02:00<00:06, 18.31it/s][A
Epoch 4/10:  95%|█████████▍| 2094/2208 [02:00<00:05, 19.11it/s][A
Epoch 4/10:  95%|█████████▍| 2097/2208 [02:01<00:05, 19.61it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  95%|█████████▌| 2103/2208 [02:01<00:09, 11.25it/s][A

Batch 2100: Training loss = 0.1933, Training accuracy = 0.9179, F1 = 0.9177



Epoch 4/10:  95%|█████████▌| 2106/2208 [02:01<00:07, 13.16it/s][A
Epoch 4/10:  96%|█████████▌| 2109/2208 [02:01<00:06, 14.90it/s][A
Epoch 4/10:  96%|█████████▌| 2112/2208 [02:02<00:05, 16.39it/s][A
Epoch 4/10:  96%|█████████▌| 2115/2208 [02:02<00:05, 17.68it/s][A
Epoch 4/10:  96%|█████████▌| 2118/2208 [02:02<00:04, 18.67it/s][A
Epoch 4/10:  96%|█████████▌| 2121/2208 [02:02<00:04, 19.29it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  96%|█████████▋| 2127/2208 [02:03<00:07, 11.09it/s][A
Epoch 4/10:  96%|█████████▋| 2130/2208 [02:03<00:05, 13.00it/s][A

Batch 2125: Training loss = 0.2544, Training accuracy = 0.9179, F1 = 0.9177



Epoch 4/10:  97%|█████████▋| 2133/2208 [02:03<00:05, 14.69it/s][A
Epoch 4/10:  97%|█████████▋| 2136/2208 [02:03<00:04, 16.22it/s][A
Epoch 4/10:  97%|█████████▋| 2139/2208 [02:03<00:03, 17.45it/s][A
Epoch 4/10:  97%|█████████▋| 2142/2208 [02:03<00:03, 18.44it/s][A
Epoch 4/10:  97%|█████████▋| 2145/2208 [02:04<00:03, 19.06it/s][A
Epoch 4/10:  97%|█████████▋| 2148/2208 [02:04<00:03, 19.63it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  98%|█████████▊| 2154/2208 [02:04<00:04, 13.07it/s][A

Batch 2150: Training loss = 0.1808, Training accuracy = 0.9180, F1 = 0.9178



Epoch 4/10:  98%|█████████▊| 2157/2208 [02:05<00:03, 14.85it/s][A
Epoch 4/10:  98%|█████████▊| 2160/2208 [02:05<00:02, 16.38it/s][A
Epoch 4/10:  98%|█████████▊| 2163/2208 [02:05<00:02, 17.58it/s][A
Epoch 4/10:  98%|█████████▊| 2166/2208 [02:05<00:02, 18.56it/s][A
Epoch 4/10:  98%|█████████▊| 2169/2208 [02:05<00:02, 19.31it/s][A
Epoch 4/10:  98%|█████████▊| 2172/2208 [02:05<00:01, 19.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10:  99%|█████████▊| 2178/2208 [02:06<00:03,  9.90it/s][A

Batch 2175: Training loss = 0.3206, Training accuracy = 0.9181, F1 = 0.9179



Epoch 4/10:  99%|█████████▉| 2181/2208 [02:06<00:02, 11.83it/s][A
Epoch 4/10:  99%|█████████▉| 2184/2208 [02:06<00:01, 13.56it/s][A
Epoch 4/10:  99%|█████████▉| 2187/2208 [02:06<00:01, 15.17it/s][A
Epoch 4/10:  99%|█████████▉| 2190/2208 [02:07<00:01, 16.63it/s][A
Epoch 4/10:  99%|█████████▉| 2193/2208 [02:07<00:00, 17.70it/s][A
Epoch 4/10:  99%|█████████▉| 2196/2208 [02:07<00:00, 18.30it/s][A
Epoch 4/10: 100%|█████████▉| 2199/2208 [02:07<00:00, 18.65it/s][A
  with torch.cuda.amp.autocast():

Epoch 4/10: 100%|█████████▉| 2204/2208 [02:08<00:00, 12.06it/s][A

Batch 2200: Training loss = 0.2224, Training accuracy = 0.9182, F1 = 0.9181



Epoch 4/10: 100%|█████████▉| 2207/2208 [02:08<00:00, 14.09it/s][A
                                                               [A


Epoch 4 Training Metrics:
Loss: 0.2449
Accuracy: 0.9182
F1 Score: 0.9181
Precision: 0.9180
Recall: 0.9182

Starting validation...



Validation:   0%|          | 0/552 [00:00<?, ?it/s][A
Validation:   0%|          | 1/552 [00:01<14:37,  1.59s/it][A
Validation:   1%|          | 3/552 [00:01<04:10,  2.19it/s][A
Validation:   1%|          | 5/552 [00:01<02:22,  3.83it/s][A
Validation:   1%|▏         | 7/552 [00:01<01:34,  5.74it/s][A
Validation:   2%|▏         | 9/552 [00:02<01:09,  7.76it/s][A
Validation:   2%|▏         | 11/552 [00:02<00:55,  9.80it/s][A
Validation:   2%|▏         | 13/552 [00:02<00:46, 11.65it/s][A
Validation:   3%|▎         | 15/552 [00:02<00:40, 13.34it/s][A
Validation:   3%|▎         | 17/552 [00:02<00:36, 14.75it/s][A
Validation:   3%|▎         | 19/552 [00:02<00:33, 15.86it/s][A
Validation:   4%|▍         | 21/552 [00:02<00:31, 16.74it/s][A
Validation:   4%|▍         | 23/552 [00:02<00:30, 17.42it/s][A
Validation:   5%|▍         | 25/552 [00:02<00:29, 17.82it/s][A
Validation:   5%|▍         | 27/552 [00:03<00:28, 18.21it/s][A
Validation:   5%|▌         | 29/552 [00:03<00:28, 18.


Epoch 4 Validation Metrics:
Loss: 0.1971
Accuracy: 0.9355
F1 Score: 0.9351
Precision: 0.9388
Recall: 0.9355


Training epochs:  40%|████      | 4/10 [10:43<16:06, 161.15s/it]


Starting epoch 5/10



  with torch.cuda.amp.autocast():

  with torch.cuda.amp.autocast():

Epoch 5/10:   0%|          | 2/2208 [00:01<27:35,  1.33it/s]  [A

Batch 0: Training loss = 0.2117, Training accuracy = 0.9375, F1 = 0.9401



Epoch 5/10:   0%|          | 5/2208 [00:01<09:04,  4.04it/s][A
Epoch 5/10:   0%|          | 8/2208 [00:02<05:21,  6.85it/s][A
Epoch 5/10:   0%|          | 11/2208 [00:02<03:49,  9.58it/s][A
Epoch 5/10:   1%|          | 14/2208 [00:02<03:04, 11.88it/s][A
Epoch 5/10:   1%|          | 17/2208 [00:02<02:35, 14.06it/s][A
Epoch 5/10:   1%|          | 19/2208 [00:02<02:25, 15.08it/s][A
Epoch 5/10:   1%|          | 22/2208 [00:02<02:11, 16.62it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:   1%|▏         | 28/2208 [00:03<02:00, 18.11it/s][A
Epoch 5/10:   1%|▏         | 30/2208 [00:03<01:59, 18.24it/s]

Batch 25: Training loss = 0.2447, Training accuracy = 0.9294, F1 = 0.9288


[A
Epoch 5/10:   1%|▏         | 33/2208 [00:03<01:53, 19.21it/s][A
Epoch 5/10:   2%|▏         | 36/2208 [00:03<01:53, 19.17it/s][A
Epoch 5/10:   2%|▏         | 38/2208 [00:03<01:56, 18.70it/s][A
Epoch 5/10:   2%|▏         | 41/2208 [00:03<01:51, 19.47it/s][A
Epoch 5/10:   2%|▏         | 43/2208 [00:03<01:57, 18.40it/s][A
Epoch 5/10:   2%|▏         | 46/2208 [00:03<01:54, 18.89it/s][A
Epoch 5/10:   2%|▏         | 49/2208 [00:04<01:49, 19.65it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:   2%|▏         | 54/2208 [00:04<01:58, 18.18it/s][A

Batch 50: Training loss = 0.1847, Training accuracy = 0.9294, F1 = 0.9289



Epoch 5/10:   3%|▎         | 57/2208 [00:04<01:52, 19.12it/s][A
Epoch 5/10:   3%|▎         | 60/2208 [00:04<01:49, 19.59it/s][A
Epoch 5/10:   3%|▎         | 63/2208 [00:04<01:46, 20.07it/s][A
Epoch 5/10:   3%|▎         | 66/2208 [00:05<01:47, 19.97it/s][A
Epoch 5/10:   3%|▎         | 69/2208 [00:05<01:45, 20.22it/s][A
Epoch 5/10:   3%|▎         | 72/2208 [00:05<01:43, 20.56it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:   3%|▎         | 77/2208 [00:05<01:53, 18.81it/s][A
Epoch 5/10:   4%|▎         | 80/2208 [00:05<01:48, 19.62it/s][A

Batch 75: Training loss = 0.2916, Training accuracy = 0.9264, F1 = 0.9261



Epoch 5/10:   4%|▍         | 83/2208 [00:05<01:45, 20.10it/s][A
Epoch 5/10:   4%|▍         | 86/2208 [00:06<01:43, 20.52it/s][A
Epoch 5/10:   4%|▍         | 89/2208 [00:06<01:41, 20.78it/s][A
Epoch 5/10:   4%|▍         | 92/2208 [00:06<01:54, 18.47it/s][A
Epoch 5/10:   4%|▍         | 94/2208 [00:06<02:01, 17.33it/s][A
Epoch 5/10:   4%|▍         | 97/2208 [00:06<01:54, 18.46it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:   5%|▍         | 102/2208 [00:06<01:52, 18.73it/s][A
Epoch 5/10:   5%|▍         | 105/2208 [00:07<01:47, 19.54it/s][A

Batch 100: Training loss = 0.1888, Training accuracy = 0.9271, F1 = 0.9270



Epoch 5/10:   5%|▍         | 108/2208 [00:07<01:44, 20.06it/s][A
Epoch 5/10:   5%|▌         | 111/2208 [00:07<01:42, 20.39it/s][A
Epoch 5/10:   5%|▌         | 114/2208 [00:07<01:41, 20.67it/s][A
Epoch 5/10:   5%|▌         | 117/2208 [00:07<01:40, 20.88it/s][A
Epoch 5/10:   5%|▌         | 120/2208 [00:07<01:41, 20.60it/s][A
Epoch 5/10:   6%|▌         | 123/2208 [00:07<01:40, 20.70it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:   6%|▌         | 128/2208 [00:08<02:05, 16.54it/s][A

Batch 125: Training loss = 0.1989, Training accuracy = 0.9287, F1 = 0.9285



Epoch 5/10:   6%|▌         | 131/2208 [00:08<01:57, 17.73it/s][A
Epoch 5/10:   6%|▌         | 134/2208 [00:08<01:50, 18.70it/s][A
Epoch 5/10:   6%|▌         | 137/2208 [00:08<01:47, 19.28it/s][A
Epoch 5/10:   6%|▋         | 139/2208 [00:08<01:46, 19.34it/s][A
Epoch 5/10:   6%|▋         | 142/2208 [00:08<01:44, 19.74it/s][A
Epoch 5/10:   7%|▋         | 144/2208 [00:09<01:44, 19.67it/s][A
Epoch 5/10:   7%|▋         | 147/2208 [00:09<01:54, 18.05it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:   7%|▋         | 152/2208 [00:09<01:53, 18.10it/s][A
Epoch 5/10:   7%|▋         | 155/2208 [00:09<01:47, 19.03it/s][A

Batch 150: Training loss = 0.1235, Training accuracy = 0.9298, F1 = 0.9296



Epoch 5/10:   7%|▋         | 157/2208 [00:09<01:46, 19.20it/s][A
Epoch 5/10:   7%|▋         | 160/2208 [00:09<01:45, 19.47it/s][A
Epoch 5/10:   7%|▋         | 163/2208 [00:10<01:42, 19.92it/s][A
Epoch 5/10:   8%|▊         | 166/2208 [00:10<01:41, 20.20it/s][A
Epoch 5/10:   8%|▊         | 169/2208 [00:10<01:53, 18.03it/s][A
Epoch 5/10:   8%|▊         | 172/2208 [00:10<02:01, 16.71it/s][A
Epoch 5/10:   8%|▊         | 174/2208 [00:10<01:59, 17.06it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:   8%|▊         | 179/2208 [00:11<01:58, 17.08it/s][A

Batch 175: Training loss = 0.2485, Training accuracy = 0.9293, F1 = 0.9291



Epoch 5/10:   8%|▊         | 181/2208 [00:11<01:54, 17.66it/s][A
Epoch 5/10:   8%|▊         | 184/2208 [00:11<01:58, 17.02it/s][A
Epoch 5/10:   8%|▊         | 187/2208 [00:11<01:50, 18.25it/s][A
Epoch 5/10:   9%|▊         | 189/2208 [00:11<01:52, 17.94it/s][A
Epoch 5/10:   9%|▊         | 192/2208 [00:11<01:46, 18.97it/s][A
Epoch 5/10:   9%|▉         | 195/2208 [00:11<01:42, 19.69it/s][A
Epoch 5/10:   9%|▉         | 197/2208 [00:11<01:52, 17.86it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:   9%|▉         | 202/2208 [00:12<02:04, 16.10it/s][A
Epoch 5/10:   9%|▉         | 204/2208 [00:12<02:01, 16.54it/s][A

Batch 200: Training loss = 0.2406, Training accuracy = 0.9294, F1 = 0.9292



Epoch 5/10:   9%|▉         | 207/2208 [00:12<01:51, 17.94it/s][A
Epoch 5/10:   9%|▉         | 209/2208 [00:12<02:03, 16.20it/s][A
Epoch 5/10:  10%|▉         | 212/2208 [00:12<01:54, 17.49it/s][A
Epoch 5/10:  10%|▉         | 215/2208 [00:13<01:47, 18.56it/s][A
Epoch 5/10:  10%|▉         | 217/2208 [00:13<01:56, 17.08it/s][A
Epoch 5/10:  10%|▉         | 220/2208 [00:13<01:48, 18.25it/s][A
Epoch 5/10:  10%|█         | 223/2208 [00:13<01:44, 18.99it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  10%|█         | 227/2208 [00:13<02:02, 16.15it/s][A
Epoch 5/10:  10%|█         | 229/2208 [00:13<02:01, 16.33it/s][A

Batch 225: Training loss = 0.2024, Training accuracy = 0.9294, F1 = 0.9293



Epoch 5/10:  11%|█         | 232/2208 [00:14<01:51, 17.79it/s][A
Epoch 5/10:  11%|█         | 235/2208 [00:14<01:44, 18.92it/s][A
Epoch 5/10:  11%|█         | 238/2208 [00:14<01:40, 19.58it/s][A
Epoch 5/10:  11%|█         | 241/2208 [00:14<01:38, 20.00it/s][A
Epoch 5/10:  11%|█         | 244/2208 [00:14<01:36, 20.29it/s][A
Epoch 5/10:  11%|█         | 247/2208 [00:14<01:38, 19.84it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  11%|█▏        | 253/2208 [00:15<01:56, 16.73it/s][A

Batch 250: Training loss = 0.3384, Training accuracy = 0.9290, F1 = 0.9290



Epoch 5/10:  12%|█▏        | 256/2208 [00:15<01:48, 17.94it/s][A
Epoch 5/10:  12%|█▏        | 258/2208 [00:15<01:46, 18.36it/s][A
Epoch 5/10:  12%|█▏        | 261/2208 [00:15<01:41, 19.22it/s][A
Epoch 5/10:  12%|█▏        | 264/2208 [00:15<01:38, 19.73it/s][A
Epoch 5/10:  12%|█▏        | 267/2208 [00:15<01:35, 20.25it/s][A
Epoch 5/10:  12%|█▏        | 270/2208 [00:15<01:34, 20.59it/s][A
Epoch 5/10:  12%|█▏        | 273/2208 [00:16<01:32, 20.91it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  13%|█▎        | 279/2208 [00:16<01:39, 19.46it/s][A

Batch 275: Training loss = 0.1751, Training accuracy = 0.9293, F1 = 0.9293



Epoch 5/10:  13%|█▎        | 282/2208 [00:16<01:36, 19.89it/s][A
Epoch 5/10:  13%|█▎        | 285/2208 [00:16<01:35, 20.24it/s][A
Epoch 5/10:  13%|█▎        | 288/2208 [00:16<01:33, 20.58it/s][A
Epoch 5/10:  13%|█▎        | 291/2208 [00:16<01:32, 20.78it/s][A
Epoch 5/10:  13%|█▎        | 294/2208 [00:17<01:38, 19.44it/s][A
Epoch 5/10:  13%|█▎        | 297/2208 [00:17<01:35, 19.94it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  14%|█▎        | 303/2208 [00:17<01:45, 18.01it/s][A

Batch 300: Training loss = 0.2379, Training accuracy = 0.9295, F1 = 0.9294



Epoch 5/10:  14%|█▍        | 306/2208 [00:17<01:40, 18.86it/s][A
Epoch 5/10:  14%|█▍        | 309/2208 [00:17<01:37, 19.39it/s][A
Epoch 5/10:  14%|█▍        | 312/2208 [00:18<01:35, 19.88it/s][A
Epoch 5/10:  14%|█▍        | 315/2208 [00:18<01:33, 20.30it/s][A
Epoch 5/10:  14%|█▍        | 318/2208 [00:18<01:32, 20.45it/s][A
Epoch 5/10:  15%|█▍        | 321/2208 [00:18<01:31, 20.66it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  15%|█▍        | 327/2208 [00:18<01:46, 17.69it/s][A
Epoch 5/10:  15%|█▍        | 330/2208 [00:19<01:40, 18.64it/s][A

Batch 325: Training loss = 0.2119, Training accuracy = 0.9292, F1 = 0.9291



Epoch 5/10:  15%|█▌        | 333/2208 [00:19<01:36, 19.50it/s][A
Epoch 5/10:  15%|█▌        | 336/2208 [00:19<01:33, 20.03it/s][A
Epoch 5/10:  15%|█▌        | 339/2208 [00:19<01:32, 20.29it/s][A
Epoch 5/10:  15%|█▌        | 342/2208 [00:19<01:32, 20.09it/s][A
Epoch 5/10:  16%|█▌        | 345/2208 [00:19<01:31, 20.30it/s][A
Epoch 5/10:  16%|█▌        | 348/2208 [00:19<01:30, 20.59it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  16%|█▌        | 354/2208 [00:20<01:40, 18.49it/s][A

Batch 350: Training loss = 0.3101, Training accuracy = 0.9292, F1 = 0.9292



Epoch 5/10:  16%|█▌        | 357/2208 [00:20<01:35, 19.32it/s][A
Epoch 5/10:  16%|█▋        | 360/2208 [00:20<01:32, 19.89it/s][A
Epoch 5/10:  16%|█▋        | 363/2208 [00:20<01:31, 20.15it/s][A
Epoch 5/10:  17%|█▋        | 366/2208 [00:20<01:30, 20.43it/s][A
Epoch 5/10:  17%|█▋        | 369/2208 [00:20<01:28, 20.68it/s][A
Epoch 5/10:  17%|█▋        | 372/2208 [00:21<01:28, 20.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  17%|█▋        | 378/2208 [00:21<01:40, 18.20it/s][A

Batch 375: Training loss = 0.2757, Training accuracy = 0.9289, F1 = 0.9288



Epoch 5/10:  17%|█▋        | 381/2208 [00:21<01:35, 19.12it/s][A
Epoch 5/10:  17%|█▋        | 384/2208 [00:21<01:32, 19.72it/s][A
Epoch 5/10:  18%|█▊        | 387/2208 [00:21<01:30, 20.02it/s][A
Epoch 5/10:  18%|█▊        | 390/2208 [00:22<01:28, 20.47it/s][A
Epoch 5/10:  18%|█▊        | 393/2208 [00:22<01:27, 20.65it/s][A
Epoch 5/10:  18%|█▊        | 396/2208 [00:22<01:27, 20.61it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  18%|█▊        | 402/2208 [00:22<01:50, 16.30it/s][A
Epoch 5/10:  18%|█▊        | 405/2208 [00:22<01:43, 17.36it/s][A

Batch 400: Training loss = 0.2802, Training accuracy = 0.9290, F1 = 0.9289



Epoch 5/10:  18%|█▊        | 408/2208 [00:23<01:38, 18.26it/s][A
Epoch 5/10:  19%|█▊        | 410/2208 [00:23<01:52, 15.95it/s][A
Epoch 5/10:  19%|█▊        | 413/2208 [00:23<01:44, 17.24it/s][A
Epoch 5/10:  19%|█▉        | 415/2208 [00:23<01:45, 16.95it/s][A
Epoch 5/10:  19%|█▉        | 418/2208 [00:23<01:53, 15.74it/s][A
Epoch 5/10:  19%|█▉        | 421/2208 [00:23<01:43, 17.18it/s][A
Epoch 5/10:  19%|█▉        | 424/2208 [00:23<01:38, 18.19it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  19%|█▉        | 429/2208 [00:24<01:49, 16.25it/s][A

Batch 425: Training loss = 0.2385, Training accuracy = 0.9292, F1 = 0.9291



Epoch 5/10:  20%|█▉        | 432/2208 [00:24<01:40, 17.59it/s][A
Epoch 5/10:  20%|█▉        | 435/2208 [00:24<01:35, 18.65it/s][A
Epoch 5/10:  20%|█▉        | 438/2208 [00:24<01:31, 19.31it/s][A
Epoch 5/10:  20%|█▉        | 441/2208 [00:24<01:29, 19.83it/s][A
Epoch 5/10:  20%|██        | 444/2208 [00:25<01:27, 20.09it/s][A
Epoch 5/10:  20%|██        | 447/2208 [00:25<01:29, 19.58it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  20%|██        | 452/2208 [00:25<01:53, 15.46it/s][A
Epoch 5/10:  21%|██        | 455/2208 [00:25<01:43, 16.97it/s][A

Batch 450: Training loss = 0.2934, Training accuracy = 0.9286, F1 = 0.9285



Epoch 5/10:  21%|██        | 458/2208 [00:25<01:36, 18.14it/s][A
Epoch 5/10:  21%|██        | 461/2208 [00:26<01:31, 19.00it/s][A
Epoch 5/10:  21%|██        | 464/2208 [00:26<01:39, 17.61it/s][A
Epoch 5/10:  21%|██        | 466/2208 [00:26<01:36, 17.97it/s][A
Epoch 5/10:  21%|██        | 468/2208 [00:26<01:55, 15.08it/s][A
Epoch 5/10:  21%|██▏       | 471/2208 [00:26<01:43, 16.79it/s][A
Epoch 5/10:  21%|██▏       | 473/2208 [00:26<01:42, 16.97it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  22%|██▏       | 479/2208 [00:27<01:47, 16.10it/s][A

Batch 475: Training loss = 0.2549, Training accuracy = 0.9282, F1 = 0.9280



Epoch 5/10:  22%|██▏       | 482/2208 [00:27<01:38, 17.55it/s][A
Epoch 5/10:  22%|██▏       | 485/2208 [00:27<01:32, 18.60it/s][A
Epoch 5/10:  22%|██▏       | 488/2208 [00:27<01:28, 19.43it/s][A
Epoch 5/10:  22%|██▏       | 491/2208 [00:27<01:26, 19.93it/s][A
Epoch 5/10:  22%|██▏       | 494/2208 [00:27<01:24, 20.40it/s][A
Epoch 5/10:  23%|██▎       | 497/2208 [00:28<01:23, 20.56it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  23%|██▎       | 503/2208 [00:28<01:36, 17.67it/s][A

Batch 500: Training loss = 0.2787, Training accuracy = 0.9278, F1 = 0.9277



Epoch 5/10:  23%|██▎       | 506/2208 [00:28<01:31, 18.69it/s][A
Epoch 5/10:  23%|██▎       | 509/2208 [00:28<01:27, 19.33it/s][A
Epoch 5/10:  23%|██▎       | 512/2208 [00:28<01:25, 19.80it/s][A
Epoch 5/10:  23%|██▎       | 515/2208 [00:28<01:23, 20.26it/s][A
Epoch 5/10:  23%|██▎       | 518/2208 [00:29<01:21, 20.65it/s][A
Epoch 5/10:  24%|██▎       | 521/2208 [00:29<01:21, 20.70it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  24%|██▍       | 527/2208 [00:29<01:40, 16.74it/s][A
Epoch 5/10:  24%|██▍       | 530/2208 [00:29<01:33, 17.90it/s][A

Batch 525: Training loss = 0.0965, Training accuracy = 0.9280, F1 = 0.9279



Epoch 5/10:  24%|██▍       | 533/2208 [00:29<01:29, 18.73it/s][A
Epoch 5/10:  24%|██▍       | 536/2208 [00:30<01:25, 19.46it/s][A
Epoch 5/10:  24%|██▍       | 539/2208 [00:30<01:23, 19.90it/s][A
Epoch 5/10:  25%|██▍       | 542/2208 [00:30<01:22, 20.27it/s][A
Epoch 5/10:  25%|██▍       | 545/2208 [00:30<01:20, 20.58it/s][A
Epoch 5/10:  25%|██▍       | 548/2208 [00:30<01:19, 20.77it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  25%|██▌       | 554/2208 [00:31<01:32, 17.92it/s][A

Batch 550: Training loss = 0.1902, Training accuracy = 0.9281, F1 = 0.9280



Epoch 5/10:  25%|██▌       | 557/2208 [00:31<01:27, 18.82it/s][A
Epoch 5/10:  25%|██▌       | 560/2208 [00:31<01:24, 19.47it/s][A
Epoch 5/10:  25%|██▌       | 563/2208 [00:31<01:22, 19.82it/s][A
Epoch 5/10:  26%|██▌       | 566/2208 [00:31<01:20, 20.30it/s][A
Epoch 5/10:  26%|██▌       | 569/2208 [00:31<01:19, 20.59it/s][A
Epoch 5/10:  26%|██▌       | 572/2208 [00:31<01:18, 20.80it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  26%|██▌       | 578/2208 [00:32<01:35, 17.16it/s][A

Batch 575: Training loss = 0.2203, Training accuracy = 0.9282, F1 = 0.9281



Epoch 5/10:  26%|██▋       | 581/2208 [00:32<01:28, 18.31it/s][A
Epoch 5/10:  26%|██▋       | 584/2208 [00:32<01:25, 19.09it/s][A
Epoch 5/10:  27%|██▋       | 587/2208 [00:32<01:22, 19.76it/s][A
Epoch 5/10:  27%|██▋       | 590/2208 [00:32<01:20, 20.20it/s][A
Epoch 5/10:  27%|██▋       | 593/2208 [00:32<01:19, 20.39it/s][A
Epoch 5/10:  27%|██▋       | 596/2208 [00:33<01:17, 20.68it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  27%|██▋       | 602/2208 [00:33<01:34, 17.06it/s][A
Epoch 5/10:  27%|██▋       | 605/2208 [00:33<01:28, 18.15it/s][A

Batch 600: Training loss = 0.2661, Training accuracy = 0.9283, F1 = 0.9282



Epoch 5/10:  28%|██▊       | 608/2208 [00:33<01:24, 18.95it/s][A
Epoch 5/10:  28%|██▊       | 611/2208 [00:33<01:21, 19.70it/s][A
Epoch 5/10:  28%|██▊       | 614/2208 [00:34<01:19, 20.05it/s][A
Epoch 5/10:  28%|██▊       | 617/2208 [00:34<01:18, 20.40it/s][A
Epoch 5/10:  28%|██▊       | 620/2208 [00:34<01:16, 20.63it/s][A
Epoch 5/10:  28%|██▊       | 623/2208 [00:34<01:16, 20.71it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  28%|██▊       | 629/2208 [00:34<01:29, 17.69it/s][A

Batch 625: Training loss = 0.1723, Training accuracy = 0.9280, F1 = 0.9279



Epoch 5/10:  29%|██▊       | 632/2208 [00:35<01:24, 18.69it/s][A
Epoch 5/10:  29%|██▉       | 635/2208 [00:35<01:21, 19.38it/s][A
Epoch 5/10:  29%|██▉       | 638/2208 [00:35<01:18, 19.89it/s][A
Epoch 5/10:  29%|██▉       | 641/2208 [00:35<01:17, 20.26it/s][A
Epoch 5/10:  29%|██▉       | 644/2208 [00:35<01:16, 20.57it/s][A
Epoch 5/10:  29%|██▉       | 647/2208 [00:35<01:15, 20.64it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  30%|██▉       | 653/2208 [00:36<01:33, 16.63it/s][A

Batch 650: Training loss = 0.2691, Training accuracy = 0.9280, F1 = 0.9279



Epoch 5/10:  30%|██▉       | 656/2208 [00:36<01:27, 17.76it/s][A
Epoch 5/10:  30%|██▉       | 659/2208 [00:36<01:22, 18.70it/s][A
Epoch 5/10:  30%|██▉       | 662/2208 [00:36<01:19, 19.35it/s][A
Epoch 5/10:  30%|███       | 665/2208 [00:36<01:18, 19.63it/s][A
Epoch 5/10:  30%|███       | 668/2208 [00:36<01:17, 19.91it/s][A
Epoch 5/10:  30%|███       | 671/2208 [00:37<01:16, 20.14it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  31%|███       | 677/2208 [00:37<01:31, 16.78it/s][A
Epoch 5/10:  31%|███       | 680/2208 [00:37<01:25, 17.97it/s][A

Batch 675: Training loss = 0.1999, Training accuracy = 0.9283, F1 = 0.9282



Epoch 5/10:  31%|███       | 683/2208 [00:37<01:20, 18.88it/s][A
Epoch 5/10:  31%|███       | 686/2208 [00:37<01:17, 19.55it/s][A
Epoch 5/10:  31%|███       | 689/2208 [00:38<01:31, 16.69it/s][A
Epoch 5/10:  31%|███▏      | 691/2208 [00:38<01:31, 16.52it/s][A
Epoch 5/10:  31%|███▏      | 693/2208 [00:38<01:30, 16.82it/s][A
Epoch 5/10:  31%|███▏      | 695/2208 [00:38<01:28, 17.10it/s][A
Epoch 5/10:  32%|███▏      | 698/2208 [00:38<01:22, 18.39it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  32%|███▏      | 702/2208 [00:38<01:55, 12.99it/s][A
Epoch 5/10:  32%|███▏      | 705/2208 [00:39<01:39, 15.10it/s][A

Batch 700: Training loss = 0.1822, Training accuracy = 0.9285, F1 = 0.9284



Epoch 5/10:  32%|███▏      | 708/2208 [00:39<01:29, 16.83it/s][A
Epoch 5/10:  32%|███▏      | 711/2208 [00:39<01:23, 17.94it/s][A
Epoch 5/10:  32%|███▏      | 714/2208 [00:39<01:19, 18.75it/s][A
Epoch 5/10:  32%|███▏      | 716/2208 [00:39<01:18, 18.97it/s][A
Epoch 5/10:  33%|███▎      | 719/2208 [00:39<01:16, 19.54it/s][A
Epoch 5/10:  33%|███▎      | 722/2208 [00:39<01:14, 20.06it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  33%|███▎      | 727/2208 [00:40<01:47, 13.76it/s][A
Epoch 5/10:  33%|███▎      | 730/2208 [00:40<01:34, 15.61it/s][A

Batch 725: Training loss = 0.1491, Training accuracy = 0.9287, F1 = 0.9286



Epoch 5/10:  33%|███▎      | 733/2208 [00:40<01:26, 17.08it/s][A
Epoch 5/10:  33%|███▎      | 736/2208 [00:40<01:20, 18.19it/s][A
Epoch 5/10:  33%|███▎      | 739/2208 [00:40<01:25, 17.18it/s][A
Epoch 5/10:  34%|███▎      | 742/2208 [00:41<01:21, 18.10it/s][A
Epoch 5/10:  34%|███▎      | 744/2208 [00:41<01:19, 18.45it/s][A
Epoch 5/10:  34%|███▍      | 747/2208 [00:41<01:17, 18.89it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  34%|███▍      | 752/2208 [00:41<01:47, 13.56it/s][A
Epoch 5/10:  34%|███▍      | 755/2208 [00:41<01:34, 15.42it/s][A

Batch 750: Training loss = 0.2407, Training accuracy = 0.9288, F1 = 0.9287



Epoch 5/10:  34%|███▍      | 758/2208 [00:42<01:25, 16.89it/s][A
Epoch 5/10:  34%|███▍      | 761/2208 [00:42<01:19, 18.12it/s][A
Epoch 5/10:  35%|███▍      | 764/2208 [00:42<01:16, 18.81it/s][A
Epoch 5/10:  35%|███▍      | 767/2208 [00:42<01:14, 19.45it/s][A
Epoch 5/10:  35%|███▍      | 770/2208 [00:42<01:12, 19.81it/s][A
Epoch 5/10:  35%|███▌      | 773/2208 [00:42<01:11, 20.08it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  35%|███▌      | 779/2208 [00:43<01:28, 16.06it/s][A

Batch 775: Training loss = 0.1635, Training accuracy = 0.9287, F1 = 0.9286



Epoch 5/10:  35%|███▌      | 782/2208 [00:43<01:21, 17.40it/s][A
Epoch 5/10:  36%|███▌      | 785/2208 [00:43<01:17, 18.31it/s][A
Epoch 5/10:  36%|███▌      | 788/2208 [00:43<01:14, 19.08it/s][A
Epoch 5/10:  36%|███▌      | 791/2208 [00:43<01:12, 19.65it/s][A
Epoch 5/10:  36%|███▌      | 794/2208 [00:44<01:10, 20.08it/s][A
Epoch 5/10:  36%|███▌      | 797/2208 [00:44<01:10, 20.02it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  36%|███▋      | 803/2208 [00:44<01:29, 15.74it/s][A

Batch 800: Training loss = 0.1387, Training accuracy = 0.9287, F1 = 0.9286



Epoch 5/10:  37%|███▋      | 806/2208 [00:44<01:22, 17.00it/s][A
Epoch 5/10:  37%|███▋      | 809/2208 [00:44<01:17, 18.07it/s][A
Epoch 5/10:  37%|███▋      | 812/2208 [00:45<01:14, 18.80it/s][A
Epoch 5/10:  37%|███▋      | 815/2208 [00:45<01:11, 19.43it/s][A
Epoch 5/10:  37%|███▋      | 818/2208 [00:45<01:09, 20.03it/s][A
Epoch 5/10:  37%|███▋      | 821/2208 [00:45<01:07, 20.40it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  37%|███▋      | 827/2208 [00:45<01:32, 14.91it/s][A
Epoch 5/10:  38%|███▊      | 830/2208 [00:46<01:23, 16.46it/s][A

Batch 825: Training loss = 0.2740, Training accuracy = 0.9286, F1 = 0.9285



Epoch 5/10:  38%|███▊      | 833/2208 [00:46<01:17, 17.70it/s][A
Epoch 5/10:  38%|███▊      | 836/2208 [00:46<01:13, 18.57it/s][A
Epoch 5/10:  38%|███▊      | 839/2208 [00:46<01:11, 19.21it/s][A
Epoch 5/10:  38%|███▊      | 842/2208 [00:46<01:08, 19.84it/s][A
Epoch 5/10:  38%|███▊      | 845/2208 [00:46<01:07, 20.26it/s][A
Epoch 5/10:  38%|███▊      | 848/2208 [00:46<01:07, 20.27it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  39%|███▊      | 854/2208 [00:47<01:20, 16.89it/s][A

Batch 850: Training loss = 0.2309, Training accuracy = 0.9288, F1 = 0.9286



Epoch 5/10:  39%|███▉      | 857/2208 [00:47<01:15, 17.98it/s][A
Epoch 5/10:  39%|███▉      | 860/2208 [00:47<01:11, 18.91it/s][A
Epoch 5/10:  39%|███▉      | 863/2208 [00:47<01:08, 19.61it/s][A
Epoch 5/10:  39%|███▉      | 866/2208 [00:47<01:06, 20.04it/s][A
Epoch 5/10:  39%|███▉      | 869/2208 [00:48<01:05, 20.42it/s][A
Epoch 5/10:  39%|███▉      | 872/2208 [00:48<01:04, 20.77it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  40%|███▉      | 878/2208 [00:48<01:24, 15.83it/s][A

Batch 875: Training loss = 0.1200, Training accuracy = 0.9288, F1 = 0.9287



Epoch 5/10:  40%|███▉      | 881/2208 [00:48<01:17, 17.23it/s][A
Epoch 5/10:  40%|████      | 884/2208 [00:48<01:12, 18.35it/s][A
Epoch 5/10:  40%|████      | 887/2208 [00:49<01:09, 19.11it/s][A
Epoch 5/10:  40%|████      | 890/2208 [00:49<01:06, 19.72it/s][A
Epoch 5/10:  40%|████      | 893/2208 [00:49<01:05, 20.09it/s][A
Epoch 5/10:  41%|████      | 896/2208 [00:49<01:08, 19.29it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  41%|████      | 902/2208 [00:49<01:26, 15.08it/s][A
Epoch 5/10:  41%|████      | 905/2208 [00:50<01:18, 16.60it/s][A

Batch 900: Training loss = 0.3565, Training accuracy = 0.9289, F1 = 0.9288



Epoch 5/10:  41%|████      | 908/2208 [00:50<01:13, 17.79it/s][A
Epoch 5/10:  41%|████▏     | 911/2208 [00:50<01:09, 18.62it/s][A
Epoch 5/10:  41%|████▏     | 914/2208 [00:50<01:06, 19.45it/s][A
Epoch 5/10:  42%|████▏     | 917/2208 [00:50<01:04, 20.06it/s][A
Epoch 5/10:  42%|████▏     | 920/2208 [00:50<01:03, 20.41it/s][A
Epoch 5/10:  42%|████▏     | 923/2208 [00:50<01:02, 20.63it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  42%|████▏     | 929/2208 [00:51<01:17, 16.43it/s][A

Batch 925: Training loss = 0.1746, Training accuracy = 0.9290, F1 = 0.9289



Epoch 5/10:  42%|████▏     | 932/2208 [00:51<01:12, 17.63it/s][A
Epoch 5/10:  42%|████▏     | 935/2208 [00:51<01:08, 18.50it/s][A
Epoch 5/10:  42%|████▏     | 938/2208 [00:51<01:05, 19.29it/s][A
Epoch 5/10:  43%|████▎     | 941/2208 [00:51<01:03, 19.88it/s][A
Epoch 5/10:  43%|████▎     | 944/2208 [00:52<01:07, 18.63it/s][A
Epoch 5/10:  43%|████▎     | 947/2208 [00:52<01:05, 19.27it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  43%|████▎     | 953/2208 [00:52<01:27, 14.35it/s][A

Batch 950: Training loss = 0.1663, Training accuracy = 0.9290, F1 = 0.9289



Epoch 5/10:  43%|████▎     | 956/2208 [00:52<01:18, 15.89it/s][A
Epoch 5/10:  43%|████▎     | 959/2208 [00:53<01:12, 17.13it/s][A
Epoch 5/10:  44%|████▎     | 962/2208 [00:53<01:08, 18.09it/s][A
Epoch 5/10:  44%|████▎     | 965/2208 [00:53<01:06, 18.79it/s][A
Epoch 5/10:  44%|████▍     | 968/2208 [00:53<01:04, 19.29it/s][A
Epoch 5/10:  44%|████▍     | 971/2208 [00:53<01:02, 19.76it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  44%|████▍     | 977/2208 [00:54<01:29, 13.77it/s][A
Epoch 5/10:  44%|████▍     | 980/2208 [00:54<01:19, 15.45it/s][A

Batch 975: Training loss = 0.1821, Training accuracy = 0.9290, F1 = 0.9289



Epoch 5/10:  45%|████▍     | 983/2208 [00:54<01:12, 16.80it/s][A
Epoch 5/10:  45%|████▍     | 986/2208 [00:54<01:08, 17.92it/s][A
Epoch 5/10:  45%|████▍     | 989/2208 [00:54<01:04, 18.82it/s][A
Epoch 5/10:  45%|████▍     | 992/2208 [00:54<01:02, 19.43it/s][A
Epoch 5/10:  45%|████▌     | 995/2208 [00:55<01:01, 19.82it/s][A
Epoch 5/10:  45%|████▌     | 998/2208 [00:55<01:00, 19.94it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  45%|████▌     | 1004/2208 [00:55<01:24, 14.31it/s][A

Batch 1000: Training loss = 0.2240, Training accuracy = 0.9290, F1 = 0.9289



Epoch 5/10:  46%|████▌     | 1007/2208 [00:55<01:15, 15.94it/s][A
Epoch 5/10:  46%|████▌     | 1010/2208 [00:56<01:09, 17.20it/s][A
Epoch 5/10:  46%|████▌     | 1013/2208 [00:56<01:05, 18.15it/s][A
Epoch 5/10:  46%|████▌     | 1016/2208 [00:56<01:02, 18.98it/s][A
Epoch 5/10:  46%|████▌     | 1019/2208 [00:56<01:00, 19.57it/s][A
Epoch 5/10:  46%|████▋     | 1022/2208 [00:56<00:59, 19.97it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  47%|████▋     | 1028/2208 [00:57<01:24, 13.94it/s][A

Batch 1025: Training loss = 0.0965, Training accuracy = 0.9291, F1 = 0.9290



Epoch 5/10:  47%|████▋     | 1031/2208 [00:57<01:15, 15.58it/s][A
Epoch 5/10:  47%|████▋     | 1034/2208 [00:57<01:09, 16.99it/s][A
Epoch 5/10:  47%|████▋     | 1037/2208 [00:57<01:04, 18.03it/s][A
Epoch 5/10:  47%|████▋     | 1040/2208 [00:57<01:02, 18.78it/s][A
Epoch 5/10:  47%|████▋     | 1043/2208 [00:57<00:59, 19.47it/s][A
Epoch 5/10:  47%|████▋     | 1046/2208 [00:57<00:58, 20.00it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  48%|████▊     | 1052/2208 [00:58<01:22, 14.05it/s][A
Epoch 5/10:  48%|████▊     | 1055/2208 [00:58<01:13, 15.77it/s][A

Batch 1050: Training loss = 0.2328, Training accuracy = 0.9292, F1 = 0.9291



Epoch 5/10:  48%|████▊     | 1058/2208 [00:58<01:07, 17.14it/s][A
Epoch 5/10:  48%|████▊     | 1061/2208 [00:58<01:02, 18.24it/s][A
Epoch 5/10:  48%|████▊     | 1064/2208 [00:59<01:00, 19.03it/s][A
Epoch 5/10:  48%|████▊     | 1067/2208 [00:59<00:58, 19.64it/s][A
Epoch 5/10:  48%|████▊     | 1070/2208 [00:59<00:56, 20.12it/s][A
Epoch 5/10:  49%|████▊     | 1073/2208 [00:59<00:55, 20.37it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  49%|████▉     | 1079/2208 [00:59<01:09, 16.26it/s][A

Batch 1075: Training loss = 0.1334, Training accuracy = 0.9291, F1 = 0.9290



Epoch 5/10:  49%|████▉     | 1082/2208 [01:00<01:04, 17.52it/s][A
Epoch 5/10:  49%|████▉     | 1085/2208 [01:00<01:00, 18.60it/s][A
Epoch 5/10:  49%|████▉     | 1088/2208 [01:00<00:58, 19.16it/s][A
Epoch 5/10:  49%|████▉     | 1091/2208 [01:00<00:56, 19.78it/s][A
Epoch 5/10:  50%|████▉     | 1094/2208 [01:00<00:55, 20.18it/s][A
Epoch 5/10:  50%|████▉     | 1097/2208 [01:00<00:53, 20.61it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  50%|████▉     | 1103/2208 [01:01<01:19, 13.82it/s][A

Batch 1100: Training loss = 0.2466, Training accuracy = 0.9292, F1 = 0.9291



Epoch 5/10:  50%|█████     | 1106/2208 [01:01<01:11, 15.51it/s][A
Epoch 5/10:  50%|█████     | 1109/2208 [01:01<01:04, 16.94it/s][A
Epoch 5/10:  50%|█████     | 1112/2208 [01:01<01:01, 17.96it/s][A
Epoch 5/10:  50%|█████     | 1115/2208 [01:01<00:57, 18.92it/s][A
Epoch 5/10:  51%|█████     | 1118/2208 [01:02<00:55, 19.57it/s][A
Epoch 5/10:  51%|█████     | 1121/2208 [01:02<00:54, 20.09it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  51%|█████     | 1127/2208 [01:02<01:15, 14.40it/s][A
Epoch 5/10:  51%|█████     | 1130/2208 [01:02<01:07, 15.99it/s][A

Batch 1125: Training loss = 0.1505, Training accuracy = 0.9294, F1 = 0.9293



Epoch 5/10:  51%|█████▏    | 1133/2208 [01:02<01:02, 17.30it/s][A
Epoch 5/10:  51%|█████▏    | 1136/2208 [01:03<00:58, 18.39it/s][A
Epoch 5/10:  52%|█████▏    | 1139/2208 [01:03<00:55, 19.19it/s][A
Epoch 5/10:  52%|█████▏    | 1142/2208 [01:03<00:53, 19.83it/s][A
Epoch 5/10:  52%|█████▏    | 1145/2208 [01:03<00:52, 20.34it/s][A
Epoch 5/10:  52%|█████▏    | 1148/2208 [01:03<00:51, 20.66it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  52%|█████▏    | 1154/2208 [01:04<01:05, 16.09it/s][A

Batch 1150: Training loss = 0.1330, Training accuracy = 0.9295, F1 = 0.9294



Epoch 5/10:  52%|█████▏    | 1157/2208 [01:04<01:00, 17.40it/s][A
Epoch 5/10:  53%|█████▎    | 1160/2208 [01:04<00:56, 18.40it/s][A
Epoch 5/10:  53%|█████▎    | 1163/2208 [01:04<00:54, 19.19it/s][A
Epoch 5/10:  53%|█████▎    | 1166/2208 [01:04<00:52, 19.82it/s][A
Epoch 5/10:  53%|█████▎    | 1169/2208 [01:04<00:51, 20.20it/s][A
Epoch 5/10:  53%|█████▎    | 1172/2208 [01:04<00:50, 20.56it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  53%|█████▎    | 1178/2208 [01:05<01:11, 14.33it/s][A

Batch 1175: Training loss = 0.3024, Training accuracy = 0.9295, F1 = 0.9294



Epoch 5/10:  53%|█████▎    | 1181/2208 [01:05<01:04, 15.96it/s][A
Epoch 5/10:  54%|█████▎    | 1184/2208 [01:05<00:59, 17.22it/s][A
Epoch 5/10:  54%|█████▍    | 1187/2208 [01:05<00:55, 18.24it/s][A
Epoch 5/10:  54%|█████▍    | 1190/2208 [01:06<00:53, 19.07it/s][A
Epoch 5/10:  54%|█████▍    | 1193/2208 [01:06<00:58, 17.31it/s][A
Epoch 5/10:  54%|█████▍    | 1196/2208 [01:06<00:55, 18.23it/s][A
Epoch 5/10:  54%|█████▍    | 1198/2208 [01:06<00:54, 18.40it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  55%|█████▍    | 1204/2208 [01:07<01:09, 14.41it/s][A

Batch 1200: Training loss = 0.2370, Training accuracy = 0.9294, F1 = 0.9293



Epoch 5/10:  55%|█████▍    | 1207/2208 [01:07<01:02, 16.07it/s][A
Epoch 5/10:  55%|█████▍    | 1210/2208 [01:07<00:57, 17.44it/s][A
Epoch 5/10:  55%|█████▍    | 1213/2208 [01:07<00:54, 18.36it/s][A
Epoch 5/10:  55%|█████▌    | 1216/2208 [01:07<00:52, 19.04it/s][A
Epoch 5/10:  55%|█████▌    | 1219/2208 [01:07<00:53, 18.37it/s][A
Epoch 5/10:  55%|█████▌    | 1222/2208 [01:07<00:51, 19.23it/s][A
Epoch 5/10:  55%|█████▌    | 1224/2208 [01:08<00:53, 18.43it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  56%|█████▌    | 1229/2208 [01:08<01:10, 13.84it/s][A

Batch 1225: Training loss = 0.1820, Training accuracy = 0.9295, F1 = 0.9294



Epoch 5/10:  56%|█████▌    | 1232/2208 [01:08<01:02, 15.66it/s][A
Epoch 5/10:  56%|█████▌    | 1235/2208 [01:08<00:57, 17.02it/s][A
Epoch 5/10:  56%|█████▌    | 1237/2208 [01:08<00:55, 17.62it/s][A
Epoch 5/10:  56%|█████▌    | 1240/2208 [01:09<00:51, 18.66it/s][A
Epoch 5/10:  56%|█████▋    | 1243/2208 [01:09<00:50, 19.25it/s][A
Epoch 5/10:  56%|█████▋    | 1246/2208 [01:09<00:51, 18.74it/s][A
Epoch 5/10:  57%|█████▋    | 1249/2208 [01:09<00:49, 19.43it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  57%|█████▋    | 1254/2208 [01:10<01:11, 13.43it/s][A

Batch 1250: Training loss = 0.2838, Training accuracy = 0.9296, F1 = 0.9295



Epoch 5/10:  57%|█████▋    | 1257/2208 [01:10<01:02, 15.25it/s][A
Epoch 5/10:  57%|█████▋    | 1260/2208 [01:10<00:56, 16.68it/s][A
Epoch 5/10:  57%|█████▋    | 1263/2208 [01:10<00:53, 17.82it/s][A
Epoch 5/10:  57%|█████▋    | 1266/2208 [01:10<00:50, 18.70it/s][A
Epoch 5/10:  57%|█████▋    | 1269/2208 [01:10<00:48, 19.48it/s][A
Epoch 5/10:  58%|█████▊    | 1272/2208 [01:10<00:46, 19.99it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  58%|█████▊    | 1278/2208 [01:11<01:08, 13.52it/s][A

Batch 1275: Training loss = 0.1283, Training accuracy = 0.9297, F1 = 0.9296



Epoch 5/10:  58%|█████▊    | 1281/2208 [01:11<01:00, 15.23it/s][A
Epoch 5/10:  58%|█████▊    | 1284/2208 [01:11<00:55, 16.72it/s][A
Epoch 5/10:  58%|█████▊    | 1287/2208 [01:11<00:51, 17.80it/s][A
Epoch 5/10:  58%|█████▊    | 1290/2208 [01:12<00:49, 18.59it/s][A
Epoch 5/10:  59%|█████▊    | 1293/2208 [01:12<00:47, 19.27it/s][A
Epoch 5/10:  59%|█████▊    | 1296/2208 [01:12<00:46, 19.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  59%|█████▉    | 1302/2208 [01:12<01:06, 13.69it/s][A
Epoch 5/10:  59%|█████▉    | 1305/2208 [01:12<00:58, 15.42it/s][A

Batch 1300: Training loss = 0.2474, Training accuracy = 0.9297, F1 = 0.9296



Epoch 5/10:  59%|█████▉    | 1308/2208 [01:13<00:53, 16.77it/s][A
Epoch 5/10:  59%|█████▉    | 1311/2208 [01:13<00:50, 17.82it/s][A
Epoch 5/10:  60%|█████▉    | 1314/2208 [01:13<00:47, 18.75it/s][A
Epoch 5/10:  60%|█████▉    | 1317/2208 [01:13<00:45, 19.47it/s][A
Epoch 5/10:  60%|█████▉    | 1320/2208 [01:13<00:44, 19.87it/s][A
Epoch 5/10:  60%|█████▉    | 1323/2208 [01:13<00:43, 20.27it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  60%|██████    | 1329/2208 [01:14<00:57, 15.25it/s][A

Batch 1325: Training loss = 0.1450, Training accuracy = 0.9298, F1 = 0.9297



Epoch 5/10:  60%|██████    | 1332/2208 [01:14<00:52, 16.63it/s][A
Epoch 5/10:  60%|██████    | 1335/2208 [01:14<00:49, 17.81it/s][A
Epoch 5/10:  61%|██████    | 1338/2208 [01:14<00:46, 18.68it/s][A
Epoch 5/10:  61%|██████    | 1341/2208 [01:14<00:44, 19.34it/s][A
Epoch 5/10:  61%|██████    | 1344/2208 [01:15<00:44, 19.57it/s][A
Epoch 5/10:  61%|██████    | 1347/2208 [01:15<00:42, 20.14it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  61%|██████▏   | 1353/2208 [01:15<01:03, 13.48it/s][A

Batch 1350: Training loss = 0.1931, Training accuracy = 0.9300, F1 = 0.9299



Epoch 5/10:  61%|██████▏   | 1356/2208 [01:15<00:55, 15.24it/s][A
Epoch 5/10:  62%|██████▏   | 1359/2208 [01:16<00:51, 16.65it/s][A
Epoch 5/10:  62%|██████▏   | 1362/2208 [01:16<00:47, 17.72it/s][A
Epoch 5/10:  62%|██████▏   | 1365/2208 [01:16<00:45, 18.62it/s][A
Epoch 5/10:  62%|██████▏   | 1368/2208 [01:16<00:43, 19.45it/s][A
Epoch 5/10:  62%|██████▏   | 1371/2208 [01:16<00:42, 19.91it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  62%|██████▏   | 1377/2208 [01:17<01:04, 12.80it/s][A
Epoch 5/10:  62%|██████▎   | 1380/2208 [01:17<00:56, 14.61it/s][A

Batch 1375: Training loss = 0.1721, Training accuracy = 0.9300, F1 = 0.9299



Epoch 5/10:  63%|██████▎   | 1383/2208 [01:17<00:51, 16.16it/s][A
Epoch 5/10:  63%|██████▎   | 1386/2208 [01:17<00:47, 17.44it/s][A
Epoch 5/10:  63%|██████▎   | 1389/2208 [01:17<00:44, 18.45it/s][A
Epoch 5/10:  63%|██████▎   | 1392/2208 [01:17<00:42, 19.20it/s][A
Epoch 5/10:  63%|██████▎   | 1395/2208 [01:18<00:41, 19.68it/s][A
Epoch 5/10:  63%|██████▎   | 1398/2208 [01:18<00:40, 20.15it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  64%|██████▎   | 1404/2208 [01:18<00:54, 14.78it/s][A

Batch 1400: Training loss = 0.1501, Training accuracy = 0.9300, F1 = 0.9299



Epoch 5/10:  64%|██████▎   | 1407/2208 [01:18<00:48, 16.35it/s][A
Epoch 5/10:  64%|██████▍   | 1410/2208 [01:19<00:45, 17.56it/s][A
Epoch 5/10:  64%|██████▍   | 1413/2208 [01:19<00:42, 18.54it/s][A
Epoch 5/10:  64%|██████▍   | 1416/2208 [01:19<00:40, 19.40it/s][A
Epoch 5/10:  64%|██████▍   | 1419/2208 [01:19<00:39, 19.97it/s][A
Epoch 5/10:  64%|██████▍   | 1422/2208 [01:19<00:38, 20.29it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  65%|██████▍   | 1428/2208 [01:20<01:07, 11.62it/s][A

Batch 1425: Training loss = 0.1387, Training accuracy = 0.9301, F1 = 0.9300



Epoch 5/10:  65%|██████▍   | 1431/2208 [01:20<00:57, 13.48it/s][A
Epoch 5/10:  65%|██████▍   | 1434/2208 [01:20<00:51, 15.11it/s][A
Epoch 5/10:  65%|██████▌   | 1437/2208 [01:20<00:46, 16.45it/s][A
Epoch 5/10:  65%|██████▌   | 1440/2208 [01:20<00:43, 17.53it/s][A
Epoch 5/10:  65%|██████▌   | 1443/2208 [01:20<00:41, 18.42it/s][A
Epoch 5/10:  65%|██████▌   | 1446/2208 [01:21<00:39, 19.20it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  66%|██████▌   | 1452/2208 [01:21<01:05, 11.49it/s][A
Epoch 5/10:  66%|██████▌   | 1455/2208 [01:21<00:56, 13.34it/s][A

Batch 1450: Training loss = 0.2555, Training accuracy = 0.9303, F1 = 0.9302



Epoch 5/10:  66%|██████▌   | 1458/2208 [01:22<00:49, 15.01it/s][A
Epoch 5/10:  66%|██████▌   | 1461/2208 [01:22<00:45, 16.37it/s][A
Epoch 5/10:  66%|██████▋   | 1464/2208 [01:22<00:42, 17.50it/s][A
Epoch 5/10:  66%|██████▋   | 1467/2208 [01:22<00:40, 18.51it/s][A
Epoch 5/10:  67%|██████▋   | 1470/2208 [01:22<00:38, 19.26it/s][A
Epoch 5/10:  67%|██████▋   | 1473/2208 [01:22<00:39, 18.41it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  67%|██████▋   | 1477/2208 [01:23<01:06, 10.92it/s][A
Epoch 5/10:  67%|██████▋   | 1480/2208 [01:23<00:55, 13.08it/s][A

Batch 1475: Training loss = 0.1768, Training accuracy = 0.9304, F1 = 0.9303



Epoch 5/10:  67%|██████▋   | 1483/2208 [01:23<00:48, 15.03it/s][A
Epoch 5/10:  67%|██████▋   | 1486/2208 [01:23<00:43, 16.54it/s][A
Epoch 5/10:  67%|██████▋   | 1489/2208 [01:23<00:40, 17.75it/s][A
Epoch 5/10:  68%|██████▊   | 1492/2208 [01:24<00:38, 18.66it/s][A
Epoch 5/10:  68%|██████▊   | 1495/2208 [01:24<00:37, 19.26it/s][A
Epoch 5/10:  68%|██████▊   | 1498/2208 [01:24<00:37, 18.93it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  68%|██████▊   | 1504/2208 [01:24<00:51, 13.67it/s][A

Batch 1500: Training loss = 0.1876, Training accuracy = 0.9306, F1 = 0.9305



Epoch 5/10:  68%|██████▊   | 1507/2208 [01:25<00:45, 15.37it/s][A
Epoch 5/10:  68%|██████▊   | 1510/2208 [01:25<00:41, 16.71it/s][A
Epoch 5/10:  69%|██████▊   | 1513/2208 [01:25<00:38, 17.87it/s][A
Epoch 5/10:  69%|██████▊   | 1516/2208 [01:25<00:37, 18.66it/s][A
Epoch 5/10:  69%|██████▉   | 1519/2208 [01:25<00:35, 19.43it/s][A
Epoch 5/10:  69%|██████▉   | 1522/2208 [01:25<00:34, 19.89it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  69%|██████▉   | 1528/2208 [01:26<00:55, 12.20it/s][A

Batch 1525: Training loss = 0.1023, Training accuracy = 0.9307, F1 = 0.9307



Epoch 5/10:  69%|██████▉   | 1531/2208 [01:26<00:48, 14.04it/s][A
Epoch 5/10:  69%|██████▉   | 1534/2208 [01:26<00:43, 15.62it/s][A
Epoch 5/10:  70%|██████▉   | 1537/2208 [01:26<00:39, 17.00it/s][A
Epoch 5/10:  70%|██████▉   | 1540/2208 [01:26<00:37, 18.03it/s][A
Epoch 5/10:  70%|██████▉   | 1543/2208 [01:27<00:35, 18.89it/s][A
Epoch 5/10:  70%|███████   | 1546/2208 [01:27<00:33, 19.62it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  70%|███████   | 1552/2208 [01:27<00:53, 12.25it/s][A
Epoch 5/10:  70%|███████   | 1555/2208 [01:27<00:46, 14.07it/s][A

Batch 1550: Training loss = 0.0779, Training accuracy = 0.9310, F1 = 0.9309



Epoch 5/10:  71%|███████   | 1558/2208 [01:28<00:41, 15.74it/s][A
Epoch 5/10:  71%|███████   | 1561/2208 [01:28<00:37, 17.05it/s][A
Epoch 5/10:  71%|███████   | 1564/2208 [01:28<00:35, 18.17it/s][A
Epoch 5/10:  71%|███████   | 1567/2208 [01:28<00:33, 18.99it/s][A
Epoch 5/10:  71%|███████   | 1570/2208 [01:28<00:32, 19.54it/s][A
Epoch 5/10:  71%|███████   | 1573/2208 [01:28<00:31, 19.98it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  72%|███████▏  | 1579/2208 [01:29<00:46, 13.59it/s][A

Batch 1575: Training loss = 0.1766, Training accuracy = 0.9310, F1 = 0.9309



Epoch 5/10:  72%|███████▏  | 1582/2208 [01:29<00:41, 15.21it/s][A
Epoch 5/10:  72%|███████▏  | 1585/2208 [01:29<00:37, 16.69it/s][A
Epoch 5/10:  72%|███████▏  | 1588/2208 [01:29<00:34, 17.88it/s][A
Epoch 5/10:  72%|███████▏  | 1591/2208 [01:30<00:32, 18.77it/s][A
Epoch 5/10:  72%|███████▏  | 1594/2208 [01:30<00:31, 19.44it/s][A
Epoch 5/10:  72%|███████▏  | 1597/2208 [01:30<00:30, 19.93it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  73%|███████▎  | 1603/2208 [01:30<00:49, 12.33it/s][A

Batch 1600: Training loss = 0.1438, Training accuracy = 0.9311, F1 = 0.9310



Epoch 5/10:  73%|███████▎  | 1606/2208 [01:31<00:42, 14.16it/s][A
Epoch 5/10:  73%|███████▎  | 1609/2208 [01:31<00:37, 15.84it/s][A
Epoch 5/10:  73%|███████▎  | 1612/2208 [01:31<00:34, 17.10it/s][A
Epoch 5/10:  73%|███████▎  | 1615/2208 [01:31<00:32, 18.13it/s][A
Epoch 5/10:  73%|███████▎  | 1618/2208 [01:31<00:31, 19.01it/s][A
Epoch 5/10:  73%|███████▎  | 1621/2208 [01:31<00:29, 19.69it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  74%|███████▎  | 1627/2208 [01:32<00:47, 12.19it/s][A
Epoch 5/10:  74%|███████▍  | 1630/2208 [01:32<00:41, 14.03it/s][A

Batch 1625: Training loss = 0.1815, Training accuracy = 0.9312, F1 = 0.9311



Epoch 5/10:  74%|███████▍  | 1633/2208 [01:32<00:36, 15.62it/s][A
Epoch 5/10:  74%|███████▍  | 1636/2208 [01:32<00:33, 16.95it/s][A
Epoch 5/10:  74%|███████▍  | 1639/2208 [01:32<00:31, 18.11it/s][A
Epoch 5/10:  74%|███████▍  | 1642/2208 [01:33<00:29, 19.02it/s][A
Epoch 5/10:  75%|███████▍  | 1645/2208 [01:33<00:28, 19.70it/s][A
Epoch 5/10:  75%|███████▍  | 1648/2208 [01:33<00:27, 20.10it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  75%|███████▍  | 1654/2208 [01:33<00:40, 13.82it/s][A

Batch 1650: Training loss = 0.1449, Training accuracy = 0.9313, F1 = 0.9312



Epoch 5/10:  75%|███████▌  | 1657/2208 [01:34<00:35, 15.46it/s][A
Epoch 5/10:  75%|███████▌  | 1660/2208 [01:34<00:32, 16.75it/s][A
Epoch 5/10:  75%|███████▌  | 1663/2208 [01:34<00:30, 17.89it/s][A
Epoch 5/10:  75%|███████▌  | 1666/2208 [01:34<00:29, 18.68it/s][A
Epoch 5/10:  76%|███████▌  | 1669/2208 [01:34<00:28, 19.18it/s][A
Epoch 5/10:  76%|███████▌  | 1672/2208 [01:34<00:27, 19.67it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  76%|███████▌  | 1678/2208 [01:35<00:47, 11.16it/s][A

Batch 1675: Training loss = 0.1931, Training accuracy = 0.9314, F1 = 0.9313



Epoch 5/10:  76%|███████▌  | 1681/2208 [01:35<00:40, 13.06it/s][A
Epoch 5/10:  76%|███████▋  | 1684/2208 [01:35<00:35, 14.81it/s][A
Epoch 5/10:  76%|███████▋  | 1687/2208 [01:35<00:31, 16.34it/s][A
Epoch 5/10:  77%|███████▋  | 1690/2208 [01:36<00:29, 17.57it/s][A
Epoch 5/10:  77%|███████▋  | 1693/2208 [01:36<00:29, 17.29it/s][A
Epoch 5/10:  77%|███████▋  | 1695/2208 [01:36<00:34, 14.92it/s][A
Epoch 5/10:  77%|███████▋  | 1698/2208 [01:36<00:30, 16.47it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  77%|███████▋  | 1704/2208 [01:37<00:40, 12.37it/s][A

Batch 1700: Training loss = 0.2650, Training accuracy = 0.9316, F1 = 0.9315



Epoch 5/10:  77%|███████▋  | 1707/2208 [01:37<00:35, 14.21it/s][A
Epoch 5/10:  77%|███████▋  | 1710/2208 [01:37<00:31, 15.84it/s][A
Epoch 5/10:  78%|███████▊  | 1713/2208 [01:37<00:28, 17.25it/s][A
Epoch 5/10:  78%|███████▊  | 1716/2208 [01:37<00:26, 18.25it/s][A
Epoch 5/10:  78%|███████▊  | 1719/2208 [01:37<00:25, 18.97it/s][A
Epoch 5/10:  78%|███████▊  | 1722/2208 [01:38<00:26, 18.44it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  78%|███████▊  | 1727/2208 [01:38<00:48,  9.89it/s][A
Epoch 5/10:  78%|███████▊  | 1730/2208 [01:38<00:39, 12.01it/s][A

Batch 1725: Training loss = 0.2171, Training accuracy = 0.9316, F1 = 0.9315



Epoch 5/10:  78%|███████▊  | 1733/2208 [01:39<00:33, 13.99it/s][A
Epoch 5/10:  79%|███████▊  | 1736/2208 [01:39<00:30, 15.65it/s][A
Epoch 5/10:  79%|███████▉  | 1739/2208 [01:39<00:27, 17.06it/s][A
Epoch 5/10:  79%|███████▉  | 1742/2208 [01:39<00:25, 18.16it/s][A
Epoch 5/10:  79%|███████▉  | 1745/2208 [01:39<00:24, 18.94it/s][A
Epoch 5/10:  79%|███████▉  | 1748/2208 [01:39<00:23, 19.63it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  79%|███████▉  | 1754/2208 [01:40<00:32, 13.91it/s][A

Batch 1750: Training loss = 0.2083, Training accuracy = 0.9316, F1 = 0.9315



Epoch 5/10:  80%|███████▉  | 1757/2208 [01:40<00:28, 15.56it/s][A
Epoch 5/10:  80%|███████▉  | 1760/2208 [01:40<00:26, 16.96it/s][A
Epoch 5/10:  80%|███████▉  | 1763/2208 [01:40<00:24, 18.10it/s][A
Epoch 5/10:  80%|███████▉  | 1766/2208 [01:41<00:23, 18.90it/s][A
Epoch 5/10:  80%|████████  | 1769/2208 [01:41<00:22, 19.48it/s][A
Epoch 5/10:  80%|████████  | 1772/2208 [01:41<00:21, 20.07it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  81%|████████  | 1778/2208 [01:41<00:35, 12.24it/s][A

Batch 1775: Training loss = 0.3159, Training accuracy = 0.9316, F1 = 0.9315



Epoch 5/10:  81%|████████  | 1781/2208 [01:42<00:30, 14.07it/s][A
Epoch 5/10:  81%|████████  | 1784/2208 [01:42<00:27, 15.67it/s][A
Epoch 5/10:  81%|████████  | 1787/2208 [01:42<00:24, 17.04it/s][A
Epoch 5/10:  81%|████████  | 1790/2208 [01:42<00:23, 18.08it/s][A
Epoch 5/10:  81%|████████  | 1793/2208 [01:42<00:21, 18.90it/s][A
Epoch 5/10:  81%|████████▏ | 1796/2208 [01:42<00:21, 19.54it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  82%|████████▏ | 1802/2208 [01:43<00:34, 11.87it/s][A
Epoch 5/10:  82%|████████▏ | 1805/2208 [01:43<00:29, 13.79it/s][A

Batch 1800: Training loss = 0.1055, Training accuracy = 0.9316, F1 = 0.9315



Epoch 5/10:  82%|████████▏ | 1808/2208 [01:43<00:25, 15.40it/s][A
Epoch 5/10:  82%|████████▏ | 1811/2208 [01:43<00:23, 16.76it/s][A
Epoch 5/10:  82%|████████▏ | 1814/2208 [01:43<00:22, 17.77it/s][A
Epoch 5/10:  82%|████████▏ | 1817/2208 [01:44<00:20, 18.73it/s][A
Epoch 5/10:  82%|████████▏ | 1820/2208 [01:44<00:20, 19.40it/s][A
Epoch 5/10:  83%|████████▎ | 1823/2208 [01:44<00:19, 19.85it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  83%|████████▎ | 1829/2208 [01:44<00:27, 13.90it/s][A

Batch 1825: Training loss = 0.1480, Training accuracy = 0.9317, F1 = 0.9316



Epoch 5/10:  83%|████████▎ | 1832/2208 [01:45<00:24, 15.55it/s][A
Epoch 5/10:  83%|████████▎ | 1835/2208 [01:45<00:22, 16.92it/s][A
Epoch 5/10:  83%|████████▎ | 1838/2208 [01:45<00:20, 18.04it/s][A
Epoch 5/10:  83%|████████▎ | 1841/2208 [01:45<00:19, 18.95it/s][A
Epoch 5/10:  84%|████████▎ | 1844/2208 [01:45<00:18, 19.62it/s][A
Epoch 5/10:  84%|████████▎ | 1847/2208 [01:45<00:17, 20.08it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  84%|████████▍ | 1853/2208 [01:46<00:30, 11.63it/s][A

Batch 1850: Training loss = 0.1173, Training accuracy = 0.9317, F1 = 0.9316



Epoch 5/10:  84%|████████▍ | 1856/2208 [01:46<00:26, 13.44it/s][A
Epoch 5/10:  84%|████████▍ | 1859/2208 [01:46<00:23, 15.17it/s][A
Epoch 5/10:  84%|████████▍ | 1862/2208 [01:46<00:20, 16.62it/s][A
Epoch 5/10:  84%|████████▍ | 1865/2208 [01:47<00:19, 17.72it/s][A
Epoch 5/10:  85%|████████▍ | 1868/2208 [01:47<00:18, 18.56it/s][A
Epoch 5/10:  85%|████████▍ | 1871/2208 [01:47<00:17, 19.24it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  85%|████████▌ | 1877/2208 [01:47<00:28, 11.81it/s][A
Epoch 5/10:  85%|████████▌ | 1880/2208 [01:48<00:23, 13.73it/s][A

Batch 1875: Training loss = 0.1715, Training accuracy = 0.9317, F1 = 0.9316



Epoch 5/10:  85%|████████▌ | 1883/2208 [01:48<00:21, 15.33it/s][A
Epoch 5/10:  85%|████████▌ | 1886/2208 [01:48<00:19, 16.73it/s][A
Epoch 5/10:  86%|████████▌ | 1889/2208 [01:48<00:17, 17.87it/s][A
Epoch 5/10:  86%|████████▌ | 1892/2208 [01:48<00:16, 18.88it/s][A
Epoch 5/10:  86%|████████▌ | 1895/2208 [01:48<00:16, 19.51it/s][A
Epoch 5/10:  86%|████████▌ | 1898/2208 [01:48<00:15, 19.90it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  86%|████████▌ | 1904/2208 [01:49<00:23, 12.89it/s][A

Batch 1900: Training loss = 0.2207, Training accuracy = 0.9317, F1 = 0.9316



Epoch 5/10:  86%|████████▋ | 1907/2208 [01:49<00:20, 14.64it/s][A
Epoch 5/10:  87%|████████▋ | 1910/2208 [01:49<00:18, 16.17it/s][A
Epoch 5/10:  87%|████████▋ | 1913/2208 [01:50<00:17, 17.32it/s][A
Epoch 5/10:  87%|████████▋ | 1916/2208 [01:50<00:16, 18.23it/s][A
Epoch 5/10:  87%|████████▋ | 1919/2208 [01:50<00:15, 19.02it/s][A
Epoch 5/10:  87%|████████▋ | 1922/2208 [01:50<00:14, 19.48it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  87%|████████▋ | 1928/2208 [01:51<00:25, 11.19it/s][A

Batch 1925: Training loss = 0.1880, Training accuracy = 0.9318, F1 = 0.9317



Epoch 5/10:  87%|████████▋ | 1931/2208 [01:51<00:21, 13.05it/s][A
Epoch 5/10:  88%|████████▊ | 1934/2208 [01:51<00:18, 14.72it/s][A
Epoch 5/10:  88%|████████▊ | 1937/2208 [01:51<00:16, 16.20it/s][A
Epoch 5/10:  88%|████████▊ | 1940/2208 [01:51<00:15, 17.36it/s][A
Epoch 5/10:  88%|████████▊ | 1942/2208 [01:51<00:14, 17.79it/s][A
Epoch 5/10:  88%|████████▊ | 1945/2208 [01:52<00:14, 18.63it/s][A
Epoch 5/10:  88%|████████▊ | 1948/2208 [01:52<00:13, 19.31it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  88%|████████▊ | 1954/2208 [01:52<00:20, 12.61it/s][A

Batch 1950: Training loss = 0.3106, Training accuracy = 0.9319, F1 = 0.9318



Epoch 5/10:  89%|████████▊ | 1957/2208 [01:52<00:17, 14.47it/s][A
Epoch 5/10:  89%|████████▉ | 1960/2208 [01:53<00:15, 16.09it/s][A
Epoch 5/10:  89%|████████▉ | 1963/2208 [01:53<00:14, 17.36it/s][A
Epoch 5/10:  89%|████████▉ | 1966/2208 [01:53<00:13, 18.41it/s][A
Epoch 5/10:  89%|████████▉ | 1969/2208 [01:53<00:12, 19.15it/s][A
Epoch 5/10:  89%|████████▉ | 1972/2208 [01:53<00:12, 19.45it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  90%|████████▉ | 1978/2208 [01:54<00:21, 10.65it/s][A

Batch 1975: Training loss = 0.2407, Training accuracy = 0.9320, F1 = 0.9319



Epoch 5/10:  90%|████████▉ | 1981/2208 [01:54<00:18, 12.54it/s][A
Epoch 5/10:  90%|████████▉ | 1984/2208 [01:54<00:15, 14.37it/s][A
Epoch 5/10:  90%|████████▉ | 1987/2208 [01:54<00:13, 15.90it/s][A
Epoch 5/10:  90%|█████████ | 1990/2208 [01:54<00:12, 17.18it/s][A
Epoch 5/10:  90%|█████████ | 1993/2208 [01:55<00:11, 18.19it/s][A
Epoch 5/10:  90%|█████████ | 1996/2208 [01:55<00:11, 19.03it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  91%|█████████ | 2002/2208 [01:55<00:18, 11.38it/s][A
Epoch 5/10:  91%|█████████ | 2005/2208 [01:56<00:15, 13.29it/s][A

Batch 2000: Training loss = 0.1574, Training accuracy = 0.9320, F1 = 0.9319



Epoch 5/10:  91%|█████████ | 2008/2208 [01:56<00:13, 15.04it/s][A
Epoch 5/10:  91%|█████████ | 2011/2208 [01:56<00:11, 16.51it/s][A
Epoch 5/10:  91%|█████████ | 2014/2208 [01:56<00:11, 17.63it/s][A
Epoch 5/10:  91%|█████████▏| 2017/2208 [01:56<00:10, 18.69it/s][A
Epoch 5/10:  91%|█████████▏| 2020/2208 [01:56<00:09, 19.52it/s][A
Epoch 5/10:  92%|█████████▏| 2023/2208 [01:56<00:09, 20.10it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  92%|█████████▏| 2029/2208 [01:57<00:13, 13.00it/s][A

Batch 2025: Training loss = 0.2073, Training accuracy = 0.9322, F1 = 0.9321



Epoch 5/10:  92%|█████████▏| 2032/2208 [01:57<00:11, 14.67it/s][A
Epoch 5/10:  92%|█████████▏| 2035/2208 [01:57<00:10, 16.11it/s][A
Epoch 5/10:  92%|█████████▏| 2038/2208 [01:58<00:09, 17.37it/s][A
Epoch 5/10:  92%|█████████▏| 2041/2208 [01:58<00:09, 18.36it/s][A
Epoch 5/10:  93%|█████████▎| 2044/2208 [01:58<00:08, 19.12it/s][A
Epoch 5/10:  93%|█████████▎| 2047/2208 [01:58<00:08, 19.71it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  93%|█████████▎| 2053/2208 [01:59<00:13, 11.20it/s][A

Batch 2050: Training loss = 0.1785, Training accuracy = 0.9322, F1 = 0.9321



Epoch 5/10:  93%|█████████▎| 2056/2208 [01:59<00:11, 13.11it/s][A
Epoch 5/10:  93%|█████████▎| 2059/2208 [01:59<00:10, 14.87it/s][A
Epoch 5/10:  93%|█████████▎| 2062/2208 [01:59<00:08, 16.35it/s][A
Epoch 5/10:  94%|█████████▎| 2065/2208 [01:59<00:08, 17.54it/s][A
Epoch 5/10:  94%|█████████▎| 2068/2208 [01:59<00:07, 18.56it/s][A
Epoch 5/10:  94%|█████████▍| 2071/2208 [01:59<00:07, 19.24it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  94%|█████████▍| 2077/2208 [02:00<00:11, 11.04it/s][A
Epoch 5/10:  94%|█████████▍| 2080/2208 [02:00<00:09, 12.93it/s][A

Batch 2075: Training loss = 0.2208, Training accuracy = 0.9323, F1 = 0.9322



Epoch 5/10:  94%|█████████▍| 2083/2208 [02:00<00:08, 14.70it/s][A
Epoch 5/10:  94%|█████████▍| 2086/2208 [02:01<00:07, 16.21it/s][A
Epoch 5/10:  95%|█████████▍| 2089/2208 [02:01<00:06, 17.48it/s][A
Epoch 5/10:  95%|█████████▍| 2092/2208 [02:01<00:06, 18.50it/s][A
Epoch 5/10:  95%|█████████▍| 2095/2208 [02:01<00:05, 19.26it/s][A
Epoch 5/10:  95%|█████████▌| 2098/2208 [02:01<00:05, 19.84it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  95%|█████████▌| 2104/2208 [02:02<00:07, 13.04it/s][A

Batch 2100: Training loss = 0.1927, Training accuracy = 0.9323, F1 = 0.9322



Epoch 5/10:  95%|█████████▌| 2107/2208 [02:02<00:06, 14.82it/s][A
Epoch 5/10:  96%|█████████▌| 2110/2208 [02:02<00:05, 16.37it/s][A
Epoch 5/10:  96%|█████████▌| 2113/2208 [02:02<00:05, 17.48it/s][A
Epoch 5/10:  96%|█████████▌| 2116/2208 [02:02<00:04, 18.42it/s][A
Epoch 5/10:  96%|█████████▌| 2119/2208 [02:03<00:04, 19.12it/s][A
Epoch 5/10:  96%|█████████▌| 2122/2208 [02:03<00:04, 19.55it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  96%|█████████▋| 2128/2208 [02:03<00:07, 10.74it/s][A

Batch 2125: Training loss = 0.1863, Training accuracy = 0.9323, F1 = 0.9322



Epoch 5/10:  97%|█████████▋| 2131/2208 [02:04<00:06, 12.67it/s][A
Epoch 5/10:  97%|█████████▋| 2134/2208 [02:04<00:05, 14.45it/s][A
Epoch 5/10:  97%|█████████▋| 2137/2208 [02:04<00:04, 15.92it/s][A
Epoch 5/10:  97%|█████████▋| 2139/2208 [02:04<00:04, 16.66it/s][A
Epoch 5/10:  97%|█████████▋| 2142/2208 [02:04<00:03, 17.73it/s][A
Epoch 5/10:  97%|█████████▋| 2145/2208 [02:04<00:03, 18.68it/s][A
Epoch 5/10:  97%|█████████▋| 2148/2208 [02:04<00:03, 19.41it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  98%|█████████▊| 2154/2208 [02:05<00:04, 12.30it/s][A

Batch 2150: Training loss = 0.1607, Training accuracy = 0.9325, F1 = 0.9324



Epoch 5/10:  98%|█████████▊| 2157/2208 [02:05<00:03, 14.11it/s][A
Epoch 5/10:  98%|█████████▊| 2160/2208 [02:05<00:03, 15.66it/s][A
Epoch 5/10:  98%|█████████▊| 2163/2208 [02:06<00:02, 17.02it/s][A
Epoch 5/10:  98%|█████████▊| 2166/2208 [02:06<00:02, 18.12it/s][A
Epoch 5/10:  98%|█████████▊| 2169/2208 [02:06<00:02, 17.74it/s][A
Epoch 5/10:  98%|█████████▊| 2172/2208 [02:06<00:01, 18.15it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10:  99%|█████████▊| 2177/2208 [02:07<00:03,  9.22it/s][A
Epoch 5/10:  99%|█████████▊| 2180/2208 [02:07<00:02, 11.34it/s][A

Batch 2175: Training loss = 0.2960, Training accuracy = 0.9325, F1 = 0.9324



Epoch 5/10:  99%|█████████▉| 2183/2208 [02:07<00:01, 13.31it/s][A
Epoch 5/10:  99%|█████████▉| 2186/2208 [02:07<00:01, 15.11it/s][A
Epoch 5/10:  99%|█████████▉| 2189/2208 [02:07<00:01, 16.63it/s][A
Epoch 5/10:  99%|█████████▉| 2192/2208 [02:07<00:00, 17.79it/s][A
Epoch 5/10:  99%|█████████▉| 2195/2208 [02:08<00:00, 18.74it/s][A
Epoch 5/10: 100%|█████████▉| 2198/2208 [02:08<00:00, 19.38it/s][A
  with torch.cuda.amp.autocast():

Epoch 5/10: 100%|█████████▉| 2204/2208 [02:08<00:00, 12.52it/s][A

Batch 2200: Training loss = 0.2104, Training accuracy = 0.9326, F1 = 0.9325



Epoch 5/10: 100%|█████████▉| 2207/2208 [02:09<00:00, 14.41it/s][A
                                                               [A


Epoch 5 Training Metrics:
Loss: 0.2022
Accuracy: 0.9326
F1 Score: 0.9325
Precision: 0.9325
Recall: 0.9326

Starting validation...



Validation:   0%|          | 0/552 [00:00<?, ?it/s][A
Validation:   0%|          | 1/552 [00:01<14:46,  1.61s/it][A
Validation:   1%|          | 3/552 [00:01<04:19,  2.12it/s][A
Validation:   1%|          | 5/552 [00:01<02:20,  3.89it/s][A
Validation:   1%|▏         | 7/552 [00:01<01:33,  5.84it/s][A
Validation:   2%|▏         | 9/552 [00:02<01:08,  7.92it/s][A
Validation:   2%|▏         | 11/552 [00:02<00:54,  9.95it/s][A
Validation:   2%|▏         | 13/552 [00:02<00:45, 11.85it/s][A
Validation:   3%|▎         | 15/552 [00:02<00:39, 13.45it/s][A
Validation:   3%|▎         | 17/552 [00:02<00:36, 14.73it/s][A
Validation:   3%|▎         | 19/552 [00:02<00:33, 15.80it/s][A
Validation:   4%|▍         | 21/552 [00:02<00:31, 16.68it/s][A
Validation:   4%|▍         | 23/552 [00:02<00:30, 17.27it/s][A
Validation:   5%|▍         | 25/552 [00:02<00:29, 17.68it/s][A
Validation:   5%|▍         | 27/552 [00:03<00:29, 18.02it/s][A
Validation:   5%|▌         | 29/552 [00:03<00:28, 18.


Epoch 5 Validation Metrics:
Loss: 0.1748
Accuracy: 0.9421
F1 Score: 0.9416
Precision: 0.9441
Recall: 0.9421


Training epochs:  50%|█████     | 5/10 [13:25<13:27, 161.46s/it]


Starting epoch 6/10



  with torch.cuda.amp.autocast():

  with torch.cuda.amp.autocast():

Epoch 6/10:   0%|          | 3/2208 [00:01<17:00,  2.16it/s][A

Batch 0: Training loss = 0.1793, Training accuracy = 0.9297, F1 = 0.9245



Epoch 6/10:   0%|          | 5/2208 [00:01<09:13,  3.98it/s][A
Epoch 6/10:   0%|          | 8/2208 [00:01<05:18,  6.91it/s][A
Epoch 6/10:   0%|          | 11/2208 [00:02<03:46,  9.69it/s][A
Epoch 6/10:   1%|          | 14/2208 [00:02<02:59, 12.21it/s][A
Epoch 6/10:   1%|          | 16/2208 [00:02<02:41, 13.59it/s][A
Epoch 6/10:   1%|          | 19/2208 [00:02<02:20, 15.53it/s][A
Epoch 6/10:   1%|          | 21/2208 [00:02<02:29, 14.64it/s][A
Epoch 6/10:   1%|          | 24/2208 [00:02<02:12, 16.44it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:   1%|▏         | 29/2208 [00:03<02:00, 18.13it/s][A

Batch 25: Training loss = 0.0930, Training accuracy = 0.9378, F1 = 0.9374



Epoch 6/10:   1%|▏         | 32/2208 [00:03<01:54, 18.98it/s][A
Epoch 6/10:   2%|▏         | 34/2208 [00:03<01:53, 19.12it/s][A
Epoch 6/10:   2%|▏         | 37/2208 [00:03<01:55, 18.80it/s][A
Epoch 6/10:   2%|▏         | 40/2208 [00:03<01:51, 19.51it/s][A
Epoch 6/10:   2%|▏         | 42/2208 [00:03<01:53, 19.16it/s][A
Epoch 6/10:   2%|▏         | 45/2208 [00:03<01:56, 18.56it/s][A
Epoch 6/10:   2%|▏         | 48/2208 [00:04<01:51, 19.39it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:   2%|▏         | 52/2208 [00:04<01:56, 18.55it/s][A
Epoch 6/10:   2%|▏         | 54/2208 [00:04<01:55, 18.63it/s][A

Batch 50: Training loss = 0.1180, Training accuracy = 0.9404, F1 = 0.9401



Epoch 6/10:   3%|▎         | 57/2208 [00:04<01:50, 19.55it/s][A
Epoch 6/10:   3%|▎         | 60/2208 [00:04<01:46, 20.10it/s][A
Epoch 6/10:   3%|▎         | 63/2208 [00:04<01:45, 20.40it/s][A
Epoch 6/10:   3%|▎         | 66/2208 [00:04<01:51, 19.15it/s][A
Epoch 6/10:   3%|▎         | 68/2208 [00:05<01:55, 18.52it/s][A
Epoch 6/10:   3%|▎         | 71/2208 [00:05<01:50, 19.29it/s][A
Epoch 6/10:   3%|▎         | 73/2208 [00:05<02:01, 17.59it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:   4%|▎         | 79/2208 [00:05<01:55, 18.46it/s][A

Batch 75: Training loss = 0.2456, Training accuracy = 0.9369, F1 = 0.9367



Epoch 6/10:   4%|▎         | 82/2208 [00:05<01:50, 19.24it/s][A
Epoch 6/10:   4%|▍         | 85/2208 [00:05<01:47, 19.72it/s][A
Epoch 6/10:   4%|▍         | 88/2208 [00:06<01:45, 20.02it/s][A
Epoch 6/10:   4%|▍         | 91/2208 [00:06<01:44, 20.17it/s][A
Epoch 6/10:   4%|▍         | 94/2208 [00:06<01:43, 20.45it/s][A
Epoch 6/10:   4%|▍         | 97/2208 [00:06<01:46, 19.89it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:   5%|▍         | 103/2208 [00:07<02:13, 15.76it/s][A
Epoch 6/10:   5%|▍         | 105/2208 [00:07<02:07, 16.54it/s][A

Batch 100: Training loss = 0.2321, Training accuracy = 0.9369, F1 = 0.9368



Epoch 6/10:   5%|▍         | 108/2208 [00:07<01:58, 17.78it/s][A
Epoch 6/10:   5%|▍         | 110/2208 [00:07<01:57, 17.87it/s][A
Epoch 6/10:   5%|▌         | 113/2208 [00:07<01:54, 18.37it/s][A
Epoch 6/10:   5%|▌         | 116/2208 [00:07<01:48, 19.23it/s][A
Epoch 6/10:   5%|▌         | 118/2208 [00:07<01:56, 17.91it/s][A
Epoch 6/10:   5%|▌         | 121/2208 [00:07<01:51, 18.76it/s][A
Epoch 6/10:   6%|▌         | 124/2208 [00:08<01:46, 19.48it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:   6%|▌         | 129/2208 [00:08<01:49, 18.95it/s][A

Batch 125: Training loss = 0.1566, Training accuracy = 0.9374, F1 = 0.9372



Epoch 6/10:   6%|▌         | 132/2208 [00:08<01:45, 19.65it/s][A
Epoch 6/10:   6%|▌         | 134/2208 [00:08<01:52, 18.50it/s][A
Epoch 6/10:   6%|▌         | 136/2208 [00:08<01:50, 18.82it/s][A
Epoch 6/10:   6%|▋         | 139/2208 [00:08<01:46, 19.48it/s][A
Epoch 6/10:   6%|▋         | 142/2208 [00:09<01:43, 20.04it/s][A
Epoch 6/10:   7%|▋         | 145/2208 [00:09<01:47, 19.27it/s][A
Epoch 6/10:   7%|▋         | 148/2208 [00:09<01:44, 19.70it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:   7%|▋         | 152/2208 [00:09<02:11, 15.64it/s][A
Epoch 6/10:   7%|▋         | 155/2208 [00:09<01:59, 17.18it/s][A

Batch 150: Training loss = 0.1664, Training accuracy = 0.9374, F1 = 0.9372



Epoch 6/10:   7%|▋         | 158/2208 [00:09<01:51, 18.45it/s][A
Epoch 6/10:   7%|▋         | 161/2208 [00:10<01:45, 19.33it/s][A
Epoch 6/10:   7%|▋         | 164/2208 [00:10<01:42, 19.94it/s][A
Epoch 6/10:   8%|▊         | 167/2208 [00:10<01:41, 20.16it/s][A
Epoch 6/10:   8%|▊         | 170/2208 [00:10<01:41, 20.05it/s][A
Epoch 6/10:   8%|▊         | 173/2208 [00:10<01:42, 19.76it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:   8%|▊         | 179/2208 [00:10<01:43, 19.53it/s][A

Batch 175: Training loss = 0.1270, Training accuracy = 0.9374, F1 = 0.9372



Epoch 6/10:   8%|▊         | 182/2208 [00:11<01:41, 19.89it/s][A
Epoch 6/10:   8%|▊         | 185/2208 [00:11<01:41, 19.97it/s][A
Epoch 6/10:   9%|▊         | 188/2208 [00:11<01:39, 20.37it/s][A
Epoch 6/10:   9%|▊         | 191/2208 [00:11<01:43, 19.57it/s][A
Epoch 6/10:   9%|▊         | 193/2208 [00:11<01:49, 18.39it/s][A
Epoch 6/10:   9%|▉         | 196/2208 [00:11<01:45, 19.06it/s][A
Epoch 6/10:   9%|▉         | 199/2208 [00:12<01:42, 19.69it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:   9%|▉         | 204/2208 [00:12<01:53, 17.67it/s][A

Batch 200: Training loss = 0.1492, Training accuracy = 0.9365, F1 = 0.9363



Epoch 6/10:   9%|▉         | 207/2208 [00:12<01:46, 18.71it/s][A
Epoch 6/10:  10%|▉         | 210/2208 [00:12<01:43, 19.37it/s][A
Epoch 6/10:  10%|▉         | 213/2208 [00:12<01:45, 18.94it/s][A
Epoch 6/10:  10%|▉         | 216/2208 [00:12<01:41, 19.66it/s][A
Epoch 6/10:  10%|▉         | 218/2208 [00:13<01:49, 18.20it/s][A
Epoch 6/10:  10%|▉         | 220/2208 [00:13<02:00, 16.49it/s][A
Epoch 6/10:  10%|█         | 223/2208 [00:13<01:50, 17.90it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  10%|█         | 227/2208 [00:13<01:59, 16.53it/s][A
Epoch 6/10:  10%|█         | 229/2208 [00:13<01:58, 16.69it/s][A

Batch 225: Training loss = 0.1377, Training accuracy = 0.9371, F1 = 0.9370



Epoch 6/10:  11%|█         | 232/2208 [00:13<01:49, 18.09it/s][A
Epoch 6/10:  11%|█         | 235/2208 [00:14<01:43, 19.03it/s][A
Epoch 6/10:  11%|█         | 238/2208 [00:14<01:40, 19.59it/s][A
Epoch 6/10:  11%|█         | 241/2208 [00:14<01:37, 20.14it/s][A
Epoch 6/10:  11%|█         | 244/2208 [00:14<01:37, 20.05it/s][A
Epoch 6/10:  11%|█         | 247/2208 [00:14<01:35, 20.47it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  11%|█▏        | 252/2208 [00:14<01:47, 18.25it/s][A
Epoch 6/10:  12%|█▏        | 255/2208 [00:15<01:42, 19.09it/s][A

Batch 250: Training loss = 0.2673, Training accuracy = 0.9373, F1 = 0.9372



Epoch 6/10:  12%|█▏        | 257/2208 [00:15<01:41, 19.27it/s][A
Epoch 6/10:  12%|█▏        | 260/2208 [00:15<01:37, 20.02it/s][A
Epoch 6/10:  12%|█▏        | 263/2208 [00:15<01:35, 20.34it/s][A
Epoch 6/10:  12%|█▏        | 266/2208 [00:15<01:34, 20.60it/s][A
Epoch 6/10:  12%|█▏        | 269/2208 [00:15<01:35, 20.38it/s][A
Epoch 6/10:  12%|█▏        | 272/2208 [00:15<01:35, 20.29it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  13%|█▎        | 278/2208 [00:16<01:50, 17.39it/s][A

Batch 275: Training loss = 0.0931, Training accuracy = 0.9372, F1 = 0.9371



Epoch 6/10:  13%|█▎        | 281/2208 [00:16<01:44, 18.46it/s][A
Epoch 6/10:  13%|█▎        | 284/2208 [00:16<01:40, 19.17it/s][A
Epoch 6/10:  13%|█▎        | 287/2208 [00:16<01:37, 19.76it/s][A
Epoch 6/10:  13%|█▎        | 290/2208 [00:16<01:34, 20.22it/s][A
Epoch 6/10:  13%|█▎        | 293/2208 [00:16<01:33, 20.42it/s][A
Epoch 6/10:  13%|█▎        | 296/2208 [00:17<01:33, 20.46it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  14%|█▎        | 302/2208 [00:17<01:42, 18.60it/s][A
Epoch 6/10:  14%|█▍        | 305/2208 [00:17<01:38, 19.30it/s][A

Batch 300: Training loss = 0.1500, Training accuracy = 0.9380, F1 = 0.9378



Epoch 6/10:  14%|█▍        | 308/2208 [00:17<01:36, 19.75it/s][A
Epoch 6/10:  14%|█▍        | 311/2208 [00:17<01:34, 20.12it/s][A
Epoch 6/10:  14%|█▍        | 314/2208 [00:18<01:32, 20.43it/s][A
Epoch 6/10:  14%|█▍        | 317/2208 [00:18<01:31, 20.58it/s][A
Epoch 6/10:  14%|█▍        | 320/2208 [00:18<01:33, 20.21it/s][A
Epoch 6/10:  15%|█▍        | 323/2208 [00:18<01:33, 20.07it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  15%|█▍        | 329/2208 [00:18<01:39, 18.98it/s][A

Batch 325: Training loss = 0.1937, Training accuracy = 0.9387, F1 = 0.9386



Epoch 6/10:  15%|█▌        | 332/2208 [00:18<01:35, 19.65it/s][A
Epoch 6/10:  15%|█▌        | 335/2208 [00:19<01:33, 20.12it/s][A
Epoch 6/10:  15%|█▌        | 338/2208 [00:19<01:44, 17.86it/s][A
Epoch 6/10:  15%|█▌        | 341/2208 [00:19<01:39, 18.80it/s][A
Epoch 6/10:  16%|█▌        | 343/2208 [00:19<01:39, 18.73it/s][A
Epoch 6/10:  16%|█▌        | 346/2208 [00:19<01:35, 19.48it/s][A
Epoch 6/10:  16%|█▌        | 349/2208 [00:19<01:40, 18.44it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  16%|█▌        | 353/2208 [00:20<01:51, 16.69it/s][A

Batch 350: Training loss = 0.1737, Training accuracy = 0.9391, F1 = 0.9389



Epoch 6/10:  16%|█▌        | 356/2208 [00:20<01:42, 18.00it/s][A
Epoch 6/10:  16%|█▋        | 359/2208 [00:20<01:37, 18.93it/s][A
Epoch 6/10:  16%|█▋        | 362/2208 [00:20<01:33, 19.69it/s][A
Epoch 6/10:  17%|█▋        | 365/2208 [00:20<01:34, 19.60it/s][A
Epoch 6/10:  17%|█▋        | 368/2208 [00:20<01:34, 19.40it/s][A
Epoch 6/10:  17%|█▋        | 371/2208 [00:21<01:32, 19.89it/s][A
Epoch 6/10:  17%|█▋        | 373/2208 [00:21<01:39, 18.35it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  17%|█▋        | 379/2208 [00:21<01:42, 17.84it/s][A

Batch 375: Training loss = 0.1481, Training accuracy = 0.9391, F1 = 0.9390



Epoch 6/10:  17%|█▋        | 382/2208 [00:21<01:37, 18.65it/s][A
Epoch 6/10:  17%|█▋        | 385/2208 [00:21<01:35, 19.09it/s][A
Epoch 6/10:  18%|█▊        | 388/2208 [00:21<01:33, 19.53it/s][A
Epoch 6/10:  18%|█▊        | 390/2208 [00:22<01:39, 18.36it/s][A
Epoch 6/10:  18%|█▊        | 393/2208 [00:22<01:47, 16.94it/s][A
Epoch 6/10:  18%|█▊        | 396/2208 [00:22<01:40, 18.07it/s][A
Epoch 6/10:  18%|█▊        | 399/2208 [00:22<01:35, 18.85it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  18%|█▊        | 403/2208 [00:22<01:47, 16.75it/s][A

Batch 400: Training loss = 0.2940, Training accuracy = 0.9394, F1 = 0.9393



Epoch 6/10:  18%|█▊        | 406/2208 [00:23<01:41, 17.78it/s][A
Epoch 6/10:  19%|█▊        | 409/2208 [00:23<01:36, 18.67it/s][A
Epoch 6/10:  19%|█▊        | 412/2208 [00:23<01:32, 19.41it/s][A
Epoch 6/10:  19%|█▉        | 415/2208 [00:23<01:29, 20.04it/s][A
Epoch 6/10:  19%|█▉        | 418/2208 [00:23<01:36, 18.51it/s][A
Epoch 6/10:  19%|█▉        | 421/2208 [00:23<01:37, 18.26it/s][A
Epoch 6/10:  19%|█▉        | 424/2208 [00:23<01:33, 18.99it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  19%|█▉        | 429/2208 [00:24<01:43, 17.14it/s][A

Batch 425: Training loss = 0.2354, Training accuracy = 0.9394, F1 = 0.9393



Epoch 6/10:  20%|█▉        | 432/2208 [00:24<01:36, 18.38it/s][A
Epoch 6/10:  20%|█▉        | 435/2208 [00:24<01:31, 19.29it/s][A
Epoch 6/10:  20%|█▉        | 437/2208 [00:24<01:32, 19.13it/s][A
Epoch 6/10:  20%|█▉        | 440/2208 [00:24<01:29, 19.80it/s][A
Epoch 6/10:  20%|██        | 443/2208 [00:24<01:27, 20.19it/s][A
Epoch 6/10:  20%|██        | 446/2208 [00:25<01:26, 20.44it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  20%|██        | 452/2208 [00:25<01:44, 16.79it/s][A
Epoch 6/10:  21%|██        | 455/2208 [00:25<01:37, 17.97it/s][A

Batch 450: Training loss = 0.2521, Training accuracy = 0.9398, F1 = 0.9397



Epoch 6/10:  21%|██        | 458/2208 [00:25<01:32, 18.90it/s][A
Epoch 6/10:  21%|██        | 461/2208 [00:25<01:29, 19.49it/s][A
Epoch 6/10:  21%|██        | 464/2208 [00:26<01:27, 19.87it/s][A
Epoch 6/10:  21%|██        | 467/2208 [00:26<01:25, 20.35it/s][A
Epoch 6/10:  21%|██▏       | 470/2208 [00:26<01:23, 20.77it/s][A
Epoch 6/10:  21%|██▏       | 473/2208 [00:26<01:23, 20.87it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  22%|██▏       | 479/2208 [00:26<01:32, 18.59it/s][A

Batch 475: Training loss = 0.1770, Training accuracy = 0.9397, F1 = 0.9396



Epoch 6/10:  22%|██▏       | 482/2208 [00:27<01:29, 19.34it/s][A
Epoch 6/10:  22%|██▏       | 485/2208 [00:27<01:27, 19.77it/s][A
Epoch 6/10:  22%|██▏       | 488/2208 [00:27<01:24, 20.28it/s][A
Epoch 6/10:  22%|██▏       | 491/2208 [00:27<01:23, 20.51it/s][A
Epoch 6/10:  22%|██▏       | 494/2208 [00:27<01:22, 20.82it/s][A
Epoch 6/10:  23%|██▎       | 497/2208 [00:27<01:21, 20.99it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  23%|██▎       | 503/2208 [00:28<01:41, 16.81it/s][A

Batch 500: Training loss = 0.2201, Training accuracy = 0.9398, F1 = 0.9397



Epoch 6/10:  23%|██▎       | 506/2208 [00:28<01:34, 17.96it/s][A
Epoch 6/10:  23%|██▎       | 509/2208 [00:28<01:29, 18.88it/s][A
Epoch 6/10:  23%|██▎       | 512/2208 [00:28<01:26, 19.58it/s][A
Epoch 6/10:  23%|██▎       | 515/2208 [00:28<01:24, 20.05it/s][A
Epoch 6/10:  23%|██▎       | 518/2208 [00:28<01:23, 20.31it/s][A
Epoch 6/10:  24%|██▎       | 521/2208 [00:28<01:22, 20.45it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  24%|██▍       | 527/2208 [00:29<01:36, 17.41it/s][A
Epoch 6/10:  24%|██▍       | 530/2208 [00:29<01:31, 18.38it/s][A

Batch 525: Training loss = 0.1657, Training accuracy = 0.9397, F1 = 0.9396



Epoch 6/10:  24%|██▍       | 533/2208 [00:29<01:27, 19.14it/s][A
Epoch 6/10:  24%|██▍       | 536/2208 [00:29<01:24, 19.88it/s][A
Epoch 6/10:  24%|██▍       | 539/2208 [00:29<01:22, 20.30it/s][A
Epoch 6/10:  25%|██▍       | 542/2208 [00:30<01:20, 20.57it/s][A
Epoch 6/10:  25%|██▍       | 545/2208 [00:30<01:20, 20.57it/s][A
Epoch 6/10:  25%|██▍       | 548/2208 [00:30<01:19, 20.78it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  25%|██▌       | 554/2208 [00:30<01:29, 18.43it/s][A

Batch 550: Training loss = 0.2007, Training accuracy = 0.9399, F1 = 0.9398



Epoch 6/10:  25%|██▌       | 557/2208 [00:30<01:25, 19.34it/s][A
Epoch 6/10:  25%|██▌       | 560/2208 [00:30<01:22, 20.03it/s][A
Epoch 6/10:  25%|██▌       | 563/2208 [00:31<01:21, 20.17it/s][A
Epoch 6/10:  26%|██▌       | 566/2208 [00:31<01:19, 20.56it/s][A
Epoch 6/10:  26%|██▌       | 569/2208 [00:31<01:18, 20.80it/s][A
Epoch 6/10:  26%|██▌       | 572/2208 [00:31<01:18, 20.88it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  26%|██▌       | 578/2208 [00:31<01:33, 17.43it/s][A

Batch 575: Training loss = 0.1601, Training accuracy = 0.9400, F1 = 0.9399



Epoch 6/10:  26%|██▋       | 580/2208 [00:32<01:34, 17.23it/s][A
Epoch 6/10:  26%|██▋       | 583/2208 [00:32<01:28, 18.38it/s][A
Epoch 6/10:  27%|██▋       | 586/2208 [00:32<01:24, 19.22it/s][A
Epoch 6/10:  27%|██▋       | 589/2208 [00:32<01:21, 19.75it/s][A
Epoch 6/10:  27%|██▋       | 592/2208 [00:32<01:20, 20.20it/s][A
Epoch 6/10:  27%|██▋       | 595/2208 [00:32<01:18, 20.64it/s][A
Epoch 6/10:  27%|██▋       | 598/2208 [00:32<01:17, 20.86it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  27%|██▋       | 603/2208 [00:33<01:30, 17.73it/s][A

Batch 600: Training loss = 0.2103, Training accuracy = 0.9402, F1 = 0.9401



Epoch 6/10:  27%|██▋       | 606/2208 [00:33<01:25, 18.74it/s][A
Epoch 6/10:  28%|██▊       | 609/2208 [00:33<01:22, 19.50it/s][A
Epoch 6/10:  28%|██▊       | 612/2208 [00:33<01:19, 19.97it/s][A
Epoch 6/10:  28%|██▊       | 615/2208 [00:33<01:18, 20.28it/s][A
Epoch 6/10:  28%|██▊       | 618/2208 [00:33<01:19, 20.04it/s][A
Epoch 6/10:  28%|██▊       | 621/2208 [00:34<01:17, 20.45it/s][A
Epoch 6/10:  28%|██▊       | 624/2208 [00:34<01:20, 19.68it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  28%|██▊       | 629/2208 [00:34<01:42, 15.36it/s][A

Batch 625: Training loss = 0.1445, Training accuracy = 0.9401, F1 = 0.9400



Epoch 6/10:  29%|██▊       | 632/2208 [00:34<01:33, 16.89it/s][A
Epoch 6/10:  29%|██▉       | 635/2208 [00:35<01:26, 18.08it/s][A
Epoch 6/10:  29%|██▉       | 638/2208 [00:35<01:23, 18.88it/s][A
Epoch 6/10:  29%|██▉       | 641/2208 [00:35<01:20, 19.45it/s][A
Epoch 6/10:  29%|██▉       | 644/2208 [00:35<01:18, 19.84it/s][A
Epoch 6/10:  29%|██▉       | 647/2208 [00:35<01:17, 20.16it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  30%|██▉       | 653/2208 [00:35<01:33, 16.58it/s][A

Batch 650: Training loss = 0.1336, Training accuracy = 0.9403, F1 = 0.9402



Epoch 6/10:  30%|██▉       | 656/2208 [00:36<01:27, 17.81it/s][A
Epoch 6/10:  30%|██▉       | 659/2208 [00:36<01:22, 18.69it/s][A
Epoch 6/10:  30%|██▉       | 662/2208 [00:36<01:19, 19.47it/s][A
Epoch 6/10:  30%|███       | 665/2208 [00:36<01:16, 20.06it/s][A
Epoch 6/10:  30%|███       | 668/2208 [00:36<01:15, 20.49it/s][A
Epoch 6/10:  30%|███       | 671/2208 [00:36<01:14, 20.67it/s][A
Epoch 6/10:  31%|███       | 674/2208 [00:36<01:19, 19.28it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  31%|███       | 679/2208 [00:37<01:36, 15.92it/s][A

Batch 675: Training loss = 0.1795, Training accuracy = 0.9406, F1 = 0.9405



Epoch 6/10:  31%|███       | 682/2208 [00:37<01:28, 17.32it/s][A
Epoch 6/10:  31%|███       | 685/2208 [00:37<01:23, 18.27it/s][A
Epoch 6/10:  31%|███       | 688/2208 [00:37<01:19, 19.06it/s][A
Epoch 6/10:  31%|███▏      | 691/2208 [00:37<01:17, 19.54it/s][A
Epoch 6/10:  31%|███▏      | 694/2208 [00:38<01:16, 19.86it/s][A
Epoch 6/10:  32%|███▏      | 697/2208 [00:38<01:14, 20.20it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  32%|███▏      | 702/2208 [00:38<01:46, 14.15it/s][A
Epoch 6/10:  32%|███▏      | 705/2208 [00:38<01:34, 15.87it/s][A

Batch 700: Training loss = 0.1925, Training accuracy = 0.9407, F1 = 0.9407



Epoch 6/10:  32%|███▏      | 708/2208 [00:38<01:27, 17.17it/s][A
Epoch 6/10:  32%|███▏      | 711/2208 [00:39<01:22, 18.21it/s][A
Epoch 6/10:  32%|███▏      | 714/2208 [00:39<01:18, 19.08it/s][A
Epoch 6/10:  32%|███▏      | 717/2208 [00:39<01:16, 19.58it/s][A
Epoch 6/10:  33%|███▎      | 720/2208 [00:39<01:14, 20.04it/s][A
Epoch 6/10:  33%|███▎      | 723/2208 [00:39<01:17, 19.16it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  33%|███▎      | 729/2208 [00:40<01:26, 17.12it/s][A

Batch 725: Training loss = 0.1172, Training accuracy = 0.9406, F1 = 0.9405



Epoch 6/10:  33%|███▎      | 732/2208 [00:40<01:20, 18.29it/s][A
Epoch 6/10:  33%|███▎      | 735/2208 [00:40<01:16, 19.16it/s][A
Epoch 6/10:  33%|███▎      | 738/2208 [00:40<01:14, 19.79it/s][A
Epoch 6/10:  34%|███▎      | 741/2208 [00:40<01:12, 20.31it/s][A
Epoch 6/10:  34%|███▎      | 744/2208 [00:40<01:11, 20.59it/s][A
Epoch 6/10:  34%|███▍      | 747/2208 [00:40<01:10, 20.81it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  34%|███▍      | 753/2208 [00:41<01:27, 16.56it/s][A

Batch 750: Training loss = 0.1619, Training accuracy = 0.9406, F1 = 0.9405



Epoch 6/10:  34%|███▍      | 756/2208 [00:41<01:21, 17.76it/s][A
Epoch 6/10:  34%|███▍      | 759/2208 [00:41<01:17, 18.73it/s][A
Epoch 6/10:  35%|███▍      | 762/2208 [00:41<01:14, 19.39it/s][A
Epoch 6/10:  35%|███▍      | 765/2208 [00:41<01:12, 19.92it/s][A
Epoch 6/10:  35%|███▍      | 768/2208 [00:42<01:11, 20.26it/s][A
Epoch 6/10:  35%|███▍      | 771/2208 [00:42<01:11, 20.13it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  35%|███▌      | 777/2208 [00:42<01:31, 15.69it/s][A
Epoch 6/10:  35%|███▌      | 780/2208 [00:42<01:23, 17.09it/s][A

Batch 775: Training loss = 0.1533, Training accuracy = 0.9407, F1 = 0.9406



Epoch 6/10:  35%|███▌      | 783/2208 [00:42<01:18, 18.06it/s][A
Epoch 6/10:  36%|███▌      | 786/2208 [00:43<01:15, 18.83it/s][A
Epoch 6/10:  36%|███▌      | 789/2208 [00:43<01:12, 19.51it/s][A
Epoch 6/10:  36%|███▌      | 792/2208 [00:43<01:10, 19.99it/s][A
Epoch 6/10:  36%|███▌      | 795/2208 [00:43<01:09, 20.39it/s][A
Epoch 6/10:  36%|███▌      | 798/2208 [00:43<01:08, 20.67it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  36%|███▋      | 804/2208 [00:44<01:20, 17.34it/s][A

Batch 800: Training loss = 0.2396, Training accuracy = 0.9407, F1 = 0.9406



Epoch 6/10:  37%|███▋      | 807/2208 [00:44<01:16, 18.32it/s][A
Epoch 6/10:  37%|███▋      | 810/2208 [00:44<01:12, 19.23it/s][A
Epoch 6/10:  37%|███▋      | 813/2208 [00:44<01:10, 19.74it/s][A
Epoch 6/10:  37%|███▋      | 816/2208 [00:44<01:08, 20.33it/s][A
Epoch 6/10:  37%|███▋      | 819/2208 [00:44<01:07, 20.52it/s][A
Epoch 6/10:  37%|███▋      | 822/2208 [00:44<01:06, 20.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  38%|███▊      | 828/2208 [00:45<01:29, 15.46it/s][A

Batch 825: Training loss = 0.1556, Training accuracy = 0.9408, F1 = 0.9407



Epoch 6/10:  38%|███▊      | 831/2208 [00:45<01:21, 16.89it/s][A
Epoch 6/10:  38%|███▊      | 834/2208 [00:45<01:16, 18.04it/s][A
Epoch 6/10:  38%|███▊      | 837/2208 [00:45<01:12, 18.97it/s][A
Epoch 6/10:  38%|███▊      | 840/2208 [00:45<01:09, 19.54it/s][A
Epoch 6/10:  38%|███▊      | 843/2208 [00:46<01:08, 20.01it/s][A
Epoch 6/10:  38%|███▊      | 846/2208 [00:46<01:06, 20.51it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  39%|███▊      | 852/2208 [00:46<01:25, 15.88it/s][A
Epoch 6/10:  39%|███▊      | 855/2208 [00:46<01:18, 17.23it/s][A

Batch 850: Training loss = 0.1918, Training accuracy = 0.9408, F1 = 0.9407



Epoch 6/10:  39%|███▉      | 858/2208 [00:46<01:14, 18.11it/s][A
Epoch 6/10:  39%|███▉      | 861/2208 [00:47<01:11, 18.96it/s][A
Epoch 6/10:  39%|███▉      | 864/2208 [00:47<01:08, 19.61it/s][A
Epoch 6/10:  39%|███▉      | 867/2208 [00:47<01:06, 20.10it/s][A
Epoch 6/10:  39%|███▉      | 870/2208 [00:47<01:05, 20.44it/s][A
Epoch 6/10:  40%|███▉      | 873/2208 [00:47<01:04, 20.62it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  40%|███▉      | 879/2208 [00:48<01:17, 17.26it/s][A

Batch 875: Training loss = 0.1976, Training accuracy = 0.9409, F1 = 0.9408



Epoch 6/10:  40%|███▉      | 882/2208 [00:48<01:12, 18.36it/s][A
Epoch 6/10:  40%|████      | 885/2208 [00:48<01:09, 19.13it/s][A
Epoch 6/10:  40%|████      | 888/2208 [00:48<01:06, 19.77it/s][A
Epoch 6/10:  40%|████      | 891/2208 [00:48<01:05, 20.05it/s][A
Epoch 6/10:  40%|████      | 894/2208 [00:48<01:04, 20.47it/s][A
Epoch 6/10:  41%|████      | 897/2208 [00:48<01:03, 20.70it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  41%|████      | 903/2208 [00:49<01:24, 15.41it/s][A

Batch 900: Training loss = 0.1600, Training accuracy = 0.9410, F1 = 0.9409



Epoch 6/10:  41%|████      | 906/2208 [00:49<01:17, 16.81it/s][A
Epoch 6/10:  41%|████      | 909/2208 [00:49<01:12, 17.93it/s][A
Epoch 6/10:  41%|████▏     | 912/2208 [00:49<01:09, 18.69it/s][A
Epoch 6/10:  41%|████▏     | 914/2208 [00:49<01:09, 18.60it/s][A
Epoch 6/10:  42%|████▏     | 917/2208 [00:50<01:07, 19.23it/s][A
Epoch 6/10:  42%|████▏     | 920/2208 [00:50<01:05, 19.68it/s][A
Epoch 6/10:  42%|████▏     | 923/2208 [00:50<01:09, 18.59it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  42%|████▏     | 927/2208 [00:50<01:39, 12.90it/s][A
Epoch 6/10:  42%|████▏     | 930/2208 [00:50<01:25, 14.96it/s][A

Batch 925: Training loss = 0.2161, Training accuracy = 0.9410, F1 = 0.9409



Epoch 6/10:  42%|████▏     | 933/2208 [00:51<01:16, 16.58it/s][A
Epoch 6/10:  42%|████▏     | 936/2208 [00:51<01:11, 17.79it/s][A
Epoch 6/10:  43%|████▎     | 939/2208 [00:51<01:08, 18.58it/s][A
Epoch 6/10:  43%|████▎     | 942/2208 [00:51<01:05, 19.29it/s][A
Epoch 6/10:  43%|████▎     | 945/2208 [00:51<01:03, 19.81it/s][A
Epoch 6/10:  43%|████▎     | 948/2208 [00:51<01:02, 20.13it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  43%|████▎     | 954/2208 [00:52<01:19, 15.73it/s][A

Batch 950: Training loss = 0.1815, Training accuracy = 0.9410, F1 = 0.9409



Epoch 6/10:  43%|████▎     | 957/2208 [00:52<01:12, 17.15it/s][A
Epoch 6/10:  43%|████▎     | 960/2208 [00:52<01:08, 18.21it/s][A
Epoch 6/10:  44%|████▎     | 963/2208 [00:52<01:05, 18.89it/s][A
Epoch 6/10:  44%|████▍     | 966/2208 [00:52<01:08, 18.11it/s][A
Epoch 6/10:  44%|████▍     | 968/2208 [00:53<01:07, 18.44it/s][A
Epoch 6/10:  44%|████▍     | 970/2208 [00:53<01:05, 18.79it/s][A
Epoch 6/10:  44%|████▍     | 972/2208 [00:53<01:13, 16.78it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  44%|████▍     | 977/2208 [00:53<01:43, 11.89it/s][A
Epoch 6/10:  44%|████▍     | 980/2208 [00:53<01:26, 14.13it/s][A

Batch 975: Training loss = 0.3496, Training accuracy = 0.9409, F1 = 0.9408



Epoch 6/10:  44%|████▍     | 982/2208 [00:53<01:20, 15.22it/s][A
Epoch 6/10:  45%|████▍     | 985/2208 [00:54<01:12, 16.86it/s][A
Epoch 6/10:  45%|████▍     | 988/2208 [00:54<01:07, 18.06it/s][A
Epoch 6/10:  45%|████▍     | 991/2208 [00:54<01:04, 18.93it/s][A
Epoch 6/10:  45%|████▌     | 994/2208 [00:54<01:01, 19.62it/s][A
Epoch 6/10:  45%|████▌     | 997/2208 [00:54<01:00, 20.17it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  45%|████▌     | 1003/2208 [00:55<01:22, 14.54it/s][A

Batch 1000: Training loss = 0.1631, Training accuracy = 0.9409, F1 = 0.9408



Epoch 6/10:  46%|████▌     | 1006/2208 [00:55<01:14, 16.22it/s][A
Epoch 6/10:  46%|████▌     | 1009/2208 [00:55<01:08, 17.49it/s][A
Epoch 6/10:  46%|████▌     | 1012/2208 [00:55<01:04, 18.51it/s][A
Epoch 6/10:  46%|████▌     | 1015/2208 [00:55<01:01, 19.41it/s][A
Epoch 6/10:  46%|████▌     | 1018/2208 [00:55<00:59, 19.85it/s][A
Epoch 6/10:  46%|████▌     | 1021/2208 [00:56<00:58, 20.16it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  47%|████▋     | 1027/2208 [00:56<01:25, 13.78it/s][A
Epoch 6/10:  47%|████▋     | 1030/2208 [00:56<01:16, 15.48it/s][A

Batch 1025: Training loss = 0.1471, Training accuracy = 0.9410, F1 = 0.9409



Epoch 6/10:  47%|████▋     | 1033/2208 [00:56<01:10, 16.78it/s][A
Epoch 6/10:  47%|████▋     | 1036/2208 [00:56<01:05, 17.91it/s][A
Epoch 6/10:  47%|████▋     | 1039/2208 [00:57<01:02, 18.80it/s][A
Epoch 6/10:  47%|████▋     | 1042/2208 [00:57<01:00, 19.42it/s][A
Epoch 6/10:  47%|████▋     | 1045/2208 [00:57<00:58, 19.96it/s][A
Epoch 6/10:  47%|████▋     | 1048/2208 [00:57<00:57, 20.30it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  48%|████▊     | 1054/2208 [00:58<01:14, 15.54it/s][A

Batch 1050: Training loss = 0.1740, Training accuracy = 0.9411, F1 = 0.9410



Epoch 6/10:  48%|████▊     | 1057/2208 [00:58<01:07, 16.93it/s][A
Epoch 6/10:  48%|████▊     | 1060/2208 [00:58<01:03, 18.09it/s][A
Epoch 6/10:  48%|████▊     | 1063/2208 [00:58<01:00, 18.92it/s][A
Epoch 6/10:  48%|████▊     | 1066/2208 [00:58<00:58, 19.46it/s][A
Epoch 6/10:  48%|████▊     | 1069/2208 [00:58<00:57, 19.89it/s][A
Epoch 6/10:  49%|████▊     | 1072/2208 [00:58<00:56, 20.23it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  49%|████▉     | 1078/2208 [00:59<01:18, 14.43it/s][A

Batch 1075: Training loss = 0.0758, Training accuracy = 0.9411, F1 = 0.9411



Epoch 6/10:  49%|████▉     | 1081/2208 [00:59<01:10, 16.05it/s][A
Epoch 6/10:  49%|████▉     | 1084/2208 [00:59<01:04, 17.41it/s][A
Epoch 6/10:  49%|████▉     | 1087/2208 [00:59<01:00, 18.41it/s][A
Epoch 6/10:  49%|████▉     | 1090/2208 [00:59<00:58, 19.19it/s][A
Epoch 6/10:  50%|████▉     | 1093/2208 [01:00<00:56, 19.68it/s][A
Epoch 6/10:  50%|████▉     | 1096/2208 [01:00<00:55, 20.04it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  50%|████▉     | 1102/2208 [01:00<01:14, 14.76it/s][A
Epoch 6/10:  50%|█████     | 1105/2208 [01:00<01:07, 16.34it/s][A

Batch 1100: Training loss = 0.2661, Training accuracy = 0.9411, F1 = 0.9410



Epoch 6/10:  50%|█████     | 1108/2208 [01:00<01:02, 17.55it/s][A
Epoch 6/10:  50%|█████     | 1111/2208 [01:01<00:59, 18.58it/s][A
Epoch 6/10:  50%|█████     | 1114/2208 [01:01<00:56, 19.28it/s][A
Epoch 6/10:  51%|█████     | 1117/2208 [01:01<00:54, 19.91it/s][A
Epoch 6/10:  51%|█████     | 1120/2208 [01:01<00:53, 20.31it/s][A
Epoch 6/10:  51%|█████     | 1123/2208 [01:01<00:52, 20.57it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  51%|█████     | 1129/2208 [01:02<01:08, 15.84it/s][A

Batch 1125: Training loss = 0.1931, Training accuracy = 0.9412, F1 = 0.9411



Epoch 6/10:  51%|█████▏    | 1132/2208 [01:02<01:02, 17.17it/s][A
Epoch 6/10:  51%|█████▏    | 1135/2208 [01:02<00:58, 18.29it/s][A
Epoch 6/10:  52%|█████▏    | 1138/2208 [01:02<00:56, 18.93it/s][A
Epoch 6/10:  52%|█████▏    | 1141/2208 [01:02<00:54, 19.46it/s][A
Epoch 6/10:  52%|█████▏    | 1144/2208 [01:02<00:53, 19.91it/s][A
Epoch 6/10:  52%|█████▏    | 1147/2208 [01:03<00:52, 20.17it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  52%|█████▏    | 1153/2208 [01:03<01:15, 13.97it/s][A

Batch 1150: Training loss = 0.2213, Training accuracy = 0.9413, F1 = 0.9412



Epoch 6/10:  52%|█████▏    | 1156/2208 [01:03<01:07, 15.62it/s][A
Epoch 6/10:  52%|█████▏    | 1159/2208 [01:03<01:01, 16.94it/s][A
Epoch 6/10:  53%|█████▎    | 1162/2208 [01:03<00:58, 18.03it/s][A
Epoch 6/10:  53%|█████▎    | 1165/2208 [01:04<00:55, 18.91it/s][A
Epoch 6/10:  53%|█████▎    | 1168/2208 [01:04<00:53, 19.30it/s][A
Epoch 6/10:  53%|█████▎    | 1171/2208 [01:04<00:52, 19.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  53%|█████▎    | 1177/2208 [01:04<01:17, 13.28it/s][A
Epoch 6/10:  53%|█████▎    | 1180/2208 [01:05<01:08, 14.97it/s][A

Batch 1175: Training loss = 0.1206, Training accuracy = 0.9413, F1 = 0.9412



Epoch 6/10:  54%|█████▎    | 1183/2208 [01:05<01:02, 16.36it/s][A
Epoch 6/10:  54%|█████▎    | 1186/2208 [01:05<00:58, 17.48it/s][A
Epoch 6/10:  54%|█████▍    | 1189/2208 [01:05<00:55, 18.38it/s][A
Epoch 6/10:  54%|█████▍    | 1192/2208 [01:05<00:53, 19.07it/s][A
Epoch 6/10:  54%|█████▍    | 1195/2208 [01:05<00:52, 19.42it/s][A
Epoch 6/10:  54%|█████▍    | 1198/2208 [01:05<00:51, 19.79it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  55%|█████▍    | 1204/2208 [01:06<01:09, 14.48it/s][A

Batch 1200: Training loss = 0.1524, Training accuracy = 0.9413, F1 = 0.9413



Epoch 6/10:  55%|█████▍    | 1207/2208 [01:06<01:02, 15.94it/s][A
Epoch 6/10:  55%|█████▍    | 1210/2208 [01:06<00:58, 17.20it/s][A
Epoch 6/10:  55%|█████▍    | 1213/2208 [01:06<00:54, 18.18it/s][A
Epoch 6/10:  55%|█████▌    | 1216/2208 [01:07<00:54, 18.25it/s][A
Epoch 6/10:  55%|█████▌    | 1219/2208 [01:07<00:59, 16.51it/s][A
Epoch 6/10:  55%|█████▌    | 1222/2208 [01:07<00:56, 17.61it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  56%|█████▌    | 1227/2208 [01:08<01:22, 11.92it/s][A
Epoch 6/10:  56%|█████▌    | 1230/2208 [01:08<01:10, 13.96it/s][A

Batch 1225: Training loss = 0.2034, Training accuracy = 0.9413, F1 = 0.9412



Epoch 6/10:  56%|█████▌    | 1232/2208 [01:08<01:05, 14.93it/s][A
Epoch 6/10:  56%|█████▌    | 1235/2208 [01:08<00:58, 16.56it/s][A
Epoch 6/10:  56%|█████▌    | 1238/2208 [01:08<00:54, 17.84it/s][A
Epoch 6/10:  56%|█████▌    | 1241/2208 [01:08<00:51, 18.89it/s][A
Epoch 6/10:  56%|█████▋    | 1244/2208 [01:08<00:49, 19.60it/s][A
Epoch 6/10:  56%|█████▋    | 1247/2208 [01:08<00:48, 19.97it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  57%|█████▋    | 1253/2208 [01:09<01:11, 13.31it/s][A

Batch 1250: Training loss = 0.1710, Training accuracy = 0.9414, F1 = 0.9414



Epoch 6/10:  57%|█████▋    | 1256/2208 [01:09<01:03, 15.05it/s][A
Epoch 6/10:  57%|█████▋    | 1259/2208 [01:09<00:57, 16.52it/s][A
Epoch 6/10:  57%|█████▋    | 1262/2208 [01:09<00:53, 17.71it/s][A
Epoch 6/10:  57%|█████▋    | 1265/2208 [01:10<00:50, 18.63it/s][A
Epoch 6/10:  57%|█████▋    | 1268/2208 [01:10<00:48, 19.31it/s][A
Epoch 6/10:  58%|█████▊    | 1271/2208 [01:10<00:47, 19.74it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  58%|█████▊    | 1277/2208 [01:10<01:07, 13.84it/s][A
Epoch 6/10:  58%|█████▊    | 1280/2208 [01:11<00:59, 15.54it/s][A

Batch 1275: Training loss = 0.1995, Training accuracy = 0.9415, F1 = 0.9414



Epoch 6/10:  58%|█████▊    | 1283/2208 [01:11<00:54, 16.93it/s][A
Epoch 6/10:  58%|█████▊    | 1286/2208 [01:11<00:51, 18.05it/s][A
Epoch 6/10:  58%|█████▊    | 1289/2208 [01:11<00:48, 18.96it/s][A
Epoch 6/10:  59%|█████▊    | 1292/2208 [01:11<00:47, 19.48it/s][A
Epoch 6/10:  59%|█████▊    | 1295/2208 [01:11<00:45, 19.94it/s][A
Epoch 6/10:  59%|█████▉    | 1298/2208 [01:11<00:44, 20.33it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  59%|█████▉    | 1304/2208 [01:12<00:59, 15.17it/s][A

Batch 1300: Training loss = 0.1545, Training accuracy = 0.9416, F1 = 0.9415



Epoch 6/10:  59%|█████▉    | 1307/2208 [01:12<00:54, 16.68it/s][A
Epoch 6/10:  59%|█████▉    | 1310/2208 [01:12<00:50, 17.94it/s][A
Epoch 6/10:  59%|█████▉    | 1313/2208 [01:12<00:47, 18.80it/s][A
Epoch 6/10:  60%|█████▉    | 1316/2208 [01:12<00:46, 19.38it/s][A
Epoch 6/10:  60%|█████▉    | 1319/2208 [01:13<00:44, 19.94it/s][A
Epoch 6/10:  60%|█████▉    | 1322/2208 [01:13<00:43, 20.36it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  60%|██████    | 1328/2208 [01:13<01:07, 13.12it/s][A

Batch 1325: Training loss = 0.2069, Training accuracy = 0.9415, F1 = 0.9414



Epoch 6/10:  60%|██████    | 1331/2208 [01:13<00:58, 14.90it/s][A
Epoch 6/10:  60%|██████    | 1334/2208 [01:14<00:53, 16.40it/s][A
Epoch 6/10:  61%|██████    | 1337/2208 [01:14<00:49, 17.61it/s][A
Epoch 6/10:  61%|██████    | 1340/2208 [01:14<00:46, 18.56it/s][A
Epoch 6/10:  61%|██████    | 1343/2208 [01:14<00:44, 19.32it/s][A
Epoch 6/10:  61%|██████    | 1346/2208 [01:14<00:43, 19.80it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  61%|██████    | 1352/2208 [01:15<01:07, 12.61it/s][A
Epoch 6/10:  61%|██████▏   | 1355/2208 [01:15<00:59, 14.45it/s][A

Batch 1350: Training loss = 0.1930, Training accuracy = 0.9415, F1 = 0.9414



Epoch 6/10:  62%|██████▏   | 1358/2208 [01:15<00:53, 16.00it/s][A
Epoch 6/10:  62%|██████▏   | 1361/2208 [01:15<00:49, 17.24it/s][A
Epoch 6/10:  62%|██████▏   | 1364/2208 [01:15<00:46, 18.28it/s][A
Epoch 6/10:  62%|██████▏   | 1367/2208 [01:15<00:44, 19.10it/s][A
Epoch 6/10:  62%|██████▏   | 1370/2208 [01:16<00:42, 19.71it/s][A
Epoch 6/10:  62%|██████▏   | 1373/2208 [01:16<00:41, 20.20it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  62%|██████▏   | 1379/2208 [01:16<00:54, 15.08it/s][A

Batch 1375: Training loss = 0.1806, Training accuracy = 0.9415, F1 = 0.9414



Epoch 6/10:  63%|██████▎   | 1382/2208 [01:16<00:49, 16.56it/s][A
Epoch 6/10:  63%|██████▎   | 1385/2208 [01:17<00:46, 17.66it/s][A
Epoch 6/10:  63%|██████▎   | 1388/2208 [01:17<00:44, 18.62it/s][A
Epoch 6/10:  63%|██████▎   | 1391/2208 [01:17<00:42, 19.19it/s][A
Epoch 6/10:  63%|██████▎   | 1394/2208 [01:17<00:41, 19.73it/s][A
Epoch 6/10:  63%|██████▎   | 1397/2208 [01:17<00:40, 20.17it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  64%|██████▎   | 1403/2208 [01:18<00:59, 13.47it/s][A

Batch 1400: Training loss = 0.1719, Training accuracy = 0.9415, F1 = 0.9414



Epoch 6/10:  64%|██████▎   | 1406/2208 [01:18<00:52, 15.18it/s][A
Epoch 6/10:  64%|██████▍   | 1409/2208 [01:18<00:48, 16.55it/s][A
Epoch 6/10:  64%|██████▍   | 1412/2208 [01:18<00:44, 17.75it/s][A
Epoch 6/10:  64%|██████▍   | 1415/2208 [01:18<00:42, 18.69it/s][A
Epoch 6/10:  64%|██████▍   | 1418/2208 [01:18<00:45, 17.49it/s][A
Epoch 6/10:  64%|██████▍   | 1420/2208 [01:19<00:43, 17.95it/s][A
Epoch 6/10:  64%|██████▍   | 1422/2208 [01:19<00:46, 16.88it/s][A
Epoch 6/10:  64%|██████▍   | 1424/2208 [01:19<00:44, 17.54it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  65%|██████▍   | 1429/2208 [01:19<01:02, 12.42it/s][A

Batch 1425: Training loss = 0.1482, Training accuracy = 0.9416, F1 = 0.9415



Epoch 6/10:  65%|██████▍   | 1432/2208 [01:19<00:53, 14.45it/s][A
Epoch 6/10:  65%|██████▍   | 1435/2208 [01:20<00:48, 16.00it/s][A
Epoch 6/10:  65%|██████▌   | 1438/2208 [01:20<00:44, 17.24it/s][A
Epoch 6/10:  65%|██████▌   | 1441/2208 [01:20<00:42, 18.25it/s][A
Epoch 6/10:  65%|██████▌   | 1444/2208 [01:20<00:40, 19.10it/s][A
Epoch 6/10:  66%|██████▌   | 1447/2208 [01:20<00:39, 19.48it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  66%|██████▌   | 1452/2208 [01:21<01:09, 10.94it/s][A
Epoch 6/10:  66%|██████▌   | 1455/2208 [01:21<00:57, 13.06it/s][A

Batch 1450: Training loss = 0.1552, Training accuracy = 0.9416, F1 = 0.9416



Epoch 6/10:  66%|██████▌   | 1458/2208 [01:21<00:50, 14.81it/s][A
Epoch 6/10:  66%|██████▌   | 1460/2208 [01:21<00:47, 15.75it/s][A
Epoch 6/10:  66%|██████▌   | 1462/2208 [01:21<00:45, 16.57it/s][A
Epoch 6/10:  66%|██████▋   | 1464/2208 [01:21<00:42, 17.35it/s][A
Epoch 6/10:  66%|██████▋   | 1467/2208 [01:22<00:40, 18.49it/s][A
Epoch 6/10:  67%|██████▋   | 1470/2208 [01:22<00:38, 19.32it/s][A
Epoch 6/10:  67%|██████▋   | 1473/2208 [01:22<00:40, 18.37it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  67%|██████▋   | 1479/2208 [01:22<00:52, 13.92it/s][A

Batch 1475: Training loss = 0.1681, Training accuracy = 0.9415, F1 = 0.9414



Epoch 6/10:  67%|██████▋   | 1482/2208 [01:23<00:46, 15.69it/s][A
Epoch 6/10:  67%|██████▋   | 1485/2208 [01:23<00:42, 17.09it/s][A
Epoch 6/10:  67%|██████▋   | 1488/2208 [01:23<00:39, 18.18it/s][A
Epoch 6/10:  68%|██████▊   | 1491/2208 [01:23<00:37, 19.01it/s][A
Epoch 6/10:  68%|██████▊   | 1494/2208 [01:23<00:36, 19.69it/s][A
Epoch 6/10:  68%|██████▊   | 1497/2208 [01:23<00:35, 20.18it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  68%|██████▊   | 1503/2208 [01:24<00:54, 12.90it/s][A

Batch 1500: Training loss = 0.0942, Training accuracy = 0.9417, F1 = 0.9416



Epoch 6/10:  68%|██████▊   | 1506/2208 [01:24<00:47, 14.70it/s][A
Epoch 6/10:  68%|██████▊   | 1509/2208 [01:24<00:42, 16.28it/s][A
Epoch 6/10:  68%|██████▊   | 1512/2208 [01:24<00:39, 17.49it/s][A
Epoch 6/10:  69%|██████▊   | 1515/2208 [01:24<00:37, 18.48it/s][A
Epoch 6/10:  69%|██████▉   | 1518/2208 [01:25<00:35, 19.20it/s][A
Epoch 6/10:  69%|██████▉   | 1521/2208 [01:25<00:34, 19.84it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  69%|██████▉   | 1527/2208 [01:25<00:53, 12.75it/s][A
Epoch 6/10:  69%|██████▉   | 1530/2208 [01:25<00:46, 14.55it/s][A

Batch 1525: Training loss = 0.2128, Training accuracy = 0.9416, F1 = 0.9416



Epoch 6/10:  69%|██████▉   | 1533/2208 [01:26<00:41, 16.12it/s][A
Epoch 6/10:  70%|██████▉   | 1536/2208 [01:26<00:38, 17.43it/s][A
Epoch 6/10:  70%|██████▉   | 1539/2208 [01:26<00:36, 18.44it/s][A
Epoch 6/10:  70%|██████▉   | 1542/2208 [01:26<00:34, 19.20it/s][A
Epoch 6/10:  70%|██████▉   | 1545/2208 [01:26<00:33, 19.71it/s][A
Epoch 6/10:  70%|███████   | 1548/2208 [01:26<00:32, 20.17it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  70%|███████   | 1554/2208 [01:27<00:45, 14.36it/s][A

Batch 1550: Training loss = 0.1441, Training accuracy = 0.9417, F1 = 0.9416



Epoch 6/10:  71%|███████   | 1557/2208 [01:27<00:40, 15.91it/s][A
Epoch 6/10:  71%|███████   | 1560/2208 [01:27<00:37, 17.25it/s][A
Epoch 6/10:  71%|███████   | 1563/2208 [01:27<00:35, 18.30it/s][A
Epoch 6/10:  71%|███████   | 1566/2208 [01:27<00:33, 19.03it/s][A
Epoch 6/10:  71%|███████   | 1569/2208 [01:28<00:32, 19.63it/s][A
Epoch 6/10:  71%|███████   | 1572/2208 [01:28<00:31, 19.96it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  71%|███████▏  | 1578/2208 [01:28<00:49, 12.73it/s][A

Batch 1575: Training loss = 0.1019, Training accuracy = 0.9418, F1 = 0.9417



Epoch 6/10:  72%|███████▏  | 1581/2208 [01:28<00:43, 14.57it/s][A
Epoch 6/10:  72%|███████▏  | 1584/2208 [01:29<00:38, 16.11it/s][A
Epoch 6/10:  72%|███████▏  | 1587/2208 [01:29<00:35, 17.42it/s][A
Epoch 6/10:  72%|███████▏  | 1590/2208 [01:29<00:33, 18.47it/s][A
Epoch 6/10:  72%|███████▏  | 1593/2208 [01:29<00:32, 19.22it/s][A
Epoch 6/10:  72%|███████▏  | 1596/2208 [01:29<00:31, 19.72it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  73%|███████▎  | 1602/2208 [01:30<00:48, 12.46it/s][A
Epoch 6/10:  73%|███████▎  | 1605/2208 [01:30<00:42, 14.30it/s][A

Batch 1600: Training loss = 0.1147, Training accuracy = 0.9418, F1 = 0.9418



Epoch 6/10:  73%|███████▎  | 1608/2208 [01:30<00:37, 15.91it/s][A
Epoch 6/10:  73%|███████▎  | 1611/2208 [01:30<00:34, 17.15it/s][A
Epoch 6/10:  73%|███████▎  | 1614/2208 [01:30<00:32, 18.33it/s][A
Epoch 6/10:  73%|███████▎  | 1617/2208 [01:30<00:30, 19.21it/s][A
Epoch 6/10:  73%|███████▎  | 1620/2208 [01:31<00:29, 19.79it/s][A
Epoch 6/10:  74%|███████▎  | 1623/2208 [01:31<00:28, 20.24it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  74%|███████▍  | 1629/2208 [01:31<00:41, 13.86it/s][A

Batch 1625: Training loss = 0.1488, Training accuracy = 0.9418, F1 = 0.9417



Epoch 6/10:  74%|███████▍  | 1632/2208 [01:31<00:37, 15.52it/s][A
Epoch 6/10:  74%|███████▍  | 1635/2208 [01:32<00:33, 16.92it/s][A
Epoch 6/10:  74%|███████▍  | 1638/2208 [01:32<00:31, 17.96it/s][A
Epoch 6/10:  74%|███████▍  | 1641/2208 [01:32<00:30, 18.75it/s][A
Epoch 6/10:  74%|███████▍  | 1644/2208 [01:32<00:29, 19.33it/s][A
Epoch 6/10:  75%|███████▍  | 1647/2208 [01:32<00:28, 19.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  75%|███████▍  | 1653/2208 [01:33<00:46, 11.88it/s][A

Batch 1650: Training loss = 0.1909, Training accuracy = 0.9418, F1 = 0.9417



Epoch 6/10:  75%|███████▌  | 1656/2208 [01:33<00:40, 13.74it/s][A
Epoch 6/10:  75%|███████▌  | 1659/2208 [01:33<00:35, 15.37it/s][A
Epoch 6/10:  75%|███████▌  | 1662/2208 [01:33<00:32, 16.77it/s][A
Epoch 6/10:  75%|███████▌  | 1665/2208 [01:33<00:30, 17.84it/s][A
Epoch 6/10:  76%|███████▌  | 1668/2208 [01:34<00:28, 18.65it/s][A
Epoch 6/10:  76%|███████▌  | 1671/2208 [01:34<00:27, 19.24it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  76%|███████▌  | 1677/2208 [01:34<00:48, 10.96it/s][A
Epoch 6/10:  76%|███████▌  | 1680/2208 [01:35<00:41, 12.85it/s][A

Batch 1675: Training loss = 0.1469, Training accuracy = 0.9420, F1 = 0.9419



Epoch 6/10:  76%|███████▌  | 1683/2208 [01:35<00:35, 14.63it/s][A
Epoch 6/10:  76%|███████▋  | 1686/2208 [01:35<00:32, 16.23it/s][A
Epoch 6/10:  76%|███████▋  | 1689/2208 [01:35<00:29, 17.48it/s][A
Epoch 6/10:  77%|███████▋  | 1692/2208 [01:35<00:28, 18.41it/s][A
Epoch 6/10:  77%|███████▋  | 1695/2208 [01:35<00:29, 17.21it/s][A
Epoch 6/10:  77%|███████▋  | 1698/2208 [01:35<00:28, 18.19it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  77%|███████▋  | 1702/2208 [01:36<00:50,  9.96it/s][A
Epoch 6/10:  77%|███████▋  | 1705/2208 [01:36<00:41, 12.22it/s][A

Batch 1700: Training loss = 0.2601, Training accuracy = 0.9420, F1 = 0.9419



Epoch 6/10:  77%|███████▋  | 1708/2208 [01:36<00:35, 14.20it/s][A
Epoch 6/10:  77%|███████▋  | 1711/2208 [01:36<00:31, 15.83it/s][A
Epoch 6/10:  78%|███████▊  | 1714/2208 [01:37<00:28, 17.30it/s][A
Epoch 6/10:  78%|███████▊  | 1717/2208 [01:37<00:26, 18.39it/s][A
Epoch 6/10:  78%|███████▊  | 1720/2208 [01:37<00:25, 19.16it/s][A
Epoch 6/10:  78%|███████▊  | 1723/2208 [01:37<00:24, 19.79it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  78%|███████▊  | 1729/2208 [01:38<00:34, 13.91it/s][A

Batch 1725: Training loss = 0.0835, Training accuracy = 0.9419, F1 = 0.9419



Epoch 6/10:  78%|███████▊  | 1732/2208 [01:38<00:30, 15.53it/s][A
Epoch 6/10:  79%|███████▊  | 1735/2208 [01:38<00:27, 16.93it/s][A
Epoch 6/10:  79%|███████▊  | 1738/2208 [01:38<00:26, 17.99it/s][A
Epoch 6/10:  79%|███████▉  | 1741/2208 [01:38<00:24, 18.80it/s][A
Epoch 6/10:  79%|███████▉  | 1744/2208 [01:38<00:23, 19.49it/s][A
Epoch 6/10:  79%|███████▉  | 1747/2208 [01:39<00:23, 19.99it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  79%|███████▉  | 1753/2208 [01:39<00:39, 11.52it/s][A

Batch 1750: Training loss = 0.3099, Training accuracy = 0.9420, F1 = 0.9419



Epoch 6/10:  80%|███████▉  | 1756/2208 [01:39<00:33, 13.41it/s][A
Epoch 6/10:  80%|███████▉  | 1759/2208 [01:39<00:29, 15.06it/s][A
Epoch 6/10:  80%|███████▉  | 1762/2208 [01:40<00:27, 16.48it/s][A
Epoch 6/10:  80%|███████▉  | 1765/2208 [01:40<00:24, 17.74it/s][A
Epoch 6/10:  80%|████████  | 1768/2208 [01:40<00:23, 18.75it/s][A
Epoch 6/10:  80%|████████  | 1771/2208 [01:40<00:22, 19.51it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  80%|████████  | 1777/2208 [01:41<00:35, 12.09it/s][A
Epoch 6/10:  81%|████████  | 1780/2208 [01:41<00:30, 14.00it/s][A

Batch 1775: Training loss = 0.2066, Training accuracy = 0.9420, F1 = 0.9419



Epoch 6/10:  81%|████████  | 1783/2208 [01:41<00:27, 15.64it/s][A
Epoch 6/10:  81%|████████  | 1786/2208 [01:41<00:24, 16.99it/s][A
Epoch 6/10:  81%|████████  | 1789/2208 [01:41<00:23, 18.09it/s][A
Epoch 6/10:  81%|████████  | 1792/2208 [01:41<00:21, 18.96it/s][A
Epoch 6/10:  81%|████████▏ | 1795/2208 [01:41<00:20, 19.73it/s][A
Epoch 6/10:  81%|████████▏ | 1798/2208 [01:42<00:20, 20.21it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  82%|████████▏ | 1804/2208 [01:42<00:29, 13.78it/s][A

Batch 1800: Training loss = 0.0810, Training accuracy = 0.9421, F1 = 0.9420



Epoch 6/10:  82%|████████▏ | 1807/2208 [01:42<00:26, 15.39it/s][A
Epoch 6/10:  82%|████████▏ | 1810/2208 [01:43<00:23, 16.77it/s][A
Epoch 6/10:  82%|████████▏ | 1813/2208 [01:43<00:22, 17.92it/s][A
Epoch 6/10:  82%|████████▏ | 1816/2208 [01:43<00:20, 18.69it/s][A
Epoch 6/10:  82%|████████▏ | 1819/2208 [01:43<00:20, 19.17it/s][A
Epoch 6/10:  83%|████████▎ | 1822/2208 [01:43<00:19, 19.74it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  83%|████████▎ | 1828/2208 [01:44<00:32, 11.61it/s][A

Batch 1825: Training loss = 0.1989, Training accuracy = 0.9421, F1 = 0.9420



Epoch 6/10:  83%|████████▎ | 1831/2208 [01:44<00:28, 13.46it/s][A
Epoch 6/10:  83%|████████▎ | 1834/2208 [01:44<00:24, 15.12it/s][A
Epoch 6/10:  83%|████████▎ | 1837/2208 [01:44<00:22, 16.58it/s][A
Epoch 6/10:  83%|████████▎ | 1840/2208 [01:44<00:20, 17.79it/s][A
Epoch 6/10:  83%|████████▎ | 1843/2208 [01:44<00:19, 18.65it/s][A
Epoch 6/10:  84%|████████▎ | 1846/2208 [01:45<00:18, 19.24it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  84%|████████▍ | 1852/2208 [01:45<00:30, 11.50it/s][A
Epoch 6/10:  84%|████████▍ | 1855/2208 [01:45<00:26, 13.37it/s][A

Batch 1850: Training loss = 0.1713, Training accuracy = 0.9420, F1 = 0.9419



Epoch 6/10:  84%|████████▍ | 1858/2208 [01:46<00:23, 15.06it/s][A
Epoch 6/10:  84%|████████▍ | 1861/2208 [01:46<00:21, 16.51it/s][A
Epoch 6/10:  84%|████████▍ | 1864/2208 [01:46<00:19, 17.66it/s][A
Epoch 6/10:  85%|████████▍ | 1867/2208 [01:46<00:18, 18.68it/s][A
Epoch 6/10:  85%|████████▍ | 1870/2208 [01:46<00:17, 19.24it/s][A
Epoch 6/10:  85%|████████▍ | 1873/2208 [01:46<00:16, 19.75it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  85%|████████▌ | 1879/2208 [01:47<00:26, 12.47it/s][A

Batch 1875: Training loss = 0.1000, Training accuracy = 0.9420, F1 = 0.9420



Epoch 6/10:  85%|████████▌ | 1882/2208 [01:47<00:22, 14.24it/s][A
Epoch 6/10:  85%|████████▌ | 1885/2208 [01:47<00:20, 15.84it/s][A
Epoch 6/10:  86%|████████▌ | 1888/2208 [01:47<00:18, 17.19it/s][A
Epoch 6/10:  86%|████████▌ | 1891/2208 [01:48<00:17, 18.17it/s][A
Epoch 6/10:  86%|████████▌ | 1894/2208 [01:48<00:18, 17.02it/s][A
Epoch 6/10:  86%|████████▌ | 1897/2208 [01:48<00:17, 18.18it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  86%|████████▌ | 1902/2208 [01:49<00:29, 10.37it/s][A
Epoch 6/10:  86%|████████▋ | 1905/2208 [01:49<00:24, 12.50it/s][A

Batch 1900: Training loss = 0.2893, Training accuracy = 0.9420, F1 = 0.9420



Epoch 6/10:  86%|████████▋ | 1908/2208 [01:49<00:20, 14.32it/s][A
Epoch 6/10:  87%|████████▋ | 1911/2208 [01:49<00:18, 15.93it/s][A
Epoch 6/10:  87%|████████▋ | 1914/2208 [01:49<00:17, 17.16it/s][A
Epoch 6/10:  87%|████████▋ | 1917/2208 [01:49<00:16, 18.05it/s][A
Epoch 6/10:  87%|████████▋ | 1920/2208 [01:49<00:15, 18.91it/s][A
Epoch 6/10:  87%|████████▋ | 1923/2208 [01:50<00:14, 19.31it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  87%|████████▋ | 1929/2208 [01:50<00:21, 12.84it/s][A

Batch 1925: Training loss = 0.2148, Training accuracy = 0.9422, F1 = 0.9421



Epoch 6/10:  88%|████████▊ | 1932/2208 [01:50<00:18, 14.58it/s][A
Epoch 6/10:  88%|████████▊ | 1935/2208 [01:50<00:17, 15.97it/s][A
Epoch 6/10:  88%|████████▊ | 1937/2208 [01:51<00:16, 16.69it/s][A
Epoch 6/10:  88%|████████▊ | 1940/2208 [01:51<00:15, 17.78it/s][A
Epoch 6/10:  88%|████████▊ | 1943/2208 [01:51<00:14, 18.65it/s][A
Epoch 6/10:  88%|████████▊ | 1946/2208 [01:51<00:13, 19.37it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  88%|████████▊ | 1952/2208 [01:52<00:22, 11.52it/s][A
Epoch 6/10:  89%|████████▊ | 1955/2208 [01:52<00:18, 13.45it/s][A

Batch 1950: Training loss = 0.1423, Training accuracy = 0.9422, F1 = 0.9422



Epoch 6/10:  89%|████████▊ | 1958/2208 [01:52<00:16, 15.20it/s][A
Epoch 6/10:  89%|████████▉ | 1961/2208 [01:52<00:14, 16.64it/s][A
Epoch 6/10:  89%|████████▉ | 1964/2208 [01:52<00:13, 17.82it/s][A
Epoch 6/10:  89%|████████▉ | 1967/2208 [01:52<00:12, 18.78it/s][A
Epoch 6/10:  89%|████████▉ | 1970/2208 [01:53<00:12, 19.47it/s][A
Epoch 6/10:  89%|████████▉ | 1973/2208 [01:53<00:11, 19.95it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  90%|████████▉ | 1979/2208 [01:53<00:17, 13.35it/s][A

Batch 1975: Training loss = 0.1584, Training accuracy = 0.9423, F1 = 0.9422



Epoch 6/10:  90%|████████▉ | 1982/2208 [01:53<00:14, 15.08it/s][A
Epoch 6/10:  90%|████████▉ | 1985/2208 [01:54<00:13, 16.60it/s][A
Epoch 6/10:  90%|█████████ | 1988/2208 [01:54<00:12, 17.80it/s][A
Epoch 6/10:  90%|█████████ | 1991/2208 [01:54<00:11, 18.68it/s][A
Epoch 6/10:  90%|█████████ | 1994/2208 [01:54<00:10, 19.48it/s][A
Epoch 6/10:  90%|█████████ | 1997/2208 [01:54<00:10, 19.96it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  91%|█████████ | 2003/2208 [01:55<00:18, 11.15it/s][A

Batch 2000: Training loss = 0.1410, Training accuracy = 0.9424, F1 = 0.9423



Epoch 6/10:  91%|█████████ | 2006/2208 [01:55<00:15, 13.05it/s][A
Epoch 6/10:  91%|█████████ | 2009/2208 [01:55<00:13, 14.82it/s][A
Epoch 6/10:  91%|█████████ | 2012/2208 [01:55<00:12, 16.32it/s][A
Epoch 6/10:  91%|█████████▏| 2015/2208 [01:55<00:10, 17.60it/s][A
Epoch 6/10:  91%|█████████▏| 2018/2208 [01:56<00:10, 18.55it/s][A
Epoch 6/10:  92%|█████████▏| 2021/2208 [01:56<00:09, 19.35it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  92%|█████████▏| 2027/2208 [01:56<00:16, 11.28it/s][A
Epoch 6/10:  92%|█████████▏| 2030/2208 [01:56<00:13, 13.22it/s][A

Batch 2025: Training loss = 0.1011, Training accuracy = 0.9425, F1 = 0.9424



Epoch 6/10:  92%|█████████▏| 2033/2208 [01:57<00:11, 14.97it/s][A
Epoch 6/10:  92%|█████████▏| 2036/2208 [01:57<00:10, 16.52it/s][A
Epoch 6/10:  92%|█████████▏| 2039/2208 [01:57<00:09, 17.59it/s][A
Epoch 6/10:  92%|█████████▏| 2042/2208 [01:57<00:08, 18.48it/s][A
Epoch 6/10:  93%|█████████▎| 2045/2208 [01:57<00:08, 19.33it/s][A
Epoch 6/10:  93%|█████████▎| 2048/2208 [01:57<00:08, 19.95it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  93%|█████████▎| 2054/2208 [01:58<00:11, 13.08it/s][A

Batch 2050: Training loss = 0.1441, Training accuracy = 0.9426, F1 = 0.9425



Epoch 6/10:  93%|█████████▎| 2057/2208 [01:58<00:10, 14.86it/s][A
Epoch 6/10:  93%|█████████▎| 2060/2208 [01:58<00:09, 16.32it/s][A
Epoch 6/10:  93%|█████████▎| 2063/2208 [01:58<00:08, 17.51it/s][A
Epoch 6/10:  94%|█████████▎| 2066/2208 [01:59<00:07, 18.49it/s][A
Epoch 6/10:  94%|█████████▎| 2069/2208 [01:59<00:07, 19.23it/s][A
Epoch 6/10:  94%|█████████▍| 2072/2208 [01:59<00:06, 19.79it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  94%|█████████▍| 2078/2208 [02:00<00:11, 11.15it/s][A

Batch 2075: Training loss = 0.0694, Training accuracy = 0.9426, F1 = 0.9425



Epoch 6/10:  94%|█████████▍| 2081/2208 [02:00<00:09, 13.07it/s][A
Epoch 6/10:  94%|█████████▍| 2084/2208 [02:00<00:08, 14.80it/s][A
Epoch 6/10:  95%|█████████▍| 2087/2208 [02:00<00:07, 16.28it/s][A
Epoch 6/10:  95%|█████████▍| 2090/2208 [02:00<00:06, 17.57it/s][A
Epoch 6/10:  95%|█████████▍| 2093/2208 [02:00<00:06, 18.64it/s][A
Epoch 6/10:  95%|█████████▍| 2096/2208 [02:00<00:05, 19.46it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  95%|█████████▌| 2102/2208 [02:01<00:09, 10.90it/s][A
Epoch 6/10:  95%|█████████▌| 2105/2208 [02:01<00:08, 12.83it/s][A

Batch 2100: Training loss = 0.2824, Training accuracy = 0.9426, F1 = 0.9425



Epoch 6/10:  95%|█████████▌| 2108/2208 [02:01<00:06, 14.59it/s][A
Epoch 6/10:  96%|█████████▌| 2110/2208 [02:01<00:06, 15.47it/s][A
Epoch 6/10:  96%|█████████▌| 2112/2208 [02:02<00:05, 16.34it/s][A
Epoch 6/10:  96%|█████████▌| 2115/2208 [02:02<00:05, 17.72it/s][A
Epoch 6/10:  96%|█████████▌| 2118/2208 [02:02<00:04, 18.74it/s][A
Epoch 6/10:  96%|█████████▌| 2121/2208 [02:02<00:05, 17.29it/s][A
Epoch 6/10:  96%|█████████▌| 2123/2208 [02:02<00:05, 16.84it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  96%|█████████▋| 2127/2208 [02:03<00:09,  8.74it/s][A
Epoch 6/10:  96%|█████████▋| 2130/2208 [02:03<00:06, 11.15it/s][A

Batch 2125: Training loss = 0.2640, Training accuracy = 0.9426, F1 = 0.9425



Epoch 6/10:  97%|█████████▋| 2133/2208 [02:03<00:05, 13.35it/s][A
Epoch 6/10:  97%|█████████▋| 2136/2208 [02:03<00:04, 15.23it/s][A
Epoch 6/10:  97%|█████████▋| 2138/2208 [02:03<00:04, 16.14it/s][A
Epoch 6/10:  97%|█████████▋| 2141/2208 [02:04<00:03, 17.60it/s][A
Epoch 6/10:  97%|█████████▋| 2144/2208 [02:04<00:03, 18.49it/s][A
Epoch 6/10:  97%|█████████▋| 2147/2208 [02:04<00:03, 17.66it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  97%|█████████▋| 2152/2208 [02:05<00:06,  9.32it/s][A
Epoch 6/10:  98%|█████████▊| 2155/2208 [02:05<00:04, 11.47it/s][A

Batch 2150: Training loss = 0.1026, Training accuracy = 0.9426, F1 = 0.9426



Epoch 6/10:  98%|█████████▊| 2158/2208 [02:05<00:03, 13.40it/s][A
Epoch 6/10:  98%|█████████▊| 2161/2208 [02:05<00:03, 15.21it/s][A
Epoch 6/10:  98%|█████████▊| 2164/2208 [02:05<00:02, 16.66it/s][A
Epoch 6/10:  98%|█████████▊| 2167/2208 [02:05<00:02, 17.83it/s][A
Epoch 6/10:  98%|█████████▊| 2170/2208 [02:05<00:02, 18.73it/s][A
Epoch 6/10:  98%|█████████▊| 2173/2208 [02:06<00:01, 19.27it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10:  99%|█████████▊| 2179/2208 [02:06<00:02, 12.68it/s][A

Batch 2175: Training loss = 0.1986, Training accuracy = 0.9427, F1 = 0.9426



Epoch 6/10:  99%|█████████▉| 2182/2208 [02:06<00:01, 14.48it/s][A
Epoch 6/10:  99%|█████████▉| 2185/2208 [02:07<00:01, 16.12it/s][A
Epoch 6/10:  99%|█████████▉| 2188/2208 [02:07<00:01, 17.41it/s][A
Epoch 6/10:  99%|█████████▉| 2191/2208 [02:07<00:00, 18.43it/s][A
Epoch 6/10:  99%|█████████▉| 2194/2208 [02:07<00:00, 19.16it/s][A
Epoch 6/10: 100%|█████████▉| 2197/2208 [02:07<00:00, 19.85it/s][A
  with torch.cuda.amp.autocast():

Epoch 6/10: 100%|█████████▉| 2203/2208 [02:08<00:00, 11.16it/s][A

Batch 2200: Training loss = 0.1591, Training accuracy = 0.9428, F1 = 0.9427



Epoch 6/10: 100%|█████████▉| 2206/2208 [02:08<00:00, 13.12it/s][A
                                                               [A


Epoch 6 Training Metrics:
Loss: 0.1732
Accuracy: 0.9427
F1 Score: 0.9427
Precision: 0.9426
Recall: 0.9427

Starting validation...



Validation:   0%|          | 0/552 [00:00<?, ?it/s][A
Validation:   0%|          | 1/552 [00:01<15:19,  1.67s/it][A
Validation:   1%|          | 3/552 [00:01<04:24,  2.08it/s][A
Validation:   1%|          | 5/552 [00:01<02:27,  3.71it/s][A
Validation:   1%|▏         | 7/552 [00:02<01:36,  5.63it/s][A
Validation:   2%|▏         | 9/552 [00:02<01:11,  7.64it/s][A
Validation:   2%|▏         | 11/552 [00:02<00:55,  9.67it/s][A
Validation:   2%|▏         | 13/552 [00:02<00:46, 11.57it/s][A
Validation:   3%|▎         | 15/552 [00:02<00:40, 13.23it/s][A
Validation:   3%|▎         | 17/552 [00:02<00:36, 14.65it/s][A
Validation:   3%|▎         | 19/552 [00:02<00:33, 15.80it/s][A
Validation:   4%|▍         | 21/552 [00:02<00:32, 16.54it/s][A
Validation:   4%|▍         | 23/552 [00:02<00:30, 17.30it/s][A
Validation:   5%|▍         | 25/552 [00:02<00:29, 17.81it/s][A
Validation:   5%|▍         | 27/552 [00:03<00:28, 18.17it/s][A
Validation:   5%|▌         | 29/552 [00:03<00:28, 18.


Epoch 6 Validation Metrics:
Loss: 0.1558
Accuracy: 0.9492
F1 Score: 0.9491
Precision: 0.9511
Recall: 0.9492


Training epochs:  60%|██████    | 6/10 [16:07<10:45, 161.45s/it]


Starting epoch 7/10



  with torch.cuda.amp.autocast():

  with torch.cuda.amp.autocast():

Epoch 7/10:   0%|          | 3/2208 [00:01<16:51,  2.18it/s][A

Batch 0: Training loss = 0.2283, Training accuracy = 0.9375, F1 = 0.9349



Epoch 7/10:   0%|          | 5/2208 [00:01<09:08,  4.02it/s][A
Epoch 7/10:   0%|          | 8/2208 [00:01<05:13,  7.01it/s][A
Epoch 7/10:   0%|          | 11/2208 [00:02<03:43,  9.82it/s][A
Epoch 7/10:   1%|          | 14/2208 [00:02<03:09, 11.57it/s][A
Epoch 7/10:   1%|          | 17/2208 [00:02<02:38, 13.82it/s][A
Epoch 7/10:   1%|          | 20/2208 [00:02<02:19, 15.67it/s][A
Epoch 7/10:   1%|          | 23/2208 [00:02<02:07, 17.18it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:   1%|▏         | 29/2208 [00:03<01:56, 18.70it/s][A

Batch 25: Training loss = 0.1746, Training accuracy = 0.9474, F1 = 0.9471



Epoch 7/10:   1%|▏         | 32/2208 [00:03<01:52, 19.27it/s][A
Epoch 7/10:   2%|▏         | 35/2208 [00:03<01:50, 19.73it/s][A
Epoch 7/10:   2%|▏         | 38/2208 [00:03<02:07, 16.97it/s][A
Epoch 7/10:   2%|▏         | 41/2208 [00:03<01:59, 18.18it/s][A
Epoch 7/10:   2%|▏         | 44/2208 [00:03<01:54, 18.97it/s][A
Epoch 7/10:   2%|▏         | 46/2208 [00:03<02:08, 16.78it/s][A
Epoch 7/10:   2%|▏         | 49/2208 [00:04<01:59, 18.04it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:   2%|▏         | 53/2208 [00:04<02:00, 17.86it/s][A

Batch 50: Training loss = 0.1092, Training accuracy = 0.9488, F1 = 0.9488



Epoch 7/10:   3%|▎         | 56/2208 [00:04<01:54, 18.72it/s][A
Epoch 7/10:   3%|▎         | 59/2208 [00:04<01:50, 19.44it/s][A
Epoch 7/10:   3%|▎         | 61/2208 [00:04<01:52, 19.01it/s][A
Epoch 7/10:   3%|▎         | 64/2208 [00:04<01:49, 19.56it/s][A
Epoch 7/10:   3%|▎         | 66/2208 [00:05<01:55, 18.50it/s][A
Epoch 7/10:   3%|▎         | 69/2208 [00:05<02:00, 17.72it/s][A
Epoch 7/10:   3%|▎         | 71/2208 [00:05<01:57, 18.22it/s][A
Epoch 7/10:   3%|▎         | 73/2208 [00:05<02:19, 15.30it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:   4%|▎         | 79/2208 [00:05<01:58, 17.93it/s][A

Batch 75: Training loss = 0.2531, Training accuracy = 0.9491, F1 = 0.9490



Epoch 7/10:   4%|▎         | 82/2208 [00:05<01:52, 18.88it/s][A
Epoch 7/10:   4%|▍         | 85/2208 [00:06<01:48, 19.62it/s][A
Epoch 7/10:   4%|▍         | 88/2208 [00:06<01:45, 20.00it/s][A
Epoch 7/10:   4%|▍         | 91/2208 [00:06<01:58, 17.83it/s][A
Epoch 7/10:   4%|▍         | 94/2208 [00:06<01:53, 18.63it/s][A
Epoch 7/10:   4%|▍         | 97/2208 [00:06<01:49, 19.32it/s][A
Epoch 7/10:   4%|▍         | 99/2208 [00:06<01:50, 19.10it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:   5%|▍         | 103/2208 [00:07<02:00, 17.49it/s][A

Batch 100: Training loss = 0.1785, Training accuracy = 0.9483, F1 = 0.9483



Epoch 7/10:   5%|▍         | 106/2208 [00:07<01:52, 18.61it/s][A
Epoch 7/10:   5%|▍         | 108/2208 [00:07<02:11, 15.94it/s][A
Epoch 7/10:   5%|▌         | 111/2208 [00:07<02:00, 17.46it/s][A
Epoch 7/10:   5%|▌         | 114/2208 [00:07<01:52, 18.55it/s][A
Epoch 7/10:   5%|▌         | 116/2208 [00:07<01:54, 18.21it/s][A
Epoch 7/10:   5%|▌         | 119/2208 [00:07<01:57, 17.77it/s][A
Epoch 7/10:   6%|▌         | 122/2208 [00:08<01:50, 18.89it/s][A
Epoch 7/10:   6%|▌         | 124/2208 [00:08<01:50, 18.90it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:   6%|▌         | 129/2208 [00:08<01:48, 19.11it/s][A

Batch 125: Training loss = 0.1339, Training accuracy = 0.9492, F1 = 0.9491



Epoch 7/10:   6%|▌         | 132/2208 [00:08<01:44, 19.85it/s][A
Epoch 7/10:   6%|▌         | 135/2208 [00:08<01:42, 20.18it/s][A
Epoch 7/10:   6%|▋         | 138/2208 [00:08<01:41, 20.47it/s][A
Epoch 7/10:   6%|▋         | 141/2208 [00:09<01:40, 20.54it/s][A
Epoch 7/10:   7%|▋         | 144/2208 [00:09<01:39, 20.64it/s][A
Epoch 7/10:   7%|▋         | 147/2208 [00:09<01:40, 20.51it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:   7%|▋         | 153/2208 [00:09<01:45, 19.50it/s][A

Batch 150: Training loss = 0.0809, Training accuracy = 0.9487, F1 = 0.9486



Epoch 7/10:   7%|▋         | 156/2208 [00:09<01:42, 19.93it/s][A
Epoch 7/10:   7%|▋         | 159/2208 [00:09<01:47, 19.12it/s][A
Epoch 7/10:   7%|▋         | 162/2208 [00:10<01:46, 19.26it/s][A
Epoch 7/10:   7%|▋         | 165/2208 [00:10<01:43, 19.69it/s][A
Epoch 7/10:   8%|▊         | 167/2208 [00:10<01:56, 17.55it/s][A
Epoch 7/10:   8%|▊         | 169/2208 [00:10<01:53, 17.98it/s][A
Epoch 7/10:   8%|▊         | 171/2208 [00:10<01:54, 17.80it/s][A
Epoch 7/10:   8%|▊         | 174/2208 [00:10<01:47, 18.84it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:   8%|▊         | 178/2208 [00:11<02:02, 16.58it/s][A

Batch 175: Training loss = 0.1108, Training accuracy = 0.9487, F1 = 0.9486



Epoch 7/10:   8%|▊         | 181/2208 [00:11<01:52, 18.04it/s][A
Epoch 7/10:   8%|▊         | 184/2208 [00:11<01:46, 19.09it/s][A
Epoch 7/10:   8%|▊         | 187/2208 [00:11<01:42, 19.66it/s][A
Epoch 7/10:   9%|▊         | 189/2208 [00:11<01:42, 19.70it/s][A
Epoch 7/10:   9%|▊         | 191/2208 [00:11<01:42, 19.67it/s][A
Epoch 7/10:   9%|▉         | 194/2208 [00:11<01:43, 19.37it/s][A
Epoch 7/10:   9%|▉         | 197/2208 [00:11<01:40, 19.98it/s][A
Epoch 7/10:   9%|▉         | 199/2208 [00:12<01:42, 19.58it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:   9%|▉         | 204/2208 [00:12<01:49, 18.24it/s][A

Batch 200: Training loss = 0.1721, Training accuracy = 0.9490, F1 = 0.9489



Epoch 7/10:   9%|▉         | 207/2208 [00:12<01:44, 19.23it/s][A
Epoch 7/10:  10%|▉         | 210/2208 [00:12<01:43, 19.38it/s][A
Epoch 7/10:  10%|▉         | 213/2208 [00:12<01:40, 19.91it/s][A
Epoch 7/10:  10%|▉         | 216/2208 [00:12<01:38, 20.16it/s][A
Epoch 7/10:  10%|▉         | 219/2208 [00:13<01:37, 20.36it/s][A
Epoch 7/10:  10%|█         | 222/2208 [00:13<01:44, 18.99it/s][A
Epoch 7/10:  10%|█         | 224/2208 [00:13<01:43, 19.21it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  10%|█         | 229/2208 [00:13<01:49, 18.05it/s][A

Batch 225: Training loss = 0.2022, Training accuracy = 0.9487, F1 = 0.9486



Epoch 7/10:  10%|█         | 231/2208 [00:13<01:46, 18.49it/s][A
Epoch 7/10:  11%|█         | 234/2208 [00:13<01:42, 19.31it/s][A
Epoch 7/10:  11%|█         | 237/2208 [00:14<01:39, 19.82it/s][A
Epoch 7/10:  11%|█         | 240/2208 [00:14<01:37, 20.18it/s][A
Epoch 7/10:  11%|█         | 243/2208 [00:14<01:36, 20.39it/s][A
Epoch 7/10:  11%|█         | 246/2208 [00:14<01:35, 20.59it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  11%|█▏        | 252/2208 [00:14<01:49, 17.93it/s][A
Epoch 7/10:  12%|█▏        | 255/2208 [00:15<01:43, 18.91it/s][A

Batch 250: Training loss = 0.1493, Training accuracy = 0.9488, F1 = 0.9487



Epoch 7/10:  12%|█▏        | 258/2208 [00:15<01:39, 19.68it/s][A
Epoch 7/10:  12%|█▏        | 261/2208 [00:15<01:36, 20.08it/s][A
Epoch 7/10:  12%|█▏        | 264/2208 [00:15<01:38, 19.77it/s][A
Epoch 7/10:  12%|█▏        | 267/2208 [00:15<01:36, 20.03it/s][A
Epoch 7/10:  12%|█▏        | 270/2208 [00:15<01:38, 19.65it/s][A
Epoch 7/10:  12%|█▏        | 272/2208 [00:15<01:40, 19.35it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  13%|█▎        | 277/2208 [00:16<01:56, 16.64it/s][A
Epoch 7/10:  13%|█▎        | 280/2208 [00:16<01:47, 17.95it/s][A

Batch 275: Training loss = 0.1653, Training accuracy = 0.9495, F1 = 0.9495



Epoch 7/10:  13%|█▎        | 283/2208 [00:16<01:41, 18.89it/s][A
Epoch 7/10:  13%|█▎        | 286/2208 [00:16<01:38, 19.60it/s][A
Epoch 7/10:  13%|█▎        | 288/2208 [00:16<01:37, 19.60it/s][A
Epoch 7/10:  13%|█▎        | 291/2208 [00:16<01:35, 20.04it/s][A
Epoch 7/10:  13%|█▎        | 294/2208 [00:17<01:34, 20.27it/s][A
Epoch 7/10:  13%|█▎        | 297/2208 [00:17<01:33, 20.54it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  14%|█▎        | 303/2208 [00:17<01:48, 17.54it/s][A

Batch 300: Training loss = 0.2472, Training accuracy = 0.9496, F1 = 0.9496



Epoch 7/10:  14%|█▍        | 306/2208 [00:17<01:42, 18.55it/s][A
Epoch 7/10:  14%|█▍        | 309/2208 [00:17<01:38, 19.28it/s][A
Epoch 7/10:  14%|█▍        | 312/2208 [00:17<01:36, 19.71it/s][A
Epoch 7/10:  14%|█▍        | 315/2208 [00:18<01:34, 20.10it/s][A
Epoch 7/10:  14%|█▍        | 318/2208 [00:18<01:32, 20.46it/s][A
Epoch 7/10:  15%|█▍        | 321/2208 [00:18<01:31, 20.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  15%|█▍        | 327/2208 [00:18<01:59, 15.68it/s][A
Epoch 7/10:  15%|█▍        | 330/2208 [00:18<01:50, 17.02it/s][A

Batch 325: Training loss = 0.1198, Training accuracy = 0.9499, F1 = 0.9498



Epoch 7/10:  15%|█▌        | 332/2208 [00:19<01:46, 17.57it/s][A
Epoch 7/10:  15%|█▌        | 335/2208 [00:19<01:41, 18.50it/s][A
Epoch 7/10:  15%|█▌        | 338/2208 [00:19<01:37, 19.26it/s][A
Epoch 7/10:  15%|█▌        | 341/2208 [00:19<01:34, 19.83it/s][A
Epoch 7/10:  16%|█▌        | 344/2208 [00:19<01:33, 19.98it/s][A
Epoch 7/10:  16%|█▌        | 347/2208 [00:19<01:31, 20.27it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  16%|█▌        | 353/2208 [00:20<01:46, 17.46it/s][A

Batch 350: Training loss = 0.1592, Training accuracy = 0.9499, F1 = 0.9498



Epoch 7/10:  16%|█▌        | 356/2208 [00:20<01:40, 18.43it/s][A
Epoch 7/10:  16%|█▋        | 359/2208 [00:20<01:36, 19.13it/s][A
Epoch 7/10:  16%|█▋        | 361/2208 [00:20<01:35, 19.25it/s][A
Epoch 7/10:  16%|█▋        | 364/2208 [00:20<01:33, 19.75it/s][A
Epoch 7/10:  17%|█▋        | 367/2208 [00:20<01:32, 19.96it/s][A
Epoch 7/10:  17%|█▋        | 370/2208 [00:20<01:34, 19.37it/s][A
Epoch 7/10:  17%|█▋        | 373/2208 [00:21<01:37, 18.85it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  17%|█▋        | 379/2208 [00:21<01:44, 17.58it/s][A

Batch 375: Training loss = 0.2425, Training accuracy = 0.9494, F1 = 0.9493



Epoch 7/10:  17%|█▋        | 382/2208 [00:21<01:38, 18.57it/s][A
Epoch 7/10:  17%|█▋        | 384/2208 [00:21<01:40, 18.15it/s][A
Epoch 7/10:  17%|█▋        | 386/2208 [00:21<01:40, 18.16it/s][A
Epoch 7/10:  18%|█▊        | 388/2208 [00:22<01:41, 18.02it/s][A
Epoch 7/10:  18%|█▊        | 390/2208 [00:22<01:39, 18.20it/s][A
Epoch 7/10:  18%|█▊        | 392/2208 [00:22<01:42, 17.76it/s][A
Epoch 7/10:  18%|█▊        | 395/2208 [00:22<01:36, 18.83it/s][A
Epoch 7/10:  18%|█▊        | 397/2208 [00:22<01:52, 16.11it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  18%|█▊        | 402/2208 [00:22<02:01, 14.92it/s][A
Epoch 7/10:  18%|█▊        | 405/2208 [00:23<01:47, 16.70it/s][A

Batch 400: Training loss = 0.1405, Training accuracy = 0.9494, F1 = 0.9494



Epoch 7/10:  18%|█▊        | 408/2208 [00:23<01:40, 17.92it/s][A
Epoch 7/10:  19%|█▊        | 411/2208 [00:23<01:35, 18.82it/s][A
Epoch 7/10:  19%|█▉        | 414/2208 [00:23<01:31, 19.60it/s][A
Epoch 7/10:  19%|█▉        | 416/2208 [00:23<01:35, 18.71it/s][A
Epoch 7/10:  19%|█▉        | 419/2208 [00:23<01:31, 19.46it/s][A
Epoch 7/10:  19%|█▉        | 422/2208 [00:23<01:29, 19.92it/s][A
Epoch 7/10:  19%|█▉        | 424/2208 [00:24<01:32, 19.23it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  19%|█▉        | 429/2208 [00:24<01:38, 18.00it/s][A

Batch 425: Training loss = 0.3588, Training accuracy = 0.9496, F1 = 0.9495



Epoch 7/10:  20%|█▉        | 432/2208 [00:24<01:33, 19.04it/s][A
Epoch 7/10:  20%|█▉        | 434/2208 [00:24<01:32, 19.24it/s][A
Epoch 7/10:  20%|█▉        | 437/2208 [00:24<01:29, 19.77it/s][A
Epoch 7/10:  20%|█▉        | 439/2208 [00:24<01:34, 18.79it/s][A
Epoch 7/10:  20%|██        | 442/2208 [00:24<01:29, 19.66it/s][A
Epoch 7/10:  20%|██        | 444/2208 [00:25<01:34, 18.66it/s][A
Epoch 7/10:  20%|██        | 447/2208 [00:25<01:30, 19.43it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  20%|██        | 452/2208 [00:25<01:50, 15.90it/s][A
Epoch 7/10:  21%|██        | 455/2208 [00:25<01:40, 17.40it/s][A

Batch 450: Training loss = 0.1759, Training accuracy = 0.9497, F1 = 0.9497



Epoch 7/10:  21%|██        | 458/2208 [00:25<01:34, 18.46it/s][A
Epoch 7/10:  21%|██        | 461/2208 [00:26<01:31, 19.14it/s][A
Epoch 7/10:  21%|██        | 464/2208 [00:26<01:28, 19.81it/s][A
Epoch 7/10:  21%|██        | 467/2208 [00:26<01:26, 20.14it/s][A
Epoch 7/10:  21%|██▏       | 470/2208 [00:26<01:24, 20.46it/s][A
Epoch 7/10:  21%|██▏       | 473/2208 [00:26<01:23, 20.77it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  22%|██▏       | 479/2208 [00:26<01:32, 18.65it/s][A

Batch 475: Training loss = 0.0898, Training accuracy = 0.9499, F1 = 0.9498



Epoch 7/10:  22%|██▏       | 482/2208 [00:27<01:28, 19.40it/s][A
Epoch 7/10:  22%|██▏       | 485/2208 [00:27<01:26, 19.93it/s][A
Epoch 7/10:  22%|██▏       | 488/2208 [00:27<01:24, 20.27it/s][A
Epoch 7/10:  22%|██▏       | 491/2208 [00:27<01:23, 20.67it/s][A
Epoch 7/10:  22%|██▏       | 494/2208 [00:27<01:21, 20.97it/s][A
Epoch 7/10:  23%|██▎       | 497/2208 [00:27<01:21, 21.12it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  23%|██▎       | 503/2208 [00:28<01:43, 16.53it/s][A

Batch 500: Training loss = 0.1613, Training accuracy = 0.9501, F1 = 0.9500



Epoch 7/10:  23%|██▎       | 506/2208 [00:28<01:35, 17.82it/s][A
Epoch 7/10:  23%|██▎       | 509/2208 [00:28<01:30, 18.68it/s][A
Epoch 7/10:  23%|██▎       | 512/2208 [00:28<01:28, 19.26it/s][A
Epoch 7/10:  23%|██▎       | 515/2208 [00:28<01:24, 19.92it/s][A
Epoch 7/10:  23%|██▎       | 518/2208 [00:28<01:23, 20.31it/s][A
Epoch 7/10:  24%|██▎       | 521/2208 [00:29<01:21, 20.59it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  24%|██▍       | 527/2208 [00:29<01:37, 17.24it/s][A
Epoch 7/10:  24%|██▍       | 530/2208 [00:29<01:31, 18.35it/s][A

Batch 525: Training loss = 0.0618, Training accuracy = 0.9498, F1 = 0.9497



Epoch 7/10:  24%|██▍       | 533/2208 [00:29<01:27, 19.23it/s][A
Epoch 7/10:  24%|██▍       | 536/2208 [00:29<01:24, 19.80it/s][A
Epoch 7/10:  24%|██▍       | 539/2208 [00:29<01:22, 20.22it/s][A
Epoch 7/10:  25%|██▍       | 542/2208 [00:30<01:21, 20.52it/s][A
Epoch 7/10:  25%|██▍       | 545/2208 [00:30<01:20, 20.76it/s][A
Epoch 7/10:  25%|██▍       | 548/2208 [00:30<01:19, 20.80it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  25%|██▌       | 554/2208 [00:30<01:30, 18.26it/s][A

Batch 550: Training loss = 0.1695, Training accuracy = 0.9497, F1 = 0.9497



Epoch 7/10:  25%|██▌       | 557/2208 [00:30<01:26, 19.14it/s][A
Epoch 7/10:  25%|██▌       | 559/2208 [00:31<01:25, 19.31it/s][A
Epoch 7/10:  25%|██▌       | 562/2208 [00:31<01:22, 19.86it/s][A
Epoch 7/10:  26%|██▌       | 565/2208 [00:31<01:20, 20.41it/s][A
Epoch 7/10:  26%|██▌       | 568/2208 [00:31<01:19, 20.63it/s][A
Epoch 7/10:  26%|██▌       | 571/2208 [00:31<01:19, 20.71it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  26%|██▌       | 577/2208 [00:32<01:39, 16.46it/s][A
Epoch 7/10:  26%|██▋       | 580/2208 [00:32<01:31, 17.70it/s][A

Batch 575: Training loss = 0.1064, Training accuracy = 0.9496, F1 = 0.9495



Epoch 7/10:  26%|██▋       | 583/2208 [00:32<01:27, 18.56it/s][A
Epoch 7/10:  27%|██▋       | 586/2208 [00:32<01:24, 19.31it/s][A
Epoch 7/10:  27%|██▋       | 589/2208 [00:32<01:21, 19.83it/s][A
Epoch 7/10:  27%|██▋       | 592/2208 [00:32<01:19, 20.23it/s][A
Epoch 7/10:  27%|██▋       | 595/2208 [00:32<01:19, 20.33it/s][A
Epoch 7/10:  27%|██▋       | 598/2208 [00:33<01:18, 20.60it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  27%|██▋       | 604/2208 [00:33<01:36, 16.63it/s][A

Batch 600: Training loss = 0.2890, Training accuracy = 0.9497, F1 = 0.9497



Epoch 7/10:  27%|██▋       | 607/2208 [00:33<01:29, 17.83it/s][A
Epoch 7/10:  28%|██▊       | 610/2208 [00:33<01:24, 18.83it/s][A
Epoch 7/10:  28%|██▊       | 613/2208 [00:33<01:21, 19.47it/s][A
Epoch 7/10:  28%|██▊       | 616/2208 [00:34<01:19, 20.01it/s][A
Epoch 7/10:  28%|██▊       | 619/2208 [00:34<01:29, 17.70it/s][A
Epoch 7/10:  28%|██▊       | 622/2208 [00:34<01:25, 18.56it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  28%|██▊       | 627/2208 [00:34<01:45, 14.95it/s][A
Epoch 7/10:  29%|██▊       | 630/2208 [00:34<01:36, 16.44it/s][A

Batch 625: Training loss = 0.1414, Training accuracy = 0.9496, F1 = 0.9495



Epoch 7/10:  29%|██▊       | 633/2208 [00:35<01:30, 17.32it/s][A
Epoch 7/10:  29%|██▉       | 636/2208 [00:35<01:25, 18.30it/s][A
Epoch 7/10:  29%|██▉       | 638/2208 [00:35<01:32, 16.93it/s][A
Epoch 7/10:  29%|██▉       | 641/2208 [00:35<01:26, 18.08it/s][A
Epoch 7/10:  29%|██▉       | 644/2208 [00:35<01:22, 18.94it/s][A
Epoch 7/10:  29%|██▉       | 646/2208 [00:35<01:21, 19.13it/s][A
Epoch 7/10:  29%|██▉       | 648/2208 [00:35<01:20, 19.33it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  30%|██▉       | 652/2208 [00:36<01:59, 12.99it/s][A
Epoch 7/10:  30%|██▉       | 655/2208 [00:36<01:41, 15.29it/s][A

Batch 650: Training loss = 0.0925, Training accuracy = 0.9496, F1 = 0.9495



Epoch 7/10:  30%|██▉       | 658/2208 [00:36<01:32, 16.83it/s][A
Epoch 7/10:  30%|██▉       | 661/2208 [00:36<01:25, 18.11it/s][A
Epoch 7/10:  30%|███       | 664/2208 [00:36<01:21, 19.03it/s][A
Epoch 7/10:  30%|███       | 666/2208 [00:36<01:25, 18.10it/s][A
Epoch 7/10:  30%|███       | 669/2208 [00:37<01:36, 15.88it/s][A
Epoch 7/10:  30%|███       | 671/2208 [00:37<01:32, 16.68it/s][A
Epoch 7/10:  31%|███       | 674/2208 [00:37<01:25, 18.01it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  31%|███       | 679/2208 [00:37<01:33, 16.42it/s][A

Batch 675: Training loss = 0.1162, Training accuracy = 0.9498, F1 = 0.9497



Epoch 7/10:  31%|███       | 682/2208 [00:37<01:25, 17.79it/s][A
Epoch 7/10:  31%|███       | 685/2208 [00:38<01:20, 18.88it/s][A
Epoch 7/10:  31%|███       | 688/2208 [00:38<01:17, 19.67it/s][A
Epoch 7/10:  31%|███▏      | 691/2208 [00:38<01:15, 20.19it/s][A
Epoch 7/10:  31%|███▏      | 694/2208 [00:38<01:17, 19.62it/s][A
Epoch 7/10:  32%|███▏      | 696/2208 [00:38<01:16, 19.67it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  32%|███▏      | 702/2208 [00:39<01:36, 15.65it/s][A
Epoch 7/10:  32%|███▏      | 705/2208 [00:39<01:27, 17.18it/s][A

Batch 700: Training loss = 0.2157, Training accuracy = 0.9498, F1 = 0.9497



Epoch 7/10:  32%|███▏      | 708/2208 [00:39<01:21, 18.30it/s][A
Epoch 7/10:  32%|███▏      | 711/2208 [00:39<01:18, 19.12it/s][A
Epoch 7/10:  32%|███▏      | 714/2208 [00:39<01:15, 19.81it/s][A
Epoch 7/10:  32%|███▏      | 717/2208 [00:39<01:13, 20.20it/s][A
Epoch 7/10:  33%|███▎      | 720/2208 [00:39<01:12, 20.58it/s][A
Epoch 7/10:  33%|███▎      | 723/2208 [00:40<01:12, 20.49it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  33%|███▎      | 729/2208 [00:40<01:23, 17.73it/s][A

Batch 725: Training loss = 0.2028, Training accuracy = 0.9497, F1 = 0.9497



Epoch 7/10:  33%|███▎      | 732/2208 [00:40<01:18, 18.70it/s][A
Epoch 7/10:  33%|███▎      | 735/2208 [00:40<01:15, 19.44it/s][A
Epoch 7/10:  33%|███▎      | 738/2208 [00:40<01:13, 20.04it/s][A
Epoch 7/10:  34%|███▎      | 741/2208 [00:41<01:16, 19.26it/s][A
Epoch 7/10:  34%|███▎      | 744/2208 [00:41<01:14, 19.59it/s][A
Epoch 7/10:  34%|███▍      | 747/2208 [00:41<01:12, 20.23it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  34%|███▍      | 753/2208 [00:41<01:33, 15.48it/s][A

Batch 750: Training loss = 0.2739, Training accuracy = 0.9497, F1 = 0.9496



Epoch 7/10:  34%|███▍      | 756/2208 [00:41<01:25, 16.95it/s][A
Epoch 7/10:  34%|███▍      | 759/2208 [00:42<01:20, 17.99it/s][A
Epoch 7/10:  35%|███▍      | 762/2208 [00:42<01:16, 18.91it/s][A
Epoch 7/10:  35%|███▍      | 765/2208 [00:42<01:13, 19.61it/s][A
Epoch 7/10:  35%|███▍      | 768/2208 [00:42<01:11, 20.05it/s][A
Epoch 7/10:  35%|███▍      | 771/2208 [00:42<01:10, 20.24it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  35%|███▌      | 777/2208 [00:42<01:28, 16.14it/s][A
Epoch 7/10:  35%|███▌      | 780/2208 [00:43<01:21, 17.45it/s][A

Batch 775: Training loss = 0.1062, Training accuracy = 0.9500, F1 = 0.9500



Epoch 7/10:  35%|███▌      | 783/2208 [00:43<01:17, 18.42it/s][A
Epoch 7/10:  36%|███▌      | 786/2208 [00:43<01:14, 19.11it/s][A
Epoch 7/10:  36%|███▌      | 789/2208 [00:43<01:11, 19.73it/s][A
Epoch 7/10:  36%|███▌      | 792/2208 [00:43<01:10, 20.18it/s][A
Epoch 7/10:  36%|███▌      | 795/2208 [00:43<01:09, 20.47it/s][A
Epoch 7/10:  36%|███▌      | 798/2208 [00:43<01:08, 20.72it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  36%|███▋      | 804/2208 [00:44<01:21, 17.19it/s][A

Batch 800: Training loss = 0.0894, Training accuracy = 0.9502, F1 = 0.9501



Epoch 7/10:  37%|███▋      | 807/2208 [00:44<01:17, 18.15it/s][A
Epoch 7/10:  37%|███▋      | 810/2208 [00:44<01:13, 19.05it/s][A
Epoch 7/10:  37%|███▋      | 813/2208 [00:44<01:10, 19.66it/s][A
Epoch 7/10:  37%|███▋      | 816/2208 [00:44<01:09, 20.07it/s][A
Epoch 7/10:  37%|███▋      | 819/2208 [00:45<01:08, 20.30it/s][A
Epoch 7/10:  37%|███▋      | 822/2208 [00:45<01:07, 20.61it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  38%|███▊      | 828/2208 [00:45<01:26, 15.96it/s][A

Batch 825: Training loss = 0.0965, Training accuracy = 0.9501, F1 = 0.9500



Epoch 7/10:  38%|███▊      | 831/2208 [00:45<01:19, 17.40it/s][A
Epoch 7/10:  38%|███▊      | 834/2208 [00:45<01:14, 18.38it/s][A
Epoch 7/10:  38%|███▊      | 837/2208 [00:46<01:11, 19.15it/s][A
Epoch 7/10:  38%|███▊      | 840/2208 [00:46<01:09, 19.80it/s][A
Epoch 7/10:  38%|███▊      | 843/2208 [00:46<01:07, 20.15it/s][A
Epoch 7/10:  38%|███▊      | 846/2208 [00:46<01:06, 20.48it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  39%|███▊      | 852/2208 [00:46<01:24, 15.97it/s][A
Epoch 7/10:  39%|███▊      | 855/2208 [00:47<01:18, 17.34it/s][A

Batch 850: Training loss = 0.2923, Training accuracy = 0.9499, F1 = 0.9499



Epoch 7/10:  39%|███▉      | 858/2208 [00:47<01:13, 18.44it/s][A
Epoch 7/10:  39%|███▉      | 861/2208 [00:47<01:10, 19.08it/s][A
Epoch 7/10:  39%|███▉      | 864/2208 [00:47<01:08, 19.56it/s][A
Epoch 7/10:  39%|███▉      | 867/2208 [00:47<01:07, 19.99it/s][A
Epoch 7/10:  39%|███▉      | 870/2208 [00:47<01:05, 20.37it/s][A
Epoch 7/10:  40%|███▉      | 873/2208 [00:48<01:16, 17.35it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  40%|███▉      | 879/2208 [00:48<01:25, 15.54it/s][A

Batch 875: Training loss = 0.1253, Training accuracy = 0.9498, F1 = 0.9498



Epoch 7/10:  40%|███▉      | 882/2208 [00:48<01:18, 16.92it/s][A
Epoch 7/10:  40%|████      | 885/2208 [00:48<01:13, 17.95it/s][A
Epoch 7/10:  40%|████      | 888/2208 [00:48<01:10, 18.79it/s][A
Epoch 7/10:  40%|████      | 891/2208 [00:49<01:07, 19.38it/s][A
Epoch 7/10:  40%|████      | 894/2208 [00:49<01:07, 19.40it/s][A
Epoch 7/10:  41%|████      | 897/2208 [00:49<01:05, 19.93it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  41%|████      | 903/2208 [00:49<01:35, 13.62it/s][A

Batch 900: Training loss = 0.1682, Training accuracy = 0.9498, F1 = 0.9498



Epoch 7/10:  41%|████      | 906/2208 [00:50<01:25, 15.26it/s][A
Epoch 7/10:  41%|████      | 909/2208 [00:50<01:17, 16.68it/s][A
Epoch 7/10:  41%|████▏     | 912/2208 [00:50<01:12, 17.78it/s][A
Epoch 7/10:  41%|████▏     | 914/2208 [00:50<01:12, 17.81it/s][A
Epoch 7/10:  42%|████▏     | 917/2208 [00:50<01:08, 18.82it/s][A
Epoch 7/10:  42%|████▏     | 919/2208 [00:50<01:10, 18.34it/s][A
Epoch 7/10:  42%|████▏     | 922/2208 [00:50<01:07, 19.11it/s][A
Epoch 7/10:  42%|████▏     | 924/2208 [00:50<01:12, 17.67it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  42%|████▏     | 929/2208 [00:51<01:32, 13.80it/s][A

Batch 925: Training loss = 0.0836, Training accuracy = 0.9498, F1 = 0.9497



Epoch 7/10:  42%|████▏     | 932/2208 [00:51<01:21, 15.65it/s][A
Epoch 7/10:  42%|████▏     | 935/2208 [00:51<01:14, 17.08it/s][A
Epoch 7/10:  42%|████▏     | 938/2208 [00:51<01:09, 18.24it/s][A
Epoch 7/10:  43%|████▎     | 941/2208 [00:52<01:05, 19.22it/s][A
Epoch 7/10:  43%|████▎     | 944/2208 [00:52<01:09, 18.24it/s][A
Epoch 7/10:  43%|████▎     | 947/2208 [00:52<01:06, 19.09it/s][A
Epoch 7/10:  43%|████▎     | 949/2208 [00:52<01:05, 19.28it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  43%|████▎     | 954/2208 [00:52<01:20, 15.54it/s][A

Batch 950: Training loss = 0.0837, Training accuracy = 0.9498, F1 = 0.9498



Epoch 7/10:  43%|████▎     | 957/2208 [00:53<01:13, 17.09it/s][A
Epoch 7/10:  43%|████▎     | 960/2208 [00:53<01:08, 18.28it/s][A
Epoch 7/10:  44%|████▎     | 963/2208 [00:53<01:04, 19.26it/s][A
Epoch 7/10:  44%|████▍     | 966/2208 [00:53<01:02, 19.84it/s][A
Epoch 7/10:  44%|████▍     | 969/2208 [00:53<01:02, 19.82it/s][A
Epoch 7/10:  44%|████▍     | 972/2208 [00:53<01:11, 17.39it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  44%|████▍     | 977/2208 [00:54<01:35, 12.91it/s][A
Epoch 7/10:  44%|████▍     | 980/2208 [00:54<01:22, 14.85it/s][A

Batch 975: Training loss = 0.2004, Training accuracy = 0.9497, F1 = 0.9497



Epoch 7/10:  45%|████▍     | 983/2208 [00:54<01:14, 16.39it/s][A
Epoch 7/10:  45%|████▍     | 986/2208 [00:54<01:09, 17.63it/s][A
Epoch 7/10:  45%|████▍     | 989/2208 [00:54<01:05, 18.48it/s][A
Epoch 7/10:  45%|████▍     | 992/2208 [00:54<01:03, 19.27it/s][A
Epoch 7/10:  45%|████▌     | 995/2208 [00:55<01:01, 19.81it/s][A
Epoch 7/10:  45%|████▌     | 998/2208 [00:55<00:59, 20.33it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  45%|████▌     | 1004/2208 [00:55<01:15, 15.94it/s][A

Batch 1000: Training loss = 0.1649, Training accuracy = 0.9497, F1 = 0.9496



Epoch 7/10:  46%|████▌     | 1007/2208 [00:55<01:09, 17.30it/s][A
Epoch 7/10:  46%|████▌     | 1009/2208 [00:55<01:07, 17.79it/s][A
Epoch 7/10:  46%|████▌     | 1012/2208 [00:56<01:04, 18.67it/s][A
Epoch 7/10:  46%|████▌     | 1015/2208 [00:56<01:01, 19.47it/s][A
Epoch 7/10:  46%|████▌     | 1018/2208 [00:56<00:59, 20.00it/s][A
Epoch 7/10:  46%|████▌     | 1021/2208 [00:56<00:58, 20.34it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  47%|████▋     | 1027/2208 [00:57<01:19, 14.94it/s][A
Epoch 7/10:  47%|████▋     | 1030/2208 [00:57<01:11, 16.44it/s][A

Batch 1025: Training loss = 0.1250, Training accuracy = 0.9497, F1 = 0.9497



Epoch 7/10:  47%|████▋     | 1033/2208 [00:57<01:06, 17.73it/s][A
Epoch 7/10:  47%|████▋     | 1036/2208 [00:57<01:02, 18.77it/s][A
Epoch 7/10:  47%|████▋     | 1039/2208 [00:57<00:59, 19.49it/s][A
Epoch 7/10:  47%|████▋     | 1042/2208 [00:57<00:58, 20.02it/s][A
Epoch 7/10:  47%|████▋     | 1045/2208 [00:57<00:56, 20.47it/s][A
Epoch 7/10:  47%|████▋     | 1048/2208 [00:57<00:55, 20.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  48%|████▊     | 1054/2208 [00:58<01:09, 16.52it/s][A

Batch 1050: Training loss = 0.0923, Training accuracy = 0.9498, F1 = 0.9498



Epoch 7/10:  48%|████▊     | 1057/2208 [00:58<01:05, 17.66it/s][A
Epoch 7/10:  48%|████▊     | 1060/2208 [00:58<01:01, 18.62it/s][A
Epoch 7/10:  48%|████▊     | 1063/2208 [00:58<00:59, 19.29it/s][A
Epoch 7/10:  48%|████▊     | 1066/2208 [00:59<00:57, 19.79it/s][A
Epoch 7/10:  48%|████▊     | 1069/2208 [00:59<00:56, 20.31it/s][A
Epoch 7/10:  49%|████▊     | 1072/2208 [00:59<00:54, 20.67it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  49%|████▉     | 1078/2208 [00:59<01:16, 14.76it/s][A

Batch 1075: Training loss = 0.1031, Training accuracy = 0.9498, F1 = 0.9497



Epoch 7/10:  49%|████▉     | 1081/2208 [00:59<01:09, 16.27it/s][A
Epoch 7/10:  49%|████▉     | 1084/2208 [01:00<01:04, 17.45it/s][A
Epoch 7/10:  49%|████▉     | 1086/2208 [01:00<01:02, 17.94it/s][A
Epoch 7/10:  49%|████▉     | 1089/2208 [01:00<00:59, 18.80it/s][A
Epoch 7/10:  49%|████▉     | 1092/2208 [01:00<00:57, 19.52it/s][A
Epoch 7/10:  50%|████▉     | 1095/2208 [01:00<00:55, 19.97it/s][A
Epoch 7/10:  50%|████▉     | 1098/2208 [01:00<00:54, 20.22it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  50%|█████     | 1104/2208 [01:01<01:09, 15.96it/s][A

Batch 1100: Training loss = 0.1599, Training accuracy = 0.9498, F1 = 0.9497



Epoch 7/10:  50%|█████     | 1107/2208 [01:01<01:03, 17.36it/s][A
Epoch 7/10:  50%|█████     | 1110/2208 [01:01<01:00, 18.26it/s][A
Epoch 7/10:  50%|█████     | 1113/2208 [01:01<00:57, 19.11it/s][A
Epoch 7/10:  51%|█████     | 1116/2208 [01:01<00:55, 19.67it/s][A
Epoch 7/10:  51%|█████     | 1119/2208 [01:01<00:55, 19.72it/s][A
Epoch 7/10:  51%|█████     | 1122/2208 [01:02<00:54, 20.04it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  51%|█████     | 1128/2208 [01:02<01:18, 13.72it/s][A

Batch 1125: Training loss = 0.2085, Training accuracy = 0.9497, F1 = 0.9496



Epoch 7/10:  51%|█████     | 1131/2208 [01:02<01:09, 15.42it/s][A
Epoch 7/10:  51%|█████▏    | 1134/2208 [01:02<01:03, 16.82it/s][A
Epoch 7/10:  51%|█████▏    | 1137/2208 [01:03<01:00, 17.85it/s][A
Epoch 7/10:  52%|█████▏    | 1140/2208 [01:03<00:56, 18.83it/s][A
Epoch 7/10:  52%|█████▏    | 1143/2208 [01:03<00:54, 19.48it/s][A
Epoch 7/10:  52%|█████▏    | 1146/2208 [01:03<00:55, 19.25it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  52%|█████▏    | 1152/2208 [01:04<01:16, 13.73it/s][A
Epoch 7/10:  52%|█████▏    | 1155/2208 [01:04<01:08, 15.38it/s][A

Batch 1150: Training loss = 0.1069, Training accuracy = 0.9496, F1 = 0.9496



Epoch 7/10:  52%|█████▏    | 1158/2208 [01:04<01:02, 16.78it/s][A
Epoch 7/10:  53%|█████▎    | 1161/2208 [01:04<00:58, 17.85it/s][A
Epoch 7/10:  53%|█████▎    | 1164/2208 [01:04<00:56, 18.32it/s][A
Epoch 7/10:  53%|█████▎    | 1167/2208 [01:04<00:54, 19.06it/s][A
Epoch 7/10:  53%|█████▎    | 1170/2208 [01:04<00:52, 19.60it/s][A
Epoch 7/10:  53%|█████▎    | 1173/2208 [01:05<00:51, 20.08it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  53%|█████▎    | 1179/2208 [01:05<01:07, 15.15it/s][A

Batch 1175: Training loss = 0.2173, Training accuracy = 0.9496, F1 = 0.9495



Epoch 7/10:  54%|█████▎    | 1182/2208 [01:05<01:02, 16.55it/s][A
Epoch 7/10:  54%|█████▎    | 1185/2208 [01:05<00:57, 17.68it/s][A
Epoch 7/10:  54%|█████▍    | 1188/2208 [01:05<00:54, 18.65it/s][A
Epoch 7/10:  54%|█████▍    | 1191/2208 [01:06<00:53, 19.12it/s][A
Epoch 7/10:  54%|█████▍    | 1194/2208 [01:06<01:01, 16.56it/s][A
Epoch 7/10:  54%|█████▍    | 1196/2208 [01:06<01:11, 14.18it/s][A
Epoch 7/10:  54%|█████▍    | 1199/2208 [01:06<01:03, 15.99it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  55%|█████▍    | 1204/2208 [01:07<01:12, 13.85it/s][A

Batch 1200: Training loss = 0.1594, Training accuracy = 0.9494, F1 = 0.9494



Epoch 7/10:  55%|█████▍    | 1207/2208 [01:07<01:04, 15.60it/s][A
Epoch 7/10:  55%|█████▍    | 1210/2208 [01:07<00:58, 17.07it/s][A
Epoch 7/10:  55%|█████▍    | 1213/2208 [01:07<00:54, 18.17it/s][A
Epoch 7/10:  55%|█████▌    | 1216/2208 [01:07<00:52, 19.01it/s][A
Epoch 7/10:  55%|█████▌    | 1219/2208 [01:07<00:50, 19.68it/s][A
Epoch 7/10:  55%|█████▌    | 1222/2208 [01:08<00:48, 20.15it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  56%|█████▌    | 1228/2208 [01:08<01:10, 13.81it/s][A

Batch 1225: Training loss = 0.0915, Training accuracy = 0.9493, F1 = 0.9493



Epoch 7/10:  56%|█████▌    | 1231/2208 [01:08<01:03, 15.45it/s][A
Epoch 7/10:  56%|█████▌    | 1234/2208 [01:08<00:58, 16.79it/s][A
Epoch 7/10:  56%|█████▌    | 1237/2208 [01:08<00:54, 17.97it/s][A
Epoch 7/10:  56%|█████▌    | 1239/2208 [01:09<00:52, 18.38it/s][A
Epoch 7/10:  56%|█████▋    | 1242/2208 [01:09<00:50, 19.18it/s][A
Epoch 7/10:  56%|█████▋    | 1245/2208 [01:09<00:48, 19.76it/s][A
Epoch 7/10:  57%|█████▋    | 1248/2208 [01:09<00:47, 20.18it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  57%|█████▋    | 1254/2208 [01:10<01:04, 14.80it/s][A

Batch 1250: Training loss = 0.1496, Training accuracy = 0.9494, F1 = 0.9494



Epoch 7/10:  57%|█████▋    | 1257/2208 [01:10<00:57, 16.43it/s][A
Epoch 7/10:  57%|█████▋    | 1260/2208 [01:10<00:53, 17.71it/s][A
Epoch 7/10:  57%|█████▋    | 1263/2208 [01:10<00:50, 18.66it/s][A
Epoch 7/10:  57%|█████▋    | 1266/2208 [01:10<00:48, 19.40it/s][A
Epoch 7/10:  57%|█████▋    | 1269/2208 [01:10<00:47, 19.86it/s][A
Epoch 7/10:  58%|█████▊    | 1272/2208 [01:10<00:46, 20.29it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  58%|█████▊    | 1278/2208 [01:11<01:07, 13.72it/s][A

Batch 1275: Training loss = 0.1082, Training accuracy = 0.9495, F1 = 0.9494



Epoch 7/10:  58%|█████▊    | 1281/2208 [01:11<00:59, 15.46it/s][A
Epoch 7/10:  58%|█████▊    | 1284/2208 [01:11<00:54, 16.85it/s][A
Epoch 7/10:  58%|█████▊    | 1287/2208 [01:11<00:51, 18.00it/s][A
Epoch 7/10:  58%|█████▊    | 1290/2208 [01:11<00:49, 18.73it/s][A
Epoch 7/10:  59%|█████▊    | 1293/2208 [01:12<00:47, 19.40it/s][A
Epoch 7/10:  59%|█████▊    | 1296/2208 [01:12<00:45, 19.96it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  59%|█████▉    | 1302/2208 [01:12<01:13, 12.35it/s][A
Epoch 7/10:  59%|█████▉    | 1305/2208 [01:12<01:03, 14.21it/s][A

Batch 1300: Training loss = 0.1248, Training accuracy = 0.9495, F1 = 0.9494



Epoch 7/10:  59%|█████▉    | 1308/2208 [01:13<00:56, 15.80it/s][A
Epoch 7/10:  59%|█████▉    | 1311/2208 [01:13<00:52, 17.16it/s][A
Epoch 7/10:  60%|█████▉    | 1314/2208 [01:13<00:49, 18.24it/s][A
Epoch 7/10:  60%|█████▉    | 1317/2208 [01:13<00:46, 19.07it/s][A
Epoch 7/10:  60%|█████▉    | 1320/2208 [01:13<00:44, 19.75it/s][A
Epoch 7/10:  60%|█████▉    | 1323/2208 [01:13<00:43, 20.14it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  60%|██████    | 1329/2208 [01:14<00:57, 15.28it/s][A

Batch 1325: Training loss = 0.1723, Training accuracy = 0.9495, F1 = 0.9495



Epoch 7/10:  60%|██████    | 1332/2208 [01:14<00:52, 16.64it/s][A
Epoch 7/10:  60%|██████    | 1335/2208 [01:14<00:49, 17.81it/s][A
Epoch 7/10:  61%|██████    | 1338/2208 [01:14<00:46, 18.72it/s][A
Epoch 7/10:  61%|██████    | 1341/2208 [01:14<00:44, 19.29it/s][A
Epoch 7/10:  61%|██████    | 1344/2208 [01:15<00:43, 19.85it/s][A
Epoch 7/10:  61%|██████    | 1347/2208 [01:15<00:42, 20.13it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  61%|██████▏   | 1353/2208 [01:15<01:03, 13.52it/s][A

Batch 1350: Training loss = 0.0931, Training accuracy = 0.9497, F1 = 0.9496



Epoch 7/10:  61%|██████▏   | 1356/2208 [01:15<00:55, 15.26it/s][A
Epoch 7/10:  62%|██████▏   | 1359/2208 [01:16<00:51, 16.55it/s][A
Epoch 7/10:  62%|██████▏   | 1362/2208 [01:16<00:47, 17.75it/s][A
Epoch 7/10:  62%|██████▏   | 1365/2208 [01:16<00:45, 18.64it/s][A
Epoch 7/10:  62%|██████▏   | 1368/2208 [01:16<00:43, 19.37it/s][A
Epoch 7/10:  62%|██████▏   | 1371/2208 [01:16<00:42, 19.89it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  62%|██████▏   | 1377/2208 [01:17<01:07, 12.27it/s][A
Epoch 7/10:  62%|██████▎   | 1380/2208 [01:17<00:58, 14.09it/s][A

Batch 1375: Training loss = 0.1234, Training accuracy = 0.9497, F1 = 0.9496



Epoch 7/10:  63%|██████▎   | 1383/2208 [01:17<00:52, 15.59it/s][A
Epoch 7/10:  63%|██████▎   | 1386/2208 [01:17<00:48, 16.89it/s][A
Epoch 7/10:  63%|██████▎   | 1389/2208 [01:17<00:45, 17.99it/s][A
Epoch 7/10:  63%|██████▎   | 1391/2208 [01:17<00:47, 17.13it/s][A
Epoch 7/10:  63%|██████▎   | 1394/2208 [01:18<00:44, 18.27it/s][A
Epoch 7/10:  63%|██████▎   | 1397/2208 [01:18<00:42, 19.08it/s][A
Epoch 7/10:  63%|██████▎   | 1399/2208 [01:18<00:43, 18.50it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  64%|██████▎   | 1404/2208 [01:18<01:00, 13.29it/s][A

Batch 1400: Training loss = 0.1577, Training accuracy = 0.9497, F1 = 0.9496



Epoch 7/10:  64%|██████▎   | 1407/2208 [01:19<00:52, 15.22it/s][A
Epoch 7/10:  64%|██████▍   | 1410/2208 [01:19<00:47, 16.80it/s][A
Epoch 7/10:  64%|██████▍   | 1413/2208 [01:19<00:44, 17.98it/s][A
Epoch 7/10:  64%|██████▍   | 1416/2208 [01:19<00:42, 18.81it/s][A
Epoch 7/10:  64%|██████▍   | 1419/2208 [01:19<00:41, 19.01it/s][A
Epoch 7/10:  64%|██████▍   | 1421/2208 [01:19<00:41, 19.19it/s][A
Epoch 7/10:  64%|██████▍   | 1424/2208 [01:19<00:48, 16.31it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  65%|██████▍   | 1429/2208 [01:20<00:58, 13.25it/s][A

Batch 1425: Training loss = 0.1725, Training accuracy = 0.9496, F1 = 0.9496



Epoch 7/10:  65%|██████▍   | 1432/2208 [01:20<00:51, 15.03it/s][A
Epoch 7/10:  65%|██████▍   | 1435/2208 [01:20<00:46, 16.53it/s][A
Epoch 7/10:  65%|██████▌   | 1438/2208 [01:20<00:43, 17.70it/s][A
Epoch 7/10:  65%|██████▌   | 1440/2208 [01:20<00:42, 18.18it/s][A
Epoch 7/10:  65%|██████▌   | 1443/2208 [01:21<00:40, 19.07it/s][A
Epoch 7/10:  65%|██████▌   | 1446/2208 [01:21<00:38, 19.75it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  66%|██████▌   | 1452/2208 [01:21<01:01, 12.33it/s][A
Epoch 7/10:  66%|██████▌   | 1455/2208 [01:21<00:52, 14.23it/s][A

Batch 1450: Training loss = 0.1907, Training accuracy = 0.9497, F1 = 0.9497



Epoch 7/10:  66%|██████▌   | 1458/2208 [01:22<00:47, 15.92it/s][A
Epoch 7/10:  66%|██████▌   | 1461/2208 [01:22<00:43, 17.30it/s][A
Epoch 7/10:  66%|██████▋   | 1464/2208 [01:22<00:40, 18.42it/s][A
Epoch 7/10:  66%|██████▋   | 1467/2208 [01:22<00:38, 19.19it/s][A
Epoch 7/10:  67%|██████▋   | 1470/2208 [01:22<00:37, 19.74it/s][A
Epoch 7/10:  67%|██████▋   | 1473/2208 [01:22<00:36, 20.13it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  67%|██████▋   | 1479/2208 [01:23<00:50, 14.32it/s][A

Batch 1475: Training loss = 0.1837, Training accuracy = 0.9498, F1 = 0.9498



Epoch 7/10:  67%|██████▋   | 1482/2208 [01:23<00:45, 15.90it/s][A
Epoch 7/10:  67%|██████▋   | 1485/2208 [01:23<00:42, 17.16it/s][A
Epoch 7/10:  67%|██████▋   | 1488/2208 [01:23<00:39, 18.13it/s][A
Epoch 7/10:  68%|██████▊   | 1491/2208 [01:23<00:37, 18.96it/s][A
Epoch 7/10:  68%|██████▊   | 1494/2208 [01:24<00:36, 19.55it/s][A
Epoch 7/10:  68%|██████▊   | 1497/2208 [01:24<00:35, 19.99it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  68%|██████▊   | 1503/2208 [01:24<00:55, 12.74it/s][A

Batch 1500: Training loss = 0.1345, Training accuracy = 0.9498, F1 = 0.9498



Epoch 7/10:  68%|██████▊   | 1506/2208 [01:24<00:48, 14.52it/s][A
Epoch 7/10:  68%|██████▊   | 1509/2208 [01:25<00:43, 16.10it/s][A
Epoch 7/10:  68%|██████▊   | 1512/2208 [01:25<00:40, 17.36it/s][A
Epoch 7/10:  69%|██████▊   | 1515/2208 [01:25<00:37, 18.40it/s][A
Epoch 7/10:  69%|██████▉   | 1518/2208 [01:25<00:35, 19.18it/s][A
Epoch 7/10:  69%|██████▉   | 1521/2208 [01:25<00:34, 19.80it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  69%|██████▉   | 1527/2208 [01:26<00:53, 12.73it/s][A
Epoch 7/10:  69%|██████▉   | 1530/2208 [01:26<00:46, 14.56it/s][A

Batch 1525: Training loss = 0.1603, Training accuracy = 0.9498, F1 = 0.9498



Epoch 7/10:  69%|██████▉   | 1533/2208 [01:26<00:42, 16.04it/s][A
Epoch 7/10:  70%|██████▉   | 1536/2208 [01:26<00:38, 17.28it/s][A
Epoch 7/10:  70%|██████▉   | 1539/2208 [01:26<00:36, 18.30it/s][A
Epoch 7/10:  70%|██████▉   | 1542/2208 [01:26<00:34, 19.15it/s][A
Epoch 7/10:  70%|██████▉   | 1545/2208 [01:27<00:33, 19.66it/s][A
Epoch 7/10:  70%|███████   | 1548/2208 [01:27<00:32, 20.18it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  70%|███████   | 1554/2208 [01:27<00:45, 14.32it/s][A

Batch 1550: Training loss = 0.1430, Training accuracy = 0.9498, F1 = 0.9497



Epoch 7/10:  71%|███████   | 1557/2208 [01:27<00:40, 15.98it/s][A
Epoch 7/10:  71%|███████   | 1560/2208 [01:28<00:37, 17.30it/s][A
Epoch 7/10:  71%|███████   | 1563/2208 [01:28<00:35, 18.33it/s][A
Epoch 7/10:  71%|███████   | 1566/2208 [01:28<00:33, 19.14it/s][A
Epoch 7/10:  71%|███████   | 1569/2208 [01:28<00:32, 19.62it/s][A
Epoch 7/10:  71%|███████   | 1572/2208 [01:28<00:31, 20.14it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  71%|███████▏  | 1578/2208 [01:29<00:50, 12.56it/s][A

Batch 1575: Training loss = 0.1793, Training accuracy = 0.9498, F1 = 0.9497



Epoch 7/10:  72%|███████▏  | 1581/2208 [01:29<00:43, 14.41it/s][A
Epoch 7/10:  72%|███████▏  | 1584/2208 [01:29<00:39, 15.91it/s][A
Epoch 7/10:  72%|███████▏  | 1587/2208 [01:29<00:36, 17.13it/s][A
Epoch 7/10:  72%|███████▏  | 1590/2208 [01:29<00:33, 18.21it/s][A
Epoch 7/10:  72%|███████▏  | 1593/2208 [01:29<00:32, 19.02it/s][A
Epoch 7/10:  72%|███████▏  | 1596/2208 [01:30<00:31, 19.68it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  73%|███████▎  | 1602/2208 [01:30<00:48, 12.45it/s][A
Epoch 7/10:  73%|███████▎  | 1605/2208 [01:30<00:42, 14.26it/s][A

Batch 1600: Training loss = 0.1835, Training accuracy = 0.9498, F1 = 0.9498



Epoch 7/10:  73%|███████▎  | 1608/2208 [01:30<00:37, 15.81it/s][A
Epoch 7/10:  73%|███████▎  | 1611/2208 [01:31<00:34, 17.21it/s][A
Epoch 7/10:  73%|███████▎  | 1614/2208 [01:31<00:32, 18.18it/s][A
Epoch 7/10:  73%|███████▎  | 1617/2208 [01:31<00:31, 19.04it/s][A
Epoch 7/10:  73%|███████▎  | 1620/2208 [01:31<00:29, 19.66it/s][A
Epoch 7/10:  74%|███████▎  | 1623/2208 [01:31<00:29, 20.07it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  74%|███████▍  | 1629/2208 [01:32<00:43, 13.29it/s][A

Batch 1625: Training loss = 0.1301, Training accuracy = 0.9499, F1 = 0.9499



Epoch 7/10:  74%|███████▍  | 1632/2208 [01:32<00:38, 14.98it/s][A
Epoch 7/10:  74%|███████▍  | 1635/2208 [01:32<00:35, 16.32it/s][A
Epoch 7/10:  74%|███████▍  | 1638/2208 [01:32<00:32, 17.50it/s][A
Epoch 7/10:  74%|███████▍  | 1641/2208 [01:32<00:30, 18.33it/s][A
Epoch 7/10:  74%|███████▍  | 1644/2208 [01:33<00:29, 19.06it/s][A
Epoch 7/10:  75%|███████▍  | 1647/2208 [01:33<00:29, 19.14it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  75%|███████▍  | 1652/2208 [01:33<00:51, 10.82it/s][A
Epoch 7/10:  75%|███████▍  | 1655/2208 [01:34<00:42, 12.91it/s][A

Batch 1650: Training loss = 0.1547, Training accuracy = 0.9499, F1 = 0.9499



Epoch 7/10:  75%|███████▌  | 1658/2208 [01:34<00:37, 14.76it/s][A
Epoch 7/10:  75%|███████▌  | 1660/2208 [01:34<00:34, 15.70it/s][A
Epoch 7/10:  75%|███████▌  | 1663/2208 [01:34<00:31, 17.14it/s][A
Epoch 7/10:  75%|███████▌  | 1665/2208 [01:34<00:30, 17.74it/s][A
Epoch 7/10:  76%|███████▌  | 1668/2208 [01:34<00:29, 18.56it/s][A
Epoch 7/10:  76%|███████▌  | 1670/2208 [01:34<00:30, 17.83it/s][A
Epoch 7/10:  76%|███████▌  | 1673/2208 [01:34<00:33, 16.20it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  76%|███████▌  | 1679/2208 [01:35<00:42, 12.58it/s][A

Batch 1675: Training loss = 0.1495, Training accuracy = 0.9500, F1 = 0.9499



Epoch 7/10:  76%|███████▌  | 1682/2208 [01:35<00:36, 14.44it/s][A
Epoch 7/10:  76%|███████▋  | 1685/2208 [01:35<00:32, 15.95it/s][A
Epoch 7/10:  76%|███████▋  | 1688/2208 [01:36<00:30, 17.27it/s][A
Epoch 7/10:  77%|███████▋  | 1691/2208 [01:36<00:28, 18.31it/s][A
Epoch 7/10:  77%|███████▋  | 1694/2208 [01:36<00:26, 19.08it/s][A
Epoch 7/10:  77%|███████▋  | 1697/2208 [01:36<00:25, 19.69it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  77%|███████▋  | 1703/2208 [01:37<00:43, 11.63it/s][A

Batch 1700: Training loss = 0.2913, Training accuracy = 0.9500, F1 = 0.9500



Epoch 7/10:  77%|███████▋  | 1706/2208 [01:37<00:37, 13.50it/s][A
Epoch 7/10:  77%|███████▋  | 1709/2208 [01:37<00:32, 15.20it/s][A
Epoch 7/10:  78%|███████▊  | 1712/2208 [01:37<00:29, 16.68it/s][A
Epoch 7/10:  78%|███████▊  | 1715/2208 [01:37<00:27, 17.82it/s][A
Epoch 7/10:  78%|███████▊  | 1718/2208 [01:37<00:26, 18.69it/s][A
Epoch 7/10:  78%|███████▊  | 1721/2208 [01:37<00:25, 19.38it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  78%|███████▊  | 1727/2208 [01:38<00:39, 12.03it/s][A
Epoch 7/10:  78%|███████▊  | 1730/2208 [01:38<00:34, 13.86it/s][A

Batch 1725: Training loss = 0.1205, Training accuracy = 0.9501, F1 = 0.9501



Epoch 7/10:  78%|███████▊  | 1733/2208 [01:38<00:30, 15.46it/s][A
Epoch 7/10:  79%|███████▊  | 1736/2208 [01:39<00:27, 16.89it/s][A
Epoch 7/10:  79%|███████▉  | 1739/2208 [01:39<00:26, 17.92it/s][A
Epoch 7/10:  79%|███████▉  | 1742/2208 [01:39<00:24, 18.87it/s][A
Epoch 7/10:  79%|███████▉  | 1745/2208 [01:39<00:23, 19.57it/s][A
Epoch 7/10:  79%|███████▉  | 1748/2208 [01:39<00:22, 20.01it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  79%|███████▉  | 1754/2208 [01:40<00:33, 13.70it/s][A

Batch 1750: Training loss = 0.1877, Training accuracy = 0.9502, F1 = 0.9501



Epoch 7/10:  80%|███████▉  | 1757/2208 [01:40<00:29, 15.37it/s][A
Epoch 7/10:  80%|███████▉  | 1760/2208 [01:40<00:26, 16.76it/s][A
Epoch 7/10:  80%|███████▉  | 1763/2208 [01:40<00:25, 17.79it/s][A
Epoch 7/10:  80%|███████▉  | 1766/2208 [01:40<00:23, 18.69it/s][A
Epoch 7/10:  80%|████████  | 1769/2208 [01:40<00:22, 19.36it/s][A
Epoch 7/10:  80%|████████  | 1772/2208 [01:41<00:22, 19.79it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  81%|████████  | 1778/2208 [01:41<00:36, 11.90it/s][A

Batch 1775: Training loss = 0.1087, Training accuracy = 0.9503, F1 = 0.9502



Epoch 7/10:  81%|████████  | 1781/2208 [01:41<00:31, 13.72it/s][A
Epoch 7/10:  81%|████████  | 1784/2208 [01:41<00:27, 15.31it/s][A
Epoch 7/10:  81%|████████  | 1787/2208 [01:42<00:25, 16.73it/s][A
Epoch 7/10:  81%|████████  | 1790/2208 [01:42<00:23, 17.93it/s][A
Epoch 7/10:  81%|████████  | 1793/2208 [01:42<00:22, 18.86it/s][A
Epoch 7/10:  81%|████████▏ | 1796/2208 [01:42<00:21, 19.40it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  82%|████████▏ | 1802/2208 [01:43<00:34, 11.67it/s][A
Epoch 7/10:  82%|████████▏ | 1805/2208 [01:43<00:29, 13.53it/s][A

Batch 1800: Training loss = 0.0975, Training accuracy = 0.9504, F1 = 0.9504



Epoch 7/10:  82%|████████▏ | 1808/2208 [01:43<00:26, 15.16it/s][A
Epoch 7/10:  82%|████████▏ | 1811/2208 [01:43<00:24, 16.52it/s][A
Epoch 7/10:  82%|████████▏ | 1814/2208 [01:43<00:22, 17.77it/s][A
Epoch 7/10:  82%|████████▏ | 1817/2208 [01:43<00:21, 18.60it/s][A
Epoch 7/10:  82%|████████▏ | 1820/2208 [01:44<00:20, 19.29it/s][A
Epoch 7/10:  83%|████████▎ | 1823/2208 [01:44<00:19, 19.76it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  83%|████████▎ | 1829/2208 [01:44<00:28, 13.35it/s][A

Batch 1825: Training loss = 0.0695, Training accuracy = 0.9504, F1 = 0.9503



Epoch 7/10:  83%|████████▎ | 1832/2208 [01:44<00:25, 15.01it/s][A
Epoch 7/10:  83%|████████▎ | 1835/2208 [01:45<00:22, 16.37it/s][A
Epoch 7/10:  83%|████████▎ | 1838/2208 [01:45<00:21, 17.54it/s][A
Epoch 7/10:  83%|████████▎ | 1841/2208 [01:45<00:19, 18.40it/s][A
Epoch 7/10:  84%|████████▎ | 1844/2208 [01:45<00:18, 19.19it/s][A
Epoch 7/10:  84%|████████▎ | 1847/2208 [01:45<00:18, 19.64it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  84%|████████▍ | 1853/2208 [01:46<00:31, 11.25it/s][A

Batch 1850: Training loss = 0.1103, Training accuracy = 0.9504, F1 = 0.9504



Epoch 7/10:  84%|████████▍ | 1856/2208 [01:46<00:26, 13.15it/s][A
Epoch 7/10:  84%|████████▍ | 1859/2208 [01:46<00:23, 14.80it/s][A
Epoch 7/10:  84%|████████▍ | 1862/2208 [01:46<00:21, 16.21it/s][A
Epoch 7/10:  84%|████████▍ | 1865/2208 [01:46<00:19, 17.42it/s][A
Epoch 7/10:  85%|████████▍ | 1868/2208 [01:47<00:18, 18.42it/s][A
Epoch 7/10:  85%|████████▍ | 1871/2208 [01:47<00:19, 17.14it/s][A
Epoch 7/10:  85%|████████▍ | 1874/2208 [01:47<00:18, 18.22it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  85%|████████▌ | 1879/2208 [01:48<00:26, 12.51it/s][A

Batch 1875: Training loss = 0.1338, Training accuracy = 0.9505, F1 = 0.9504



Epoch 7/10:  85%|████████▌ | 1882/2208 [01:48<00:22, 14.30it/s][A
Epoch 7/10:  85%|████████▌ | 1885/2208 [01:48<00:20, 15.92it/s][A
Epoch 7/10:  86%|████████▌ | 1888/2208 [01:48<00:18, 17.23it/s][A
Epoch 7/10:  86%|████████▌ | 1891/2208 [01:48<00:17, 18.17it/s][A
Epoch 7/10:  86%|████████▌ | 1894/2208 [01:48<00:16, 19.12it/s][A
Epoch 7/10:  86%|████████▌ | 1897/2208 [01:48<00:17, 18.27it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  86%|████████▌ | 1902/2208 [01:49<00:30, 10.06it/s][A
Epoch 7/10:  86%|████████▋ | 1905/2208 [01:49<00:24, 12.17it/s][A

Batch 1900: Training loss = 0.1820, Training accuracy = 0.9505, F1 = 0.9505



Epoch 7/10:  86%|████████▋ | 1908/2208 [01:49<00:21, 14.10it/s][A
Epoch 7/10:  87%|████████▋ | 1911/2208 [01:50<00:18, 15.76it/s][A
Epoch 7/10:  87%|████████▋ | 1914/2208 [01:50<00:17, 17.09it/s][A
Epoch 7/10:  87%|████████▋ | 1917/2208 [01:50<00:16, 18.11it/s][A
Epoch 7/10:  87%|████████▋ | 1920/2208 [01:50<00:15, 18.89it/s][A
Epoch 7/10:  87%|████████▋ | 1923/2208 [01:50<00:14, 19.61it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  87%|████████▋ | 1929/2208 [01:51<00:20, 13.34it/s][A

Batch 1925: Training loss = 0.0703, Training accuracy = 0.9506, F1 = 0.9505



Epoch 7/10:  88%|████████▊ | 1932/2208 [01:51<00:18, 15.02it/s][A
Epoch 7/10:  88%|████████▊ | 1935/2208 [01:51<00:16, 16.45it/s][A
Epoch 7/10:  88%|████████▊ | 1938/2208 [01:51<00:15, 17.63it/s][A
Epoch 7/10:  88%|████████▊ | 1941/2208 [01:51<00:14, 18.65it/s][A
Epoch 7/10:  88%|████████▊ | 1944/2208 [01:51<00:13, 19.33it/s][A
Epoch 7/10:  88%|████████▊ | 1947/2208 [01:52<00:13, 19.87it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  88%|████████▊ | 1953/2208 [01:52<00:21, 11.69it/s][A

Batch 1950: Training loss = 0.1034, Training accuracy = 0.9506, F1 = 0.9506



Epoch 7/10:  89%|████████▊ | 1956/2208 [01:52<00:18, 13.45it/s][A
Epoch 7/10:  89%|████████▊ | 1959/2208 [01:53<00:16, 15.13it/s][A
Epoch 7/10:  89%|████████▉ | 1962/2208 [01:53<00:14, 16.49it/s][A
Epoch 7/10:  89%|████████▉ | 1965/2208 [01:53<00:13, 17.77it/s][A
Epoch 7/10:  89%|████████▉ | 1968/2208 [01:53<00:12, 18.73it/s][A
Epoch 7/10:  89%|████████▉ | 1971/2208 [01:53<00:12, 18.55it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  90%|████████▉ | 1977/2208 [01:54<00:20, 11.23it/s][A
Epoch 7/10:  90%|████████▉ | 1980/2208 [01:54<00:17, 13.14it/s][A

Batch 1975: Training loss = 0.1840, Training accuracy = 0.9506, F1 = 0.9506



Epoch 7/10:  90%|████████▉ | 1983/2208 [01:54<00:15, 14.83it/s][A
Epoch 7/10:  90%|████████▉ | 1986/2208 [01:54<00:13, 16.25it/s][A
Epoch 7/10:  90%|█████████ | 1989/2208 [01:54<00:12, 17.48it/s][A
Epoch 7/10:  90%|█████████ | 1992/2208 [01:54<00:11, 18.41it/s][A
Epoch 7/10:  90%|█████████ | 1995/2208 [01:55<00:11, 18.98it/s][A
Epoch 7/10:  90%|█████████ | 1998/2208 [01:55<00:10, 19.61it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  91%|█████████ | 2004/2208 [01:55<00:15, 13.16it/s][A

Batch 2000: Training loss = 0.1582, Training accuracy = 0.9506, F1 = 0.9505



Epoch 7/10:  91%|█████████ | 2007/2208 [01:56<00:13, 14.87it/s][A
Epoch 7/10:  91%|█████████ | 2010/2208 [01:56<00:12, 16.31it/s][A
Epoch 7/10:  91%|█████████ | 2013/2208 [01:56<00:11, 17.39it/s][A
Epoch 7/10:  91%|█████████▏| 2016/2208 [01:56<00:10, 18.26it/s][A
Epoch 7/10:  91%|█████████▏| 2019/2208 [01:56<00:09, 18.91it/s][A
Epoch 7/10:  92%|█████████▏| 2022/2208 [01:56<00:09, 19.60it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  92%|█████████▏| 2028/2208 [01:57<00:16, 10.95it/s][A

Batch 2025: Training loss = 0.2529, Training accuracy = 0.9506, F1 = 0.9505



Epoch 7/10:  92%|█████████▏| 2031/2208 [01:57<00:13, 12.86it/s][A
Epoch 7/10:  92%|█████████▏| 2034/2208 [01:57<00:11, 14.51it/s][A
Epoch 7/10:  92%|█████████▏| 2037/2208 [01:57<00:10, 15.94it/s][A
Epoch 7/10:  92%|█████████▏| 2040/2208 [01:58<00:09, 17.24it/s][A
Epoch 7/10:  93%|█████████▎| 2043/2208 [01:58<00:09, 18.15it/s][A
Epoch 7/10:  93%|█████████▎| 2046/2208 [01:58<00:08, 18.93it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  93%|█████████▎| 2052/2208 [01:59<00:15, 10.04it/s][A
Epoch 7/10:  93%|█████████▎| 2055/2208 [01:59<00:12, 11.99it/s][A

Batch 2050: Training loss = 0.1606, Training accuracy = 0.9506, F1 = 0.9505



Epoch 7/10:  93%|█████████▎| 2058/2208 [01:59<00:10, 13.83it/s][A
Epoch 7/10:  93%|█████████▎| 2061/2208 [01:59<00:09, 15.44it/s][A
Epoch 7/10:  93%|█████████▎| 2064/2208 [01:59<00:08, 16.91it/s][A
Epoch 7/10:  94%|█████████▎| 2067/2208 [01:59<00:07, 18.08it/s][A
Epoch 7/10:  94%|█████████▍| 2070/2208 [01:59<00:07, 18.89it/s][A
Epoch 7/10:  94%|█████████▍| 2073/2208 [02:00<00:06, 19.39it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  94%|█████████▍| 2079/2208 [02:00<00:10, 12.60it/s][A

Batch 2075: Training loss = 0.0723, Training accuracy = 0.9506, F1 = 0.9506



Epoch 7/10:  94%|█████████▍| 2082/2208 [02:00<00:08, 14.34it/s][A
Epoch 7/10:  94%|█████████▍| 2085/2208 [02:01<00:07, 15.88it/s][A
Epoch 7/10:  95%|█████████▍| 2088/2208 [02:01<00:06, 17.23it/s][A
Epoch 7/10:  95%|█████████▍| 2091/2208 [02:01<00:06, 18.23it/s][A
Epoch 7/10:  95%|█████████▍| 2094/2208 [02:01<00:06, 18.70it/s][A
Epoch 7/10:  95%|█████████▍| 2097/2208 [02:01<00:06, 16.14it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  95%|█████████▌| 2102/2208 [02:02<00:12,  8.59it/s][A
Epoch 7/10:  95%|█████████▌| 2105/2208 [02:02<00:09, 10.64it/s][A

Batch 2100: Training loss = 0.2055, Training accuracy = 0.9506, F1 = 0.9505



Epoch 7/10:  95%|█████████▌| 2108/2208 [02:02<00:07, 12.55it/s][A
Epoch 7/10:  96%|█████████▌| 2111/2208 [02:03<00:06, 14.37it/s][A
Epoch 7/10:  96%|█████████▌| 2114/2208 [02:03<00:05, 15.95it/s][A
Epoch 7/10:  96%|█████████▌| 2117/2208 [02:03<00:05, 17.16it/s][A
Epoch 7/10:  96%|█████████▌| 2119/2208 [02:03<00:05, 17.13it/s][A
Epoch 7/10:  96%|█████████▌| 2122/2208 [02:03<00:04, 18.27it/s][A
Epoch 7/10:  96%|█████████▌| 2124/2208 [02:03<00:04, 16.99it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  96%|█████████▋| 2129/2208 [02:04<00:07, 10.96it/s][A

Batch 2125: Training loss = 0.1221, Training accuracy = 0.9505, F1 = 0.9505



Epoch 7/10:  97%|█████████▋| 2132/2208 [02:04<00:05, 13.12it/s][A
Epoch 7/10:  97%|█████████▋| 2135/2208 [02:04<00:04, 14.97it/s][A
Epoch 7/10:  97%|█████████▋| 2138/2208 [02:04<00:04, 16.45it/s][A
Epoch 7/10:  97%|█████████▋| 2141/2208 [02:04<00:03, 17.69it/s][A
Epoch 7/10:  97%|█████████▋| 2144/2208 [02:05<00:03, 18.60it/s][A
Epoch 7/10:  97%|█████████▋| 2147/2208 [02:05<00:03, 19.35it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  98%|█████████▊| 2153/2208 [02:05<00:05, 10.89it/s][A

Batch 2150: Training loss = 0.1814, Training accuracy = 0.9506, F1 = 0.9505



Epoch 7/10:  98%|█████████▊| 2156/2208 [02:06<00:04, 12.80it/s][A
Epoch 7/10:  98%|█████████▊| 2159/2208 [02:06<00:03, 14.59it/s][A
Epoch 7/10:  98%|█████████▊| 2162/2208 [02:06<00:02, 16.15it/s][A
Epoch 7/10:  98%|█████████▊| 2165/2208 [02:06<00:02, 17.37it/s][A
Epoch 7/10:  98%|█████████▊| 2168/2208 [02:06<00:02, 18.40it/s][A
Epoch 7/10:  98%|█████████▊| 2171/2208 [02:06<00:01, 19.14it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10:  99%|█████████▊| 2177/2208 [02:07<00:02, 10.56it/s][A
Epoch 7/10:  99%|█████████▊| 2180/2208 [02:07<00:02, 12.47it/s][A

Batch 2175: Training loss = 0.2216, Training accuracy = 0.9505, F1 = 0.9505



Epoch 7/10:  99%|█████████▉| 2182/2208 [02:07<00:01, 13.58it/s][A
Epoch 7/10:  99%|█████████▉| 2185/2208 [02:07<00:01, 15.40it/s][A
Epoch 7/10:  99%|█████████▉| 2188/2208 [02:08<00:01, 16.88it/s][A
Epoch 7/10:  99%|█████████▉| 2191/2208 [02:08<00:00, 18.04it/s][A
Epoch 7/10:  99%|█████████▉| 2194/2208 [02:08<00:00, 18.93it/s][A
Epoch 7/10: 100%|█████████▉| 2197/2208 [02:08<00:00, 19.63it/s][A
  with torch.cuda.amp.autocast():

Epoch 7/10: 100%|█████████▉| 2203/2208 [02:09<00:00, 10.70it/s][A

Batch 2200: Training loss = 0.1170, Training accuracy = 0.9506, F1 = 0.9505



Epoch 7/10: 100%|█████████▉| 2206/2208 [02:09<00:00, 12.67it/s][A
                                                               [A


Epoch 7 Training Metrics:
Loss: 0.1482
Accuracy: 0.9506
F1 Score: 0.9506
Precision: 0.9505
Recall: 0.9506

Starting validation...



Validation:   0%|          | 0/552 [00:00<?, ?it/s][A
Validation:   0%|          | 1/552 [00:01<15:42,  1.71s/it][A
Validation:   1%|          | 3/552 [00:01<04:26,  2.06it/s][A
Validation:   1%|          | 5/552 [00:01<02:25,  3.77it/s][A
Validation:   1%|▏         | 7/552 [00:02<01:35,  5.70it/s][A
Validation:   2%|▏         | 9/552 [00:02<01:10,  7.74it/s][A
Validation:   2%|▏         | 11/552 [00:02<00:55,  9.74it/s][A
Validation:   2%|▏         | 13/552 [00:02<00:46, 11.64it/s][A
Validation:   3%|▎         | 15/552 [00:02<00:40, 13.22it/s][A
Validation:   3%|▎         | 17/552 [00:02<00:36, 14.60it/s][A
Validation:   3%|▎         | 19/552 [00:02<00:33, 15.76it/s][A
Validation:   4%|▍         | 21/552 [00:02<00:31, 16.62it/s][A
Validation:   4%|▍         | 23/552 [00:02<00:30, 17.26it/s][A
Validation:   5%|▍         | 25/552 [00:02<00:29, 17.77it/s][A
Validation:   5%|▍         | 27/552 [00:03<00:29, 18.07it/s][A
Validation:   5%|▌         | 29/552 [00:03<00:28, 18.


Epoch 7 Validation Metrics:
Loss: 0.1515
Accuracy: 0.9545
F1 Score: 0.9543
Precision: 0.9558
Recall: 0.9545


Training epochs:  70%|███████   | 7/10 [18:49<08:05, 161.81s/it]


Starting epoch 8/10



  with torch.cuda.amp.autocast():

  with torch.cuda.amp.autocast():

Epoch 8/10:   0%|          | 3/2208 [00:01<18:10,  2.02it/s]  [A

Batch 0: Training loss = 0.1390, Training accuracy = 0.9531, F1 = 0.9479



Epoch 8/10:   0%|          | 5/2208 [00:01<09:48,  3.74it/s][A
Epoch 8/10:   0%|          | 8/2208 [00:02<05:35,  6.56it/s][A
Epoch 8/10:   0%|          | 10/2208 [00:02<04:24,  8.30it/s][A
Epoch 8/10:   1%|          | 13/2208 [00:02<03:18, 11.04it/s][A
Epoch 8/10:   1%|          | 16/2208 [00:02<02:42, 13.49it/s][A
Epoch 8/10:   1%|          | 18/2208 [00:02<02:36, 14.03it/s][A
Epoch 8/10:   1%|          | 21/2208 [00:02<02:23, 15.28it/s][A
Epoch 8/10:   1%|          | 24/2208 [00:02<02:10, 16.79it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:   1%|▏         | 29/2208 [00:03<02:08, 16.98it/s][A

Batch 25: Training loss = 0.0440, Training accuracy = 0.9561, F1 = 0.9561



Epoch 8/10:   1%|▏         | 32/2208 [00:03<02:00, 18.04it/s][A
Epoch 8/10:   2%|▏         | 34/2208 [00:03<02:08, 16.85it/s][A
Epoch 8/10:   2%|▏         | 37/2208 [00:03<01:59, 18.19it/s][A
Epoch 8/10:   2%|▏         | 39/2208 [00:03<02:12, 16.34it/s][A
Epoch 8/10:   2%|▏         | 42/2208 [00:03<02:01, 17.78it/s][A
Epoch 8/10:   2%|▏         | 45/2208 [00:04<01:55, 18.70it/s][A
Epoch 8/10:   2%|▏         | 48/2208 [00:04<01:51, 19.34it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:   2%|▏         | 52/2208 [00:04<02:00, 17.93it/s][A

Batch 50: Training loss = 0.0851, Training accuracy = 0.9556, F1 = 0.9556



Epoch 8/10:   2%|▏         | 54/2208 [00:04<02:22, 15.10it/s][A
Epoch 8/10:   3%|▎         | 57/2208 [00:04<02:20, 15.27it/s][A
Epoch 8/10:   3%|▎         | 60/2208 [00:05<02:07, 16.80it/s][A
Epoch 8/10:   3%|▎         | 62/2208 [00:05<02:07, 16.83it/s][A
Epoch 8/10:   3%|▎         | 65/2208 [00:05<02:07, 16.83it/s][A
Epoch 8/10:   3%|▎         | 68/2208 [00:05<01:59, 17.98it/s][A
Epoch 8/10:   3%|▎         | 70/2208 [00:05<02:08, 16.70it/s][A
Epoch 8/10:   3%|▎         | 73/2208 [00:05<01:58, 18.01it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:   4%|▎         | 79/2208 [00:06<01:53, 18.82it/s][A

Batch 75: Training loss = 0.1313, Training accuracy = 0.9547, F1 = 0.9546



Epoch 8/10:   4%|▎         | 81/2208 [00:06<01:52, 18.97it/s][A
Epoch 8/10:   4%|▍         | 84/2208 [00:06<01:47, 19.73it/s][A
Epoch 8/10:   4%|▍         | 87/2208 [00:06<01:44, 20.21it/s][A
Epoch 8/10:   4%|▍         | 90/2208 [00:06<01:43, 20.55it/s][A
Epoch 8/10:   4%|▍         | 93/2208 [00:06<01:44, 20.27it/s][A
Epoch 8/10:   4%|▍         | 96/2208 [00:06<01:42, 20.54it/s][A
Epoch 8/10:   4%|▍         | 99/2208 [00:07<01:58, 17.80it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:   5%|▍         | 104/2208 [00:07<01:53, 18.49it/s][A

Batch 100: Training loss = 0.1643, Training accuracy = 0.9545, F1 = 0.9545



Epoch 8/10:   5%|▍         | 107/2208 [00:07<01:48, 19.28it/s][A
Epoch 8/10:   5%|▍         | 110/2208 [00:07<01:45, 19.92it/s][A
Epoch 8/10:   5%|▌         | 113/2208 [00:07<01:42, 20.44it/s][A
Epoch 8/10:   5%|▌         | 116/2208 [00:07<01:47, 19.45it/s][A
Epoch 8/10:   5%|▌         | 118/2208 [00:08<01:48, 19.33it/s][A
Epoch 8/10:   5%|▌         | 121/2208 [00:08<01:44, 20.01it/s][A
Epoch 8/10:   6%|▌         | 124/2208 [00:08<01:44, 19.87it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:   6%|▌         | 129/2208 [00:08<01:48, 19.21it/s][A

Batch 125: Training loss = 0.2015, Training accuracy = 0.9538, F1 = 0.9538



Epoch 8/10:   6%|▌         | 132/2208 [00:08<01:45, 19.72it/s][A
Epoch 8/10:   6%|▌         | 135/2208 [00:08<01:43, 20.10it/s][A
Epoch 8/10:   6%|▋         | 138/2208 [00:09<01:42, 20.22it/s][A
Epoch 8/10:   6%|▋         | 141/2208 [00:09<01:40, 20.63it/s][A
Epoch 8/10:   7%|▋         | 144/2208 [00:09<01:39, 20.77it/s][A
Epoch 8/10:   7%|▋         | 147/2208 [00:09<01:37, 21.10it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:   7%|▋         | 153/2208 [00:09<01:43, 19.88it/s][A

Batch 150: Training loss = 0.1398, Training accuracy = 0.9537, F1 = 0.9537



Epoch 8/10:   7%|▋         | 156/2208 [00:09<01:41, 20.28it/s][A
Epoch 8/10:   7%|▋         | 159/2208 [00:10<01:39, 20.69it/s][A
Epoch 8/10:   7%|▋         | 162/2208 [00:10<01:41, 20.22it/s][A
Epoch 8/10:   7%|▋         | 165/2208 [00:10<01:39, 20.47it/s][A
Epoch 8/10:   8%|▊         | 168/2208 [00:10<01:40, 20.22it/s][A
Epoch 8/10:   8%|▊         | 171/2208 [00:10<01:42, 19.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:   8%|▊         | 177/2208 [00:11<01:47, 18.87it/s][A
Epoch 8/10:   8%|▊         | 180/2208 [00:11<01:44, 19.33it/s][A

Batch 175: Training loss = 0.0742, Training accuracy = 0.9533, F1 = 0.9532



Epoch 8/10:   8%|▊         | 183/2208 [00:11<01:42, 19.81it/s][A
Epoch 8/10:   8%|▊         | 185/2208 [00:11<01:42, 19.72it/s][A
Epoch 8/10:   8%|▊         | 187/2208 [00:11<01:47, 18.72it/s][A
Epoch 8/10:   9%|▊         | 189/2208 [00:11<01:47, 18.84it/s][A
Epoch 8/10:   9%|▊         | 192/2208 [00:11<01:43, 19.52it/s][A
Epoch 8/10:   9%|▉         | 194/2208 [00:11<01:43, 19.38it/s][A
Epoch 8/10:   9%|▉         | 196/2208 [00:11<01:43, 19.51it/s][A
Epoch 8/10:   9%|▉         | 198/2208 [00:12<01:43, 19.37it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:   9%|▉         | 204/2208 [00:12<01:45, 19.02it/s][A

Batch 200: Training loss = 0.0932, Training accuracy = 0.9535, F1 = 0.9535



Epoch 8/10:   9%|▉         | 206/2208 [00:12<01:45, 18.97it/s][A
Epoch 8/10:   9%|▉         | 209/2208 [00:12<01:41, 19.77it/s][A
Epoch 8/10:  10%|▉         | 211/2208 [00:12<01:44, 19.17it/s][A
Epoch 8/10:  10%|▉         | 214/2208 [00:12<01:43, 19.34it/s][A
Epoch 8/10:  10%|▉         | 217/2208 [00:13<01:40, 19.84it/s][A
Epoch 8/10:  10%|▉         | 219/2208 [00:13<01:45, 18.87it/s][A
Epoch 8/10:  10%|█         | 222/2208 [00:13<01:57, 16.97it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  10%|█         | 227/2208 [00:13<02:07, 15.51it/s][A
Epoch 8/10:  10%|█         | 230/2208 [00:13<01:55, 17.06it/s][A

Batch 225: Training loss = 0.2029, Training accuracy = 0.9539, F1 = 0.9539



Epoch 8/10:  11%|█         | 233/2208 [00:14<01:48, 18.15it/s][A
Epoch 8/10:  11%|█         | 236/2208 [00:14<01:43, 19.00it/s][A
Epoch 8/10:  11%|█         | 238/2208 [00:14<01:44, 18.85it/s][A
Epoch 8/10:  11%|█         | 241/2208 [00:14<01:40, 19.62it/s][A
Epoch 8/10:  11%|█         | 243/2208 [00:14<01:46, 18.43it/s][A
Epoch 8/10:  11%|█         | 246/2208 [00:14<01:43, 18.99it/s][A
Epoch 8/10:  11%|█▏        | 249/2208 [00:14<01:40, 19.53it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  12%|█▏        | 254/2208 [00:15<01:45, 18.44it/s][A

Batch 250: Training loss = 0.1629, Training accuracy = 0.9537, F1 = 0.9537



Epoch 8/10:  12%|█▏        | 257/2208 [00:15<01:40, 19.40it/s][A
Epoch 8/10:  12%|█▏        | 260/2208 [00:15<01:37, 19.92it/s][A
Epoch 8/10:  12%|█▏        | 263/2208 [00:15<01:35, 20.31it/s][A
Epoch 8/10:  12%|█▏        | 266/2208 [00:15<01:35, 20.42it/s][A
Epoch 8/10:  12%|█▏        | 269/2208 [00:15<01:43, 18.77it/s][A
Epoch 8/10:  12%|█▏        | 272/2208 [00:16<01:45, 18.29it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  13%|█▎        | 277/2208 [00:16<01:56, 16.63it/s][A
Epoch 8/10:  13%|█▎        | 280/2208 [00:16<01:48, 17.76it/s][A

Batch 275: Training loss = 0.1057, Training accuracy = 0.9537, F1 = 0.9537



Epoch 8/10:  13%|█▎        | 283/2208 [00:16<01:43, 18.56it/s][A
Epoch 8/10:  13%|█▎        | 285/2208 [00:16<01:47, 17.97it/s][A
Epoch 8/10:  13%|█▎        | 287/2208 [00:16<01:48, 17.73it/s][A
Epoch 8/10:  13%|█▎        | 289/2208 [00:17<02:03, 15.52it/s][A
Epoch 8/10:  13%|█▎        | 292/2208 [00:17<01:53, 16.81it/s][A
Epoch 8/10:  13%|█▎        | 295/2208 [00:17<01:58, 16.18it/s][A
Epoch 8/10:  13%|█▎        | 298/2208 [00:17<01:48, 17.55it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  14%|█▎        | 302/2208 [00:17<02:02, 15.52it/s][A
Epoch 8/10:  14%|█▍        | 305/2208 [00:18<01:50, 17.20it/s][A

Batch 300: Training loss = 0.2019, Training accuracy = 0.9529, F1 = 0.9529



Epoch 8/10:  14%|█▍        | 308/2208 [00:18<01:43, 18.33it/s][A
Epoch 8/10:  14%|█▍        | 310/2208 [00:18<01:56, 16.25it/s][A
Epoch 8/10:  14%|█▍        | 312/2208 [00:18<01:51, 17.00it/s][A
Epoch 8/10:  14%|█▍        | 315/2208 [00:18<01:43, 18.34it/s][A
Epoch 8/10:  14%|█▍        | 318/2208 [00:18<01:38, 19.14it/s][A
Epoch 8/10:  14%|█▍        | 320/2208 [00:18<01:46, 17.77it/s][A
Epoch 8/10:  15%|█▍        | 322/2208 [00:18<01:43, 18.25it/s][A
Epoch 8/10:  15%|█▍        | 324/2208 [00:19<01:47, 17.46it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  15%|█▍        | 329/2208 [00:19<01:55, 16.26it/s][A

Batch 325: Training loss = 0.1813, Training accuracy = 0.9532, F1 = 0.9532



Epoch 8/10:  15%|█▌        | 332/2208 [00:19<01:46, 17.63it/s][A
Epoch 8/10:  15%|█▌        | 335/2208 [00:19<01:40, 18.61it/s][A
Epoch 8/10:  15%|█▌        | 337/2208 [00:19<01:39, 18.72it/s][A
Epoch 8/10:  15%|█▌        | 340/2208 [00:19<01:36, 19.30it/s][A
Epoch 8/10:  15%|█▌        | 342/2208 [00:20<01:36, 19.27it/s][A
Epoch 8/10:  16%|█▌        | 345/2208 [00:20<01:33, 19.85it/s][A
Epoch 8/10:  16%|█▌        | 347/2208 [00:20<01:41, 18.25it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  16%|█▌        | 352/2208 [00:20<01:49, 16.90it/s][A
Epoch 8/10:  16%|█▌        | 355/2208 [00:20<01:41, 18.17it/s][A

Batch 350: Training loss = 0.0780, Training accuracy = 0.9535, F1 = 0.9535



Epoch 8/10:  16%|█▌        | 358/2208 [00:20<01:37, 19.06it/s][A
Epoch 8/10:  16%|█▋        | 361/2208 [00:21<01:33, 19.73it/s][A
Epoch 8/10:  16%|█▋        | 364/2208 [00:21<01:31, 20.08it/s][A
Epoch 8/10:  17%|█▋        | 367/2208 [00:21<01:31, 20.19it/s][A
Epoch 8/10:  17%|█▋        | 370/2208 [00:21<01:30, 20.40it/s][A
Epoch 8/10:  17%|█▋        | 373/2208 [00:21<01:28, 20.76it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  17%|█▋        | 379/2208 [00:21<01:35, 19.06it/s][A

Batch 375: Training loss = 0.3377, Training accuracy = 0.9539, F1 = 0.9538



Epoch 8/10:  17%|█▋        | 382/2208 [00:22<01:33, 19.60it/s][A
Epoch 8/10:  17%|█▋        | 385/2208 [00:22<01:31, 20.00it/s][A
Epoch 8/10:  18%|█▊        | 388/2208 [00:22<01:29, 20.35it/s][A
Epoch 8/10:  18%|█▊        | 391/2208 [00:22<01:37, 18.56it/s][A
Epoch 8/10:  18%|█▊        | 393/2208 [00:22<01:38, 18.50it/s][A
Epoch 8/10:  18%|█▊        | 396/2208 [00:22<01:33, 19.28it/s][A
Epoch 8/10:  18%|█▊        | 398/2208 [00:22<01:38, 18.40it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  18%|█▊        | 404/2208 [00:23<01:40, 17.87it/s][A

Batch 400: Training loss = 0.1245, Training accuracy = 0.9538, F1 = 0.9537



Epoch 8/10:  18%|█▊        | 407/2208 [00:23<01:35, 18.93it/s][A
Epoch 8/10:  19%|█▊        | 410/2208 [00:23<01:31, 19.67it/s][A
Epoch 8/10:  19%|█▊        | 413/2208 [00:23<01:29, 20.11it/s][A
Epoch 8/10:  19%|█▉        | 416/2208 [00:23<01:27, 20.38it/s][A
Epoch 8/10:  19%|█▉        | 419/2208 [00:24<01:26, 20.59it/s][A
Epoch 8/10:  19%|█▉        | 422/2208 [00:24<01:25, 20.91it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  19%|█▉        | 428/2208 [00:24<01:42, 17.41it/s][A

Batch 425: Training loss = 0.1136, Training accuracy = 0.9535, F1 = 0.9535



Epoch 8/10:  20%|█▉        | 431/2208 [00:24<01:36, 18.48it/s][A
Epoch 8/10:  20%|█▉        | 434/2208 [00:24<01:32, 19.24it/s][A
Epoch 8/10:  20%|█▉        | 437/2208 [00:24<01:29, 19.77it/s][A
Epoch 8/10:  20%|█▉        | 440/2208 [00:25<01:27, 20.21it/s][A
Epoch 8/10:  20%|██        | 443/2208 [00:25<01:26, 20.47it/s][A
Epoch 8/10:  20%|██        | 446/2208 [00:25<01:25, 20.69it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  20%|██        | 452/2208 [00:25<01:40, 17.55it/s][A


Batch 450: Training loss = 0.1246, Training accuracy = 0.9539, F1 = 0.9538


Epoch 8/10:  21%|██        | 455/2208 [00:25<01:37, 18.07it/s][A
Epoch 8/10:  21%|██        | 458/2208 [00:26<01:33, 18.81it/s][A
Epoch 8/10:  21%|██        | 461/2208 [00:26<01:29, 19.51it/s][A
Epoch 8/10:  21%|██        | 464/2208 [00:26<01:29, 19.42it/s][A
Epoch 8/10:  21%|██        | 467/2208 [00:26<01:28, 19.78it/s][A
Epoch 8/10:  21%|██▏       | 470/2208 [00:26<01:26, 20.21it/s][A
Epoch 8/10:  21%|██▏       | 473/2208 [00:26<01:24, 20.49it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  22%|██▏       | 479/2208 [00:27<01:43, 16.73it/s][A

Batch 475: Training loss = 0.0874, Training accuracy = 0.9538, F1 = 0.9537



Epoch 8/10:  22%|██▏       | 482/2208 [00:27<01:36, 17.97it/s][A
Epoch 8/10:  22%|██▏       | 485/2208 [00:27<01:31, 18.87it/s][A
Epoch 8/10:  22%|██▏       | 488/2208 [00:27<01:28, 19.50it/s][A
Epoch 8/10:  22%|██▏       | 491/2208 [00:27<01:26, 19.88it/s][A
Epoch 8/10:  22%|██▏       | 494/2208 [00:27<01:24, 20.27it/s][A
Epoch 8/10:  23%|██▎       | 497/2208 [00:28<01:23, 20.58it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  23%|██▎       | 503/2208 [00:28<01:41, 16.79it/s][A

Batch 500: Training loss = 0.0840, Training accuracy = 0.9541, F1 = 0.9540



Epoch 8/10:  23%|██▎       | 506/2208 [00:28<01:34, 17.98it/s][A
Epoch 8/10:  23%|██▎       | 509/2208 [00:28<01:30, 18.87it/s][A
Epoch 8/10:  23%|██▎       | 512/2208 [00:28<01:26, 19.50it/s][A
Epoch 8/10:  23%|██▎       | 515/2208 [00:29<01:24, 19.93it/s][A
Epoch 8/10:  23%|██▎       | 518/2208 [00:29<01:23, 20.32it/s][A
Epoch 8/10:  24%|██▎       | 521/2208 [00:29<01:21, 20.67it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  24%|██▍       | 527/2208 [00:29<01:36, 17.46it/s][A
Epoch 8/10:  24%|██▍       | 530/2208 [00:29<01:30, 18.50it/s][A

Batch 525: Training loss = 0.1141, Training accuracy = 0.9539, F1 = 0.9539



Epoch 8/10:  24%|██▍       | 533/2208 [00:30<01:26, 19.26it/s][A
Epoch 8/10:  24%|██▍       | 536/2208 [00:30<01:24, 19.77it/s][A
Epoch 8/10:  24%|██▍       | 539/2208 [00:30<01:22, 20.19it/s][A
Epoch 8/10:  25%|██▍       | 542/2208 [00:30<01:21, 20.44it/s][A
Epoch 8/10:  25%|██▍       | 545/2208 [00:30<01:21, 20.49it/s][A
Epoch 8/10:  25%|██▍       | 548/2208 [00:30<01:20, 20.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  25%|██▌       | 554/2208 [00:31<01:41, 16.23it/s][A

Batch 550: Training loss = 0.2639, Training accuracy = 0.9543, F1 = 0.9542



Epoch 8/10:  25%|██▌       | 557/2208 [00:31<01:34, 17.50it/s][A
Epoch 8/10:  25%|██▌       | 559/2208 [00:31<01:31, 17.98it/s][A
Epoch 8/10:  25%|██▌       | 562/2208 [00:31<01:27, 18.86it/s][A
Epoch 8/10:  26%|██▌       | 565/2208 [00:31<01:24, 19.53it/s][A
Epoch 8/10:  26%|██▌       | 568/2208 [00:31<01:27, 18.82it/s][A
Epoch 8/10:  26%|██▌       | 571/2208 [00:32<01:24, 19.33it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  26%|██▌       | 577/2208 [00:32<01:48, 15.02it/s][A
Epoch 8/10:  26%|██▋       | 580/2208 [00:32<01:38, 16.47it/s][A

Batch 575: Training loss = 0.1811, Training accuracy = 0.9543, F1 = 0.9543



Epoch 8/10:  26%|██▋       | 583/2208 [00:32<01:32, 17.64it/s][A
Epoch 8/10:  27%|██▋       | 586/2208 [00:32<01:27, 18.51it/s][A
Epoch 8/10:  27%|██▋       | 589/2208 [00:33<01:24, 19.14it/s][A
Epoch 8/10:  27%|██▋       | 592/2208 [00:33<01:21, 19.82it/s][A
Epoch 8/10:  27%|██▋       | 595/2208 [00:33<01:21, 19.90it/s][A
Epoch 8/10:  27%|██▋       | 598/2208 [00:33<01:19, 20.14it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  27%|██▋       | 604/2208 [00:33<01:37, 16.48it/s][A

Batch 600: Training loss = 0.1358, Training accuracy = 0.9544, F1 = 0.9544



Epoch 8/10:  27%|██▋       | 607/2208 [00:34<01:30, 17.73it/s][A
Epoch 8/10:  28%|██▊       | 610/2208 [00:34<01:25, 18.59it/s][A
Epoch 8/10:  28%|██▊       | 613/2208 [00:34<01:22, 19.35it/s][A
Epoch 8/10:  28%|██▊       | 616/2208 [00:34<01:30, 17.52it/s][A
Epoch 8/10:  28%|██▊       | 619/2208 [00:34<01:26, 18.33it/s][A
Epoch 8/10:  28%|██▊       | 622/2208 [00:34<01:23, 19.02it/s][A
Epoch 8/10:  28%|██▊       | 624/2208 [00:35<01:28, 17.91it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  28%|██▊       | 629/2208 [00:35<01:35, 16.54it/s][A

Batch 625: Training loss = 0.0802, Training accuracy = 0.9544, F1 = 0.9544



Epoch 8/10:  29%|██▊       | 632/2208 [00:35<01:28, 17.85it/s][A
Epoch 8/10:  29%|██▉       | 635/2208 [00:35<01:23, 18.87it/s][A
Epoch 8/10:  29%|██▉       | 638/2208 [00:35<01:20, 19.58it/s][A
Epoch 8/10:  29%|██▉       | 641/2208 [00:35<01:17, 20.14it/s][A
Epoch 8/10:  29%|██▉       | 644/2208 [00:36<01:16, 20.37it/s][A
Epoch 8/10:  29%|██▉       | 647/2208 [00:36<01:15, 20.54it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  30%|██▉       | 653/2208 [00:36<01:37, 15.95it/s][A

Batch 650: Training loss = 0.1583, Training accuracy = 0.9543, F1 = 0.9542



Epoch 8/10:  30%|██▉       | 656/2208 [00:36<01:29, 17.27it/s][A
Epoch 8/10:  30%|██▉       | 659/2208 [00:36<01:24, 18.25it/s][A
Epoch 8/10:  30%|██▉       | 662/2208 [00:37<01:20, 19.10it/s][A
Epoch 8/10:  30%|███       | 665/2208 [00:37<01:18, 19.68it/s][A
Epoch 8/10:  30%|███       | 668/2208 [00:37<01:20, 19.16it/s][A
Epoch 8/10:  30%|███       | 671/2208 [00:37<01:17, 19.84it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  31%|███       | 677/2208 [00:37<01:32, 16.50it/s][A
Epoch 8/10:  31%|███       | 680/2208 [00:38<01:26, 17.75it/s][A

Batch 675: Training loss = 0.1827, Training accuracy = 0.9544, F1 = 0.9544



Epoch 8/10:  31%|███       | 683/2208 [00:38<01:21, 18.71it/s][A
Epoch 8/10:  31%|███       | 686/2208 [00:38<01:18, 19.40it/s][A
Epoch 8/10:  31%|███       | 689/2208 [00:38<01:16, 19.83it/s][A
Epoch 8/10:  31%|███▏      | 692/2208 [00:38<01:15, 20.12it/s][A
Epoch 8/10:  31%|███▏      | 695/2208 [00:38<01:13, 20.54it/s][A
Epoch 8/10:  32%|███▏      | 698/2208 [00:38<01:12, 20.77it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  32%|███▏      | 704/2208 [00:39<01:25, 17.58it/s][A

Batch 700: Training loss = 0.1279, Training accuracy = 0.9544, F1 = 0.9544



Epoch 8/10:  32%|███▏      | 707/2208 [00:39<01:20, 18.58it/s][A
Epoch 8/10:  32%|███▏      | 710/2208 [00:39<01:17, 19.31it/s][A
Epoch 8/10:  32%|███▏      | 713/2208 [00:39<01:15, 19.89it/s][A
Epoch 8/10:  32%|███▏      | 716/2208 [00:39<01:13, 20.31it/s][A
Epoch 8/10:  33%|███▎      | 719/2208 [00:40<01:12, 20.61it/s][A
Epoch 8/10:  33%|███▎      | 722/2208 [00:40<01:11, 20.69it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  33%|███▎      | 728/2208 [00:40<01:32, 16.06it/s][A

Batch 725: Training loss = 0.1594, Training accuracy = 0.9543, F1 = 0.9543



Epoch 8/10:  33%|███▎      | 731/2208 [00:40<01:25, 17.25it/s][A
Epoch 8/10:  33%|███▎      | 734/2208 [00:40<01:20, 18.35it/s][A
Epoch 8/10:  33%|███▎      | 737/2208 [00:41<01:16, 19.12it/s][A
Epoch 8/10:  34%|███▎      | 740/2208 [00:41<01:14, 19.74it/s][A
Epoch 8/10:  34%|███▎      | 743/2208 [00:41<01:12, 20.11it/s][A
Epoch 8/10:  34%|███▍      | 746/2208 [00:41<01:11, 20.42it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  34%|███▍      | 752/2208 [00:41<01:31, 15.99it/s][A
Epoch 8/10:  34%|███▍      | 755/2208 [00:42<01:23, 17.32it/s][A

Batch 750: Training loss = 0.1464, Training accuracy = 0.9543, F1 = 0.9543



Epoch 8/10:  34%|███▍      | 758/2208 [00:42<01:18, 18.44it/s][A
Epoch 8/10:  34%|███▍      | 761/2208 [00:42<01:15, 19.23it/s][A
Epoch 8/10:  35%|███▍      | 764/2208 [00:42<01:19, 18.22it/s][A
Epoch 8/10:  35%|███▍      | 767/2208 [00:42<01:17, 18.56it/s][A
Epoch 8/10:  35%|███▍      | 770/2208 [00:42<01:14, 19.34it/s][A
Epoch 8/10:  35%|███▌      | 773/2208 [00:42<01:12, 19.89it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  35%|███▌      | 779/2208 [00:43<01:30, 15.79it/s][A

Batch 775: Training loss = 0.1468, Training accuracy = 0.9543, F1 = 0.9542



Epoch 8/10:  35%|███▌      | 782/2208 [00:43<01:23, 17.10it/s][A
Epoch 8/10:  36%|███▌      | 785/2208 [00:43<01:18, 18.24it/s][A
Epoch 8/10:  36%|███▌      | 788/2208 [00:43<01:14, 19.02it/s][A
Epoch 8/10:  36%|███▌      | 791/2208 [00:43<01:12, 19.58it/s][A
Epoch 8/10:  36%|███▌      | 794/2208 [00:44<01:10, 20.00it/s][A
Epoch 8/10:  36%|███▌      | 797/2208 [00:44<01:09, 20.43it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  36%|███▋      | 803/2208 [00:44<01:35, 14.68it/s][A

Batch 800: Training loss = 0.1338, Training accuracy = 0.9544, F1 = 0.9543



Epoch 8/10:  37%|███▋      | 806/2208 [00:44<01:26, 16.29it/s][A
Epoch 8/10:  37%|███▋      | 809/2208 [00:45<01:19, 17.56it/s][A
Epoch 8/10:  37%|███▋      | 812/2208 [00:45<01:15, 18.50it/s][A
Epoch 8/10:  37%|███▋      | 815/2208 [00:45<01:12, 19.16it/s][A
Epoch 8/10:  37%|███▋      | 818/2208 [00:45<01:10, 19.70it/s][A
Epoch 8/10:  37%|███▋      | 821/2208 [00:45<01:09, 20.04it/s][A
Epoch 8/10:  37%|███▋      | 824/2208 [00:45<01:12, 19.20it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  38%|███▊      | 829/2208 [00:46<01:34, 14.58it/s][A

Batch 825: Training loss = 0.0959, Training accuracy = 0.9544, F1 = 0.9543



Epoch 8/10:  38%|███▊      | 832/2208 [00:46<01:24, 16.19it/s][A
Epoch 8/10:  38%|███▊      | 835/2208 [00:46<01:18, 17.48it/s][A
Epoch 8/10:  38%|███▊      | 838/2208 [00:46<01:14, 18.49it/s][A
Epoch 8/10:  38%|███▊      | 841/2208 [00:46<01:10, 19.32it/s][A
Epoch 8/10:  38%|███▊      | 844/2208 [00:47<01:16, 17.71it/s][A
Epoch 8/10:  38%|███▊      | 847/2208 [00:47<01:13, 18.64it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  39%|███▊      | 853/2208 [00:47<01:36, 14.07it/s][A

Batch 850: Training loss = 0.0726, Training accuracy = 0.9545, F1 = 0.9545



Epoch 8/10:  39%|███▉      | 856/2208 [00:47<01:26, 15.66it/s][A
Epoch 8/10:  39%|███▉      | 859/2208 [00:47<01:19, 17.05it/s][A
Epoch 8/10:  39%|███▉      | 862/2208 [00:48<01:14, 18.15it/s][A
Epoch 8/10:  39%|███▉      | 864/2208 [00:48<01:12, 18.52it/s][A
Epoch 8/10:  39%|███▉      | 867/2208 [00:48<01:09, 19.18it/s][A
Epoch 8/10:  39%|███▉      | 870/2208 [00:48<01:12, 18.35it/s][A
Epoch 8/10:  40%|███▉      | 873/2208 [00:48<01:13, 18.22it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  40%|███▉      | 879/2208 [00:49<01:23, 15.85it/s][A

Batch 875: Training loss = 0.0827, Training accuracy = 0.9546, F1 = 0.9546



Epoch 8/10:  40%|███▉      | 882/2208 [00:49<01:17, 17.12it/s][A
Epoch 8/10:  40%|████      | 885/2208 [00:49<01:12, 18.20it/s][A
Epoch 8/10:  40%|████      | 888/2208 [00:49<01:09, 18.97it/s][A
Epoch 8/10:  40%|████      | 891/2208 [00:49<01:07, 19.49it/s][A
Epoch 8/10:  40%|████      | 894/2208 [00:49<01:09, 19.01it/s][A
Epoch 8/10:  41%|████      | 896/2208 [00:50<01:18, 16.80it/s][A
Epoch 8/10:  41%|████      | 899/2208 [00:50<01:12, 17.94it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  41%|████      | 904/2208 [00:50<01:26, 15.06it/s][A

Batch 900: Training loss = 0.1573, Training accuracy = 0.9547, F1 = 0.9547



Epoch 8/10:  41%|████      | 907/2208 [00:50<01:17, 16.72it/s][A
Epoch 8/10:  41%|████      | 910/2208 [00:50<01:12, 17.95it/s][A
Epoch 8/10:  41%|████▏     | 913/2208 [00:51<01:09, 18.73it/s][A
Epoch 8/10:  41%|████▏     | 916/2208 [00:51<01:06, 19.39it/s][A
Epoch 8/10:  42%|████▏     | 919/2208 [00:51<01:04, 19.91it/s][A
Epoch 8/10:  42%|████▏     | 922/2208 [00:51<01:03, 20.19it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  42%|████▏     | 928/2208 [00:51<01:25, 14.98it/s][A

Batch 925: Training loss = 0.2015, Training accuracy = 0.9548, F1 = 0.9547



Epoch 8/10:  42%|████▏     | 931/2208 [00:52<01:17, 16.52it/s][A
Epoch 8/10:  42%|████▏     | 934/2208 [00:52<01:11, 17.75it/s][A
Epoch 8/10:  42%|████▏     | 937/2208 [00:52<01:07, 18.76it/s][A
Epoch 8/10:  43%|████▎     | 940/2208 [00:52<01:05, 19.30it/s][A
Epoch 8/10:  43%|████▎     | 943/2208 [00:52<01:03, 19.87it/s][A
Epoch 8/10:  43%|████▎     | 946/2208 [00:52<01:02, 20.25it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  43%|████▎     | 952/2208 [00:53<01:23, 14.96it/s][A
Epoch 8/10:  43%|████▎     | 955/2208 [00:53<01:15, 16.55it/s][A

Batch 950: Training loss = 0.1232, Training accuracy = 0.9548, F1 = 0.9547



Epoch 8/10:  43%|████▎     | 958/2208 [00:53<01:10, 17.71it/s][A
Epoch 8/10:  44%|████▎     | 961/2208 [00:53<01:07, 18.55it/s][A
Epoch 8/10:  44%|████▎     | 964/2208 [00:53<01:04, 19.31it/s][A
Epoch 8/10:  44%|████▍     | 967/2208 [00:53<01:02, 19.89it/s][A
Epoch 8/10:  44%|████▍     | 970/2208 [00:54<01:01, 20.18it/s][A
Epoch 8/10:  44%|████▍     | 973/2208 [00:54<01:00, 20.41it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  44%|████▍     | 979/2208 [00:54<01:14, 16.42it/s][A

Batch 975: Training loss = 0.1264, Training accuracy = 0.9548, F1 = 0.9548



Epoch 8/10:  44%|████▍     | 982/2208 [00:54<01:09, 17.76it/s][A
Epoch 8/10:  45%|████▍     | 985/2208 [00:54<01:05, 18.67it/s][A
Epoch 8/10:  45%|████▍     | 988/2208 [00:55<01:02, 19.37it/s][A
Epoch 8/10:  45%|████▍     | 991/2208 [00:55<01:00, 19.97it/s][A
Epoch 8/10:  45%|████▌     | 994/2208 [00:55<00:59, 20.40it/s][A
Epoch 8/10:  45%|████▌     | 997/2208 [00:55<00:58, 20.68it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  45%|████▌     | 1003/2208 [00:56<01:23, 14.45it/s][A

Batch 1000: Training loss = 0.1782, Training accuracy = 0.9549, F1 = 0.9548



Epoch 8/10:  46%|████▌     | 1006/2208 [00:56<01:15, 16.00it/s][A
Epoch 8/10:  46%|████▌     | 1009/2208 [00:56<01:09, 17.34it/s][A
Epoch 8/10:  46%|████▌     | 1012/2208 [00:56<01:05, 18.31it/s][A
Epoch 8/10:  46%|████▌     | 1015/2208 [00:56<01:02, 19.08it/s][A
Epoch 8/10:  46%|████▌     | 1018/2208 [00:56<01:00, 19.79it/s][A
Epoch 8/10:  46%|████▌     | 1021/2208 [00:56<00:58, 20.17it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  47%|████▋     | 1027/2208 [00:57<01:19, 14.94it/s][A
Epoch 8/10:  47%|████▋     | 1030/2208 [00:57<01:11, 16.42it/s][A

Batch 1025: Training loss = 0.0981, Training accuracy = 0.9550, F1 = 0.9550



Epoch 8/10:  47%|████▋     | 1033/2208 [00:57<01:06, 17.63it/s][A
Epoch 8/10:  47%|████▋     | 1035/2208 [00:57<01:04, 18.07it/s][A
Epoch 8/10:  47%|████▋     | 1038/2208 [00:57<01:01, 19.02it/s][A
Epoch 8/10:  47%|████▋     | 1041/2208 [00:57<00:58, 19.78it/s][A
Epoch 8/10:  47%|████▋     | 1044/2208 [00:58<00:57, 20.27it/s][A
Epoch 8/10:  47%|████▋     | 1047/2208 [00:58<00:56, 20.45it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  48%|████▊     | 1053/2208 [00:58<01:20, 14.33it/s][A

Batch 1050: Training loss = 0.1251, Training accuracy = 0.9550, F1 = 0.9550



Epoch 8/10:  48%|████▊     | 1056/2208 [00:58<01:12, 15.95it/s][A
Epoch 8/10:  48%|████▊     | 1058/2208 [00:59<01:08, 16.70it/s][A
Epoch 8/10:  48%|████▊     | 1061/2208 [00:59<01:03, 18.01it/s][A
Epoch 8/10:  48%|████▊     | 1064/2208 [00:59<01:00, 18.91it/s][A
Epoch 8/10:  48%|████▊     | 1067/2208 [00:59<00:57, 19.68it/s][A
Epoch 8/10:  48%|████▊     | 1070/2208 [00:59<00:56, 20.03it/s][A
Epoch 8/10:  49%|████▊     | 1073/2208 [00:59<00:55, 20.37it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  49%|████▉     | 1079/2208 [01:00<01:12, 15.50it/s][A

Batch 1075: Training loss = 0.0806, Training accuracy = 0.9550, F1 = 0.9550



Epoch 8/10:  49%|████▉     | 1082/2208 [01:00<01:06, 16.82it/s][A
Epoch 8/10:  49%|████▉     | 1085/2208 [01:00<01:02, 18.00it/s][A
Epoch 8/10:  49%|████▉     | 1088/2208 [01:00<00:59, 18.95it/s][A
Epoch 8/10:  49%|████▉     | 1091/2208 [01:00<00:57, 19.41it/s][A
Epoch 8/10:  50%|████▉     | 1094/2208 [01:00<00:57, 19.44it/s][A
Epoch 8/10:  50%|████▉     | 1097/2208 [01:01<00:55, 19.88it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  50%|████▉     | 1103/2208 [01:01<01:22, 13.47it/s][A

Batch 1100: Training loss = 0.1078, Training accuracy = 0.9552, F1 = 0.9551



Epoch 8/10:  50%|█████     | 1106/2208 [01:01<01:12, 15.13it/s][A
Epoch 8/10:  50%|█████     | 1108/2208 [01:01<01:08, 15.97it/s][A
Epoch 8/10:  50%|█████     | 1110/2208 [01:01<01:05, 16.75it/s][A
Epoch 8/10:  50%|█████     | 1113/2208 [01:02<01:00, 18.11it/s][A
Epoch 8/10:  51%|█████     | 1116/2208 [01:02<00:59, 18.38it/s][A
Epoch 8/10:  51%|█████     | 1119/2208 [01:02<00:56, 19.12it/s][A
Epoch 8/10:  51%|█████     | 1122/2208 [01:02<00:55, 19.74it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  51%|█████     | 1127/2208 [01:03<01:32, 11.74it/s][A
Epoch 8/10:  51%|█████     | 1130/2208 [01:03<01:17, 13.85it/s][A

Batch 1125: Training loss = 0.0982, Training accuracy = 0.9552, F1 = 0.9552



Epoch 8/10:  51%|█████▏    | 1133/2208 [01:03<01:09, 15.54it/s][A
Epoch 8/10:  51%|█████▏    | 1136/2208 [01:03<01:02, 17.04it/s][A
Epoch 8/10:  52%|█████▏    | 1139/2208 [01:03<00:58, 18.16it/s][A
Epoch 8/10:  52%|█████▏    | 1142/2208 [01:03<00:56, 18.86it/s][A
Epoch 8/10:  52%|█████▏    | 1145/2208 [01:03<00:54, 19.42it/s][A
Epoch 8/10:  52%|█████▏    | 1148/2208 [01:04<00:55, 18.98it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  52%|█████▏    | 1154/2208 [01:04<01:10, 15.05it/s][A

Batch 1150: Training loss = 0.0515, Training accuracy = 0.9553, F1 = 0.9553



Epoch 8/10:  52%|█████▏    | 1157/2208 [01:04<01:03, 16.55it/s][A
Epoch 8/10:  53%|█████▎    | 1160/2208 [01:04<00:59, 17.66it/s][A
Epoch 8/10:  53%|█████▎    | 1163/2208 [01:05<00:55, 18.68it/s][A
Epoch 8/10:  53%|█████▎    | 1166/2208 [01:05<00:53, 19.42it/s][A
Epoch 8/10:  53%|█████▎    | 1169/2208 [01:05<00:52, 19.89it/s][A
Epoch 8/10:  53%|█████▎    | 1172/2208 [01:05<00:51, 20.21it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  53%|█████▎    | 1178/2208 [01:06<01:12, 14.18it/s][A

Batch 1175: Training loss = 0.1465, Training accuracy = 0.9553, F1 = 0.9552



Epoch 8/10:  53%|█████▎    | 1181/2208 [01:06<01:04, 15.84it/s][A
Epoch 8/10:  54%|█████▎    | 1184/2208 [01:06<00:59, 17.23it/s][A
Epoch 8/10:  54%|█████▍    | 1187/2208 [01:06<00:56, 18.16it/s][A
Epoch 8/10:  54%|█████▍    | 1190/2208 [01:06<00:53, 19.00it/s][A
Epoch 8/10:  54%|█████▍    | 1193/2208 [01:06<00:51, 19.74it/s][A
Epoch 8/10:  54%|█████▍    | 1196/2208 [01:06<00:50, 20.23it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  54%|█████▍    | 1202/2208 [01:07<01:13, 13.70it/s][A
Epoch 8/10:  55%|█████▍    | 1205/2208 [01:07<01:05, 15.41it/s][A

Batch 1200: Training loss = 0.1230, Training accuracy = 0.9552, F1 = 0.9552



Epoch 8/10:  55%|█████▍    | 1208/2208 [01:07<00:59, 16.87it/s][A
Epoch 8/10:  55%|█████▍    | 1211/2208 [01:07<00:55, 17.91it/s][A
Epoch 8/10:  55%|█████▍    | 1214/2208 [01:07<00:52, 18.84it/s][A
Epoch 8/10:  55%|█████▌    | 1217/2208 [01:08<00:50, 19.53it/s][A
Epoch 8/10:  55%|█████▌    | 1220/2208 [01:08<00:49, 20.03it/s][A
Epoch 8/10:  55%|█████▌    | 1223/2208 [01:08<00:48, 20.42it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  56%|█████▌    | 1229/2208 [01:08<01:02, 15.71it/s][A

Batch 1225: Training loss = 0.1215, Training accuracy = 0.9551, F1 = 0.9551



Epoch 8/10:  56%|█████▌    | 1232/2208 [01:09<00:57, 17.10it/s][A
Epoch 8/10:  56%|█████▌    | 1235/2208 [01:09<00:53, 18.05it/s][A
Epoch 8/10:  56%|█████▌    | 1238/2208 [01:09<00:51, 18.92it/s][A
Epoch 8/10:  56%|█████▌    | 1241/2208 [01:09<00:49, 19.66it/s][A
Epoch 8/10:  56%|█████▋    | 1244/2208 [01:09<00:48, 19.94it/s][A
Epoch 8/10:  56%|█████▋    | 1247/2208 [01:09<00:47, 20.31it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  57%|█████▋    | 1253/2208 [01:10<01:10, 13.63it/s][A

Batch 1250: Training loss = 0.1169, Training accuracy = 0.9552, F1 = 0.9552



Epoch 8/10:  57%|█████▋    | 1256/2208 [01:10<01:02, 15.31it/s][A
Epoch 8/10:  57%|█████▋    | 1259/2208 [01:10<00:57, 16.63it/s][A
Epoch 8/10:  57%|█████▋    | 1262/2208 [01:10<00:53, 17.78it/s][A
Epoch 8/10:  57%|█████▋    | 1265/2208 [01:10<00:50, 18.72it/s][A
Epoch 8/10:  57%|█████▋    | 1268/2208 [01:10<00:48, 19.47it/s][A
Epoch 8/10:  58%|█████▊    | 1271/2208 [01:11<00:47, 19.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  58%|█████▊    | 1277/2208 [01:11<01:08, 13.66it/s][A
Epoch 8/10:  58%|█████▊    | 1280/2208 [01:11<01:00, 15.39it/s][A

Batch 1275: Training loss = 0.1641, Training accuracy = 0.9551, F1 = 0.9551



Epoch 8/10:  58%|█████▊    | 1283/2208 [01:11<00:55, 16.73it/s][A
Epoch 8/10:  58%|█████▊    | 1286/2208 [01:12<00:51, 17.86it/s][A
Epoch 8/10:  58%|█████▊    | 1289/2208 [01:12<00:49, 18.67it/s][A
Epoch 8/10:  59%|█████▊    | 1292/2208 [01:12<00:47, 19.31it/s][A
Epoch 8/10:  59%|█████▊    | 1295/2208 [01:12<00:46, 19.82it/s][A
Epoch 8/10:  59%|█████▉    | 1298/2208 [01:12<00:45, 20.17it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  59%|█████▉    | 1304/2208 [01:13<01:00, 14.92it/s][A

Batch 1300: Training loss = 0.1905, Training accuracy = 0.9551, F1 = 0.9550



Epoch 8/10:  59%|█████▉    | 1307/2208 [01:13<00:55, 16.35it/s][A
Epoch 8/10:  59%|█████▉    | 1310/2208 [01:13<00:51, 17.51it/s][A
Epoch 8/10:  59%|█████▉    | 1313/2208 [01:13<00:48, 18.61it/s][A
Epoch 8/10:  60%|█████▉    | 1316/2208 [01:13<00:46, 19.30it/s][A
Epoch 8/10:  60%|█████▉    | 1319/2208 [01:13<00:44, 19.85it/s][A
Epoch 8/10:  60%|█████▉    | 1322/2208 [01:14<00:43, 20.27it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  60%|██████    | 1328/2208 [01:14<01:04, 13.61it/s][A

Batch 1325: Training loss = 0.1186, Training accuracy = 0.9551, F1 = 0.9551



Epoch 8/10:  60%|██████    | 1331/2208 [01:14<00:57, 15.25it/s][A
Epoch 8/10:  60%|██████    | 1334/2208 [01:14<00:52, 16.72it/s][A
Epoch 8/10:  61%|██████    | 1337/2208 [01:14<00:49, 17.76it/s][A
Epoch 8/10:  61%|██████    | 1339/2208 [01:15<00:47, 18.21it/s][A
Epoch 8/10:  61%|██████    | 1341/2208 [01:15<00:54, 15.95it/s][A
Epoch 8/10:  61%|██████    | 1344/2208 [01:15<00:49, 17.44it/s][A
Epoch 8/10:  61%|██████    | 1346/2208 [01:15<00:48, 17.67it/s][A
Epoch 8/10:  61%|██████    | 1349/2208 [01:15<00:49, 17.30it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  61%|██████▏   | 1354/2208 [01:16<01:02, 13.59it/s][A

Batch 1350: Training loss = 0.2237, Training accuracy = 0.9551, F1 = 0.9551



Epoch 8/10:  61%|██████▏   | 1357/2208 [01:16<00:55, 15.40it/s][A
Epoch 8/10:  62%|██████▏   | 1360/2208 [01:16<00:50, 16.77it/s][A
Epoch 8/10:  62%|██████▏   | 1363/2208 [01:16<00:47, 17.97it/s][A
Epoch 8/10:  62%|██████▏   | 1366/2208 [01:16<00:44, 18.96it/s][A
Epoch 8/10:  62%|██████▏   | 1369/2208 [01:16<00:42, 19.56it/s][A
Epoch 8/10:  62%|██████▏   | 1372/2208 [01:17<00:47, 17.43it/s][A
Epoch 8/10:  62%|██████▏   | 1374/2208 [01:17<00:48, 17.15it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  62%|██████▏   | 1379/2208 [01:17<01:05, 12.61it/s][A

Batch 1375: Training loss = 0.0699, Training accuracy = 0.9552, F1 = 0.9551



Epoch 8/10:  63%|██████▎   | 1382/2208 [01:17<00:56, 14.61it/s][A
Epoch 8/10:  63%|██████▎   | 1385/2208 [01:18<00:50, 16.22it/s][A
Epoch 8/10:  63%|██████▎   | 1388/2208 [01:18<00:46, 17.53it/s][A
Epoch 8/10:  63%|██████▎   | 1390/2208 [01:18<00:46, 17.56it/s][A
Epoch 8/10:  63%|██████▎   | 1393/2208 [01:18<00:48, 16.88it/s][A
Epoch 8/10:  63%|██████▎   | 1396/2208 [01:18<00:44, 18.05it/s][A
Epoch 8/10:  63%|██████▎   | 1398/2208 [01:18<00:49, 16.34it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  63%|██████▎   | 1402/2208 [01:19<01:14, 10.75it/s][A
Epoch 8/10:  64%|██████▎   | 1405/2208 [01:19<01:00, 13.17it/s][A

Batch 1400: Training loss = 0.1079, Training accuracy = 0.9552, F1 = 0.9552



Epoch 8/10:  64%|██████▍   | 1408/2208 [01:19<00:52, 15.16it/s][A
Epoch 8/10:  64%|██████▍   | 1411/2208 [01:19<00:47, 16.68it/s][A
Epoch 8/10:  64%|██████▍   | 1414/2208 [01:19<00:44, 17.85it/s][A
Epoch 8/10:  64%|██████▍   | 1417/2208 [01:20<00:42, 18.70it/s][A
Epoch 8/10:  64%|██████▍   | 1420/2208 [01:20<00:40, 19.35it/s][A
Epoch 8/10:  64%|██████▍   | 1423/2208 [01:20<00:39, 19.90it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  65%|██████▍   | 1429/2208 [01:20<00:54, 14.31it/s][A

Batch 1425: Training loss = 0.0887, Training accuracy = 0.9552, F1 = 0.9552



Epoch 8/10:  65%|██████▍   | 1432/2208 [01:21<00:48, 15.94it/s][A
Epoch 8/10:  65%|██████▍   | 1435/2208 [01:21<00:44, 17.26it/s][A
Epoch 8/10:  65%|██████▌   | 1438/2208 [01:21<00:42, 18.18it/s][A
Epoch 8/10:  65%|██████▌   | 1441/2208 [01:21<00:40, 18.91it/s][A
Epoch 8/10:  65%|██████▌   | 1444/2208 [01:21<00:39, 19.56it/s][A
Epoch 8/10:  66%|██████▌   | 1447/2208 [01:21<00:37, 20.07it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  66%|██████▌   | 1453/2208 [01:22<01:00, 12.49it/s][A

Batch 1450: Training loss = 0.0946, Training accuracy = 0.9551, F1 = 0.9551



Epoch 8/10:  66%|██████▌   | 1456/2208 [01:22<00:52, 14.33it/s][A
Epoch 8/10:  66%|██████▌   | 1459/2208 [01:22<00:47, 15.90it/s][A
Epoch 8/10:  66%|██████▌   | 1462/2208 [01:22<00:43, 17.17it/s][A
Epoch 8/10:  66%|██████▋   | 1465/2208 [01:22<00:40, 18.19it/s][A
Epoch 8/10:  66%|██████▋   | 1468/2208 [01:23<00:38, 19.04it/s][A
Epoch 8/10:  67%|██████▋   | 1471/2208 [01:23<00:37, 19.43it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  67%|██████▋   | 1477/2208 [01:23<00:58, 12.43it/s][A
Epoch 8/10:  67%|██████▋   | 1480/2208 [01:23<00:51, 14.23it/s][A

Batch 1475: Training loss = 0.1116, Training accuracy = 0.9552, F1 = 0.9552



Epoch 8/10:  67%|██████▋   | 1483/2208 [01:24<00:45, 15.78it/s][A
Epoch 8/10:  67%|██████▋   | 1486/2208 [01:24<00:42, 17.02it/s][A
Epoch 8/10:  67%|██████▋   | 1489/2208 [01:24<00:39, 18.00it/s][A
Epoch 8/10:  68%|██████▊   | 1492/2208 [01:24<00:38, 18.80it/s][A
Epoch 8/10:  68%|██████▊   | 1495/2208 [01:24<00:36, 19.57it/s][A
Epoch 8/10:  68%|██████▊   | 1498/2208 [01:24<00:35, 20.11it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  68%|██████▊   | 1504/2208 [01:25<00:48, 14.51it/s][A

Batch 1500: Training loss = 0.1661, Training accuracy = 0.9552, F1 = 0.9552



Epoch 8/10:  68%|██████▊   | 1507/2208 [01:25<00:43, 16.11it/s][A
Epoch 8/10:  68%|██████▊   | 1510/2208 [01:25<00:40, 17.30it/s][A
Epoch 8/10:  69%|██████▊   | 1513/2208 [01:25<00:37, 18.39it/s][A
Epoch 8/10:  69%|██████▊   | 1516/2208 [01:25<00:36, 19.10it/s][A
Epoch 8/10:  69%|██████▉   | 1519/2208 [01:26<00:34, 19.69it/s][A
Epoch 8/10:  69%|██████▉   | 1522/2208 [01:26<00:34, 19.94it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  69%|██████▉   | 1528/2208 [01:26<00:54, 12.46it/s][A

Batch 1525: Training loss = 0.2112, Training accuracy = 0.9552, F1 = 0.9552



Epoch 8/10:  69%|██████▉   | 1531/2208 [01:26<00:47, 14.24it/s][A
Epoch 8/10:  69%|██████▉   | 1534/2208 [01:27<00:42, 15.84it/s][A
Epoch 8/10:  70%|██████▉   | 1537/2208 [01:27<00:39, 17.19it/s][A
Epoch 8/10:  70%|██████▉   | 1540/2208 [01:27<00:36, 18.25it/s][A
Epoch 8/10:  70%|██████▉   | 1543/2208 [01:27<00:35, 18.93it/s][A
Epoch 8/10:  70%|███████   | 1546/2208 [01:27<00:33, 19.65it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  70%|███████   | 1552/2208 [01:28<00:52, 12.46it/s][A
Epoch 8/10:  70%|███████   | 1555/2208 [01:28<00:45, 14.29it/s][A

Batch 1550: Training loss = 0.0978, Training accuracy = 0.9552, F1 = 0.9552



Epoch 8/10:  71%|███████   | 1558/2208 [01:28<00:40, 15.92it/s][A
Epoch 8/10:  71%|███████   | 1561/2208 [01:28<00:37, 17.31it/s][A
Epoch 8/10:  71%|███████   | 1564/2208 [01:28<00:35, 18.26it/s][A
Epoch 8/10:  71%|███████   | 1567/2208 [01:28<00:33, 19.00it/s][A
Epoch 8/10:  71%|███████   | 1570/2208 [01:29<00:32, 19.41it/s][A
Epoch 8/10:  71%|███████   | 1573/2208 [01:29<00:31, 19.89it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  72%|███████▏  | 1579/2208 [01:29<00:50, 12.50it/s][A

Batch 1575: Training loss = 0.1644, Training accuracy = 0.9552, F1 = 0.9552



Epoch 8/10:  72%|███████▏  | 1582/2208 [01:30<00:44, 14.20it/s][A
Epoch 8/10:  72%|███████▏  | 1585/2208 [01:30<00:39, 15.71it/s][A
Epoch 8/10:  72%|███████▏  | 1588/2208 [01:30<00:36, 17.07it/s][A
Epoch 8/10:  72%|███████▏  | 1591/2208 [01:30<00:34, 18.07it/s][A
Epoch 8/10:  72%|███████▏  | 1594/2208 [01:30<00:32, 18.78it/s][A
Epoch 8/10:  72%|███████▏  | 1597/2208 [01:30<00:34, 17.49it/s][A
Epoch 8/10:  72%|███████▏  | 1599/2208 [01:30<00:34, 17.60it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  73%|███████▎  | 1604/2208 [01:31<00:48, 12.56it/s][A

Batch 1600: Training loss = 0.0789, Training accuracy = 0.9553, F1 = 0.9553



Epoch 8/10:  73%|███████▎  | 1607/2208 [01:31<00:41, 14.52it/s][A
Epoch 8/10:  73%|███████▎  | 1610/2208 [01:31<00:37, 16.13it/s][A
Epoch 8/10:  73%|███████▎  | 1613/2208 [01:31<00:34, 17.42it/s][A
Epoch 8/10:  73%|███████▎  | 1616/2208 [01:32<00:32, 18.43it/s][A
Epoch 8/10:  73%|███████▎  | 1619/2208 [01:32<00:36, 16.10it/s][A
Epoch 8/10:  73%|███████▎  | 1622/2208 [01:32<00:34, 17.03it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  74%|███████▎  | 1627/2208 [01:33<00:53, 10.96it/s][A
Epoch 8/10:  74%|███████▍  | 1630/2208 [01:33<00:44, 13.04it/s][A

Batch 1625: Training loss = 0.0418, Training accuracy = 0.9554, F1 = 0.9553



Epoch 8/10:  74%|███████▍  | 1633/2208 [01:33<00:38, 14.81it/s][A
Epoch 8/10:  74%|███████▍  | 1636/2208 [01:33<00:34, 16.42it/s][A
Epoch 8/10:  74%|███████▍  | 1639/2208 [01:33<00:32, 17.65it/s][A
Epoch 8/10:  74%|███████▍  | 1642/2208 [01:33<00:30, 18.60it/s][A
Epoch 8/10:  75%|███████▍  | 1645/2208 [01:33<00:29, 19.21it/s][A
Epoch 8/10:  75%|███████▍  | 1648/2208 [01:34<00:28, 19.77it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  75%|███████▍  | 1654/2208 [01:34<00:39, 13.95it/s][A

Batch 1650: Training loss = 0.1265, Training accuracy = 0.9554, F1 = 0.9554



Epoch 8/10:  75%|███████▌  | 1657/2208 [01:34<00:35, 15.58it/s][A
Epoch 8/10:  75%|███████▌  | 1660/2208 [01:34<00:32, 16.86it/s][A
Epoch 8/10:  75%|███████▌  | 1663/2208 [01:35<00:30, 17.93it/s][A
Epoch 8/10:  75%|███████▌  | 1666/2208 [01:35<00:28, 18.79it/s][A
Epoch 8/10:  76%|███████▌  | 1669/2208 [01:35<00:27, 19.36it/s][A
Epoch 8/10:  76%|███████▌  | 1672/2208 [01:35<00:27, 19.17it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  76%|███████▌  | 1677/2208 [01:36<00:46, 11.38it/s][A
Epoch 8/10:  76%|███████▌  | 1680/2208 [01:36<00:39, 13.44it/s][A

Batch 1675: Training loss = 0.1523, Training accuracy = 0.9555, F1 = 0.9554



Epoch 8/10:  76%|███████▌  | 1683/2208 [01:36<00:34, 15.22it/s][A
Epoch 8/10:  76%|███████▋  | 1686/2208 [01:36<00:31, 16.66it/s][A
Epoch 8/10:  76%|███████▋  | 1689/2208 [01:36<00:29, 17.73it/s][A
Epoch 8/10:  77%|███████▋  | 1692/2208 [01:36<00:27, 18.69it/s][A
Epoch 8/10:  77%|███████▋  | 1695/2208 [01:37<00:26, 19.41it/s][A
Epoch 8/10:  77%|███████▋  | 1698/2208 [01:37<00:25, 19.86it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  77%|███████▋  | 1704/2208 [01:37<00:36, 13.93it/s][A

Batch 1700: Training loss = 0.0938, Training accuracy = 0.9556, F1 = 0.9556



Epoch 8/10:  77%|███████▋  | 1707/2208 [01:37<00:32, 15.55it/s][A
Epoch 8/10:  77%|███████▋  | 1710/2208 [01:38<00:29, 16.92it/s][A
Epoch 8/10:  78%|███████▊  | 1713/2208 [01:38<00:27, 18.04it/s][A
Epoch 8/10:  78%|███████▊  | 1716/2208 [01:38<00:26, 18.87it/s][A
Epoch 8/10:  78%|███████▊  | 1719/2208 [01:38<00:25, 19.50it/s][A
Epoch 8/10:  78%|███████▊  | 1722/2208 [01:38<00:24, 19.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  78%|███████▊  | 1728/2208 [01:39<00:41, 11.54it/s][A

Batch 1725: Training loss = 0.0883, Training accuracy = 0.9557, F1 = 0.9557



Epoch 8/10:  78%|███████▊  | 1731/2208 [01:39<00:35, 13.41it/s][A
Epoch 8/10:  79%|███████▊  | 1734/2208 [01:39<00:31, 15.11it/s][A
Epoch 8/10:  79%|███████▊  | 1737/2208 [01:39<00:28, 16.56it/s][A
Epoch 8/10:  79%|███████▉  | 1740/2208 [01:39<00:26, 17.60it/s][A
Epoch 8/10:  79%|███████▉  | 1743/2208 [01:39<00:25, 18.52it/s][A
Epoch 8/10:  79%|███████▉  | 1746/2208 [01:40<00:24, 19.20it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  79%|███████▉  | 1752/2208 [01:40<00:37, 12.07it/s][A
Epoch 8/10:  79%|███████▉  | 1755/2208 [01:40<00:32, 13.90it/s][A

Batch 1750: Training loss = 0.1231, Training accuracy = 0.9558, F1 = 0.9558



Epoch 8/10:  80%|███████▉  | 1758/2208 [01:41<00:28, 15.58it/s][A
Epoch 8/10:  80%|███████▉  | 1761/2208 [01:41<00:26, 16.95it/s][A
Epoch 8/10:  80%|███████▉  | 1764/2208 [01:41<00:24, 18.02it/s][A
Epoch 8/10:  80%|████████  | 1767/2208 [01:41<00:23, 18.90it/s][A
Epoch 8/10:  80%|████████  | 1770/2208 [01:41<00:22, 19.52it/s][A
Epoch 8/10:  80%|████████  | 1773/2208 [01:41<00:21, 19.98it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  81%|████████  | 1779/2208 [01:42<00:31, 13.72it/s][A

Batch 1775: Training loss = 0.1619, Training accuracy = 0.9558, F1 = 0.9558



Epoch 8/10:  81%|████████  | 1782/2208 [01:42<00:27, 15.42it/s][A
Epoch 8/10:  81%|████████  | 1785/2208 [01:42<00:25, 16.82it/s][A
Epoch 8/10:  81%|████████  | 1788/2208 [01:42<00:23, 18.03it/s][A
Epoch 8/10:  81%|████████  | 1791/2208 [01:42<00:22, 18.83it/s][A
Epoch 8/10:  81%|████████▏ | 1794/2208 [01:43<00:21, 19.49it/s][A
Epoch 8/10:  81%|████████▏ | 1797/2208 [01:43<00:20, 19.90it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  82%|████████▏ | 1803/2208 [01:43<00:36, 11.11it/s][A

Batch 1800: Training loss = 0.1269, Training accuracy = 0.9558, F1 = 0.9558



Epoch 8/10:  82%|████████▏ | 1806/2208 [01:44<00:31, 12.94it/s][A
Epoch 8/10:  82%|████████▏ | 1809/2208 [01:44<00:27, 14.71it/s][A
Epoch 8/10:  82%|████████▏ | 1812/2208 [01:44<00:24, 16.17it/s][A
Epoch 8/10:  82%|████████▏ | 1815/2208 [01:44<00:22, 17.36it/s][A
Epoch 8/10:  82%|████████▏ | 1818/2208 [01:44<00:21, 18.29it/s][A
Epoch 8/10:  82%|████████▏ | 1821/2208 [01:44<00:20, 19.02it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  83%|████████▎ | 1827/2208 [01:45<00:35, 10.79it/s][A
Epoch 8/10:  83%|████████▎ | 1830/2208 [01:45<00:29, 12.71it/s][A

Batch 1825: Training loss = 0.0863, Training accuracy = 0.9558, F1 = 0.9558



Epoch 8/10:  83%|████████▎ | 1832/2208 [01:45<00:27, 13.81it/s][A
Epoch 8/10:  83%|████████▎ | 1835/2208 [01:45<00:24, 15.52it/s][A
Epoch 8/10:  83%|████████▎ | 1838/2208 [01:45<00:21, 16.88it/s][A
Epoch 8/10:  83%|████████▎ | 1841/2208 [01:46<00:20, 17.89it/s][A
Epoch 8/10:  84%|████████▎ | 1844/2208 [01:46<00:19, 18.80it/s][A
Epoch 8/10:  84%|████████▎ | 1847/2208 [01:46<00:18, 19.44it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  84%|████████▍ | 1853/2208 [01:47<00:34, 10.36it/s][A

Batch 1850: Training loss = 0.0689, Training accuracy = 0.9559, F1 = 0.9558



Epoch 8/10:  84%|████████▍ | 1856/2208 [01:47<00:28, 12.26it/s][A
Epoch 8/10:  84%|████████▍ | 1859/2208 [01:47<00:24, 13.98it/s][A
Epoch 8/10:  84%|████████▍ | 1861/2208 [01:47<00:23, 14.98it/s][A
Epoch 8/10:  84%|████████▍ | 1864/2208 [01:47<00:20, 16.52it/s][A
Epoch 8/10:  85%|████████▍ | 1867/2208 [01:47<00:19, 17.68it/s][A
Epoch 8/10:  85%|████████▍ | 1870/2208 [01:47<00:18, 18.68it/s][A
Epoch 8/10:  85%|████████▍ | 1873/2208 [01:48<00:17, 19.35it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  85%|████████▌ | 1879/2208 [01:48<00:24, 13.35it/s][A

Batch 1875: Training loss = 0.1363, Training accuracy = 0.9559, F1 = 0.9558



Epoch 8/10:  85%|████████▌ | 1882/2208 [01:48<00:21, 15.03it/s][A
Epoch 8/10:  85%|████████▌ | 1885/2208 [01:49<00:19, 16.41it/s][A
Epoch 8/10:  86%|████████▌ | 1888/2208 [01:49<00:18, 17.65it/s][A
Epoch 8/10:  86%|████████▌ | 1891/2208 [01:49<00:17, 18.49it/s][A
Epoch 8/10:  86%|████████▌ | 1894/2208 [01:49<00:16, 19.33it/s][A
Epoch 8/10:  86%|████████▌ | 1897/2208 [01:49<00:15, 19.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  86%|████████▌ | 1903/2208 [01:50<00:25, 11.76it/s][A

Batch 1900: Training loss = 0.1167, Training accuracy = 0.9559, F1 = 0.9559



Epoch 8/10:  86%|████████▋ | 1906/2208 [01:50<00:22, 13.65it/s][A
Epoch 8/10:  86%|████████▋ | 1909/2208 [01:50<00:19, 15.30it/s][A
Epoch 8/10:  87%|████████▋ | 1912/2208 [01:50<00:17, 16.68it/s][A
Epoch 8/10:  87%|████████▋ | 1915/2208 [01:50<00:16, 17.87it/s][A
Epoch 8/10:  87%|████████▋ | 1918/2208 [01:50<00:15, 18.77it/s][A
Epoch 8/10:  87%|████████▋ | 1921/2208 [01:51<00:14, 19.51it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  87%|████████▋ | 1927/2208 [01:51<00:24, 11.67it/s][A
Epoch 8/10:  87%|████████▋ | 1930/2208 [01:51<00:20, 13.57it/s][A

Batch 1925: Training loss = 0.1708, Training accuracy = 0.9560, F1 = 0.9559



Epoch 8/10:  88%|████████▊ | 1933/2208 [01:52<00:18, 15.27it/s][A
Epoch 8/10:  88%|████████▊ | 1936/2208 [01:52<00:16, 16.61it/s][A
Epoch 8/10:  88%|████████▊ | 1939/2208 [01:52<00:15, 17.73it/s][A
Epoch 8/10:  88%|████████▊ | 1942/2208 [01:52<00:14, 18.57it/s][A
Epoch 8/10:  88%|████████▊ | 1945/2208 [01:52<00:13, 19.23it/s][A
Epoch 8/10:  88%|████████▊ | 1948/2208 [01:52<00:13, 19.81it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  88%|████████▊ | 1954/2208 [01:53<00:19, 13.26it/s][A

Batch 1950: Training loss = 0.1104, Training accuracy = 0.9560, F1 = 0.9560



Epoch 8/10:  89%|████████▊ | 1957/2208 [01:53<00:16, 14.96it/s][A
Epoch 8/10:  89%|████████▉ | 1960/2208 [01:53<00:15, 16.37it/s][A
Epoch 8/10:  89%|████████▉ | 1963/2208 [01:53<00:13, 17.67it/s][A
Epoch 8/10:  89%|████████▉ | 1966/2208 [01:53<00:12, 18.66it/s][A
Epoch 8/10:  89%|████████▉ | 1969/2208 [01:54<00:12, 19.43it/s][A
Epoch 8/10:  89%|████████▉ | 1972/2208 [01:54<00:11, 19.99it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  90%|████████▉ | 1978/2208 [01:54<00:20, 11.30it/s][A

Batch 1975: Training loss = 0.2367, Training accuracy = 0.9561, F1 = 0.9560



Epoch 8/10:  90%|████████▉ | 1981/2208 [01:55<00:17, 13.19it/s][A
Epoch 8/10:  90%|████████▉ | 1984/2208 [01:55<00:15, 14.89it/s][A
Epoch 8/10:  90%|████████▉ | 1987/2208 [01:55<00:13, 16.29it/s][A
Epoch 8/10:  90%|█████████ | 1990/2208 [01:55<00:12, 17.44it/s][A
Epoch 8/10:  90%|█████████ | 1993/2208 [01:55<00:11, 18.52it/s][A
Epoch 8/10:  90%|█████████ | 1996/2208 [01:55<00:10, 19.32it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  91%|█████████ | 2002/2208 [01:56<00:18, 10.87it/s][A
Epoch 8/10:  91%|█████████ | 2005/2208 [01:56<00:15, 12.76it/s][A

Batch 2000: Training loss = 0.1575, Training accuracy = 0.9562, F1 = 0.9561



Epoch 8/10:  91%|█████████ | 2008/2208 [01:56<00:13, 14.51it/s][A
Epoch 8/10:  91%|█████████ | 2011/2208 [01:56<00:12, 16.07it/s][A
Epoch 8/10:  91%|█████████ | 2014/2208 [01:57<00:11, 17.31it/s][A
Epoch 8/10:  91%|█████████▏| 2017/2208 [01:57<00:10, 18.29it/s][A
Epoch 8/10:  91%|█████████▏| 2020/2208 [01:57<00:09, 19.11it/s][A
Epoch 8/10:  92%|█████████▏| 2023/2208 [01:57<00:09, 19.57it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  92%|█████████▏| 2029/2208 [01:58<00:14, 12.62it/s][A

Batch 2025: Training loss = 0.0548, Training accuracy = 0.9562, F1 = 0.9562



Epoch 8/10:  92%|█████████▏| 2032/2208 [01:58<00:12, 14.37it/s][A
Epoch 8/10:  92%|█████████▏| 2035/2208 [01:58<00:10, 15.94it/s][A
Epoch 8/10:  92%|█████████▏| 2038/2208 [01:58<00:09, 17.17it/s][A
Epoch 8/10:  92%|█████████▏| 2040/2208 [01:58<00:09, 17.64it/s][A
Epoch 8/10:  93%|█████████▎| 2043/2208 [01:58<00:08, 18.66it/s][A
Epoch 8/10:  93%|█████████▎| 2046/2208 [01:59<00:09, 17.78it/s][A
Epoch 8/10:  93%|█████████▎| 2049/2208 [01:59<00:08, 18.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  93%|█████████▎| 2054/2208 [01:59<00:12, 11.97it/s][A

Batch 2050: Training loss = 0.2007, Training accuracy = 0.9562, F1 = 0.9562



Epoch 8/10:  93%|█████████▎| 2057/2208 [02:00<00:10, 13.92it/s][A
Epoch 8/10:  93%|█████████▎| 2060/2208 [02:00<00:09, 15.52it/s][A
Epoch 8/10:  93%|█████████▎| 2063/2208 [02:00<00:08, 16.93it/s][A
Epoch 8/10:  94%|█████████▎| 2066/2208 [02:00<00:07, 18.05it/s][A
Epoch 8/10:  94%|█████████▎| 2069/2208 [02:00<00:07, 18.77it/s][A
Epoch 8/10:  94%|█████████▍| 2072/2208 [02:00<00:06, 19.46it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  94%|█████████▍| 2078/2208 [02:01<00:12, 10.67it/s][A

Batch 2075: Training loss = 0.1077, Training accuracy = 0.9563, F1 = 0.9563



Epoch 8/10:  94%|█████████▍| 2081/2208 [02:01<00:10, 12.58it/s][A
Epoch 8/10:  94%|█████████▍| 2084/2208 [02:01<00:08, 14.28it/s][A
Epoch 8/10:  95%|█████████▍| 2087/2208 [02:01<00:07, 15.86it/s][A
Epoch 8/10:  95%|█████████▍| 2090/2208 [02:02<00:06, 17.14it/s][A
Epoch 8/10:  95%|█████████▍| 2093/2208 [02:02<00:06, 17.23it/s][A
Epoch 8/10:  95%|█████████▍| 2096/2208 [02:02<00:06, 18.23it/s][A
Epoch 8/10:  95%|█████████▌| 2098/2208 [02:02<00:06, 17.71it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  95%|█████████▌| 2104/2208 [02:03<00:08, 12.11it/s][A

Batch 2100: Training loss = 0.1347, Training accuracy = 0.9563, F1 = 0.9563



Epoch 8/10:  95%|█████████▌| 2107/2208 [02:03<00:07, 13.98it/s][A
Epoch 8/10:  96%|█████████▌| 2110/2208 [02:03<00:06, 15.67it/s][A
Epoch 8/10:  96%|█████████▌| 2113/2208 [02:03<00:05, 16.92it/s][A
Epoch 8/10:  96%|█████████▌| 2116/2208 [02:03<00:05, 18.08it/s][A
Epoch 8/10:  96%|█████████▌| 2119/2208 [02:03<00:04, 18.95it/s][A
Epoch 8/10:  96%|█████████▌| 2122/2208 [02:04<00:04, 19.62it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  96%|█████████▋| 2128/2208 [02:04<00:07, 10.97it/s][A

Batch 2125: Training loss = 0.1009, Training accuracy = 0.9563, F1 = 0.9563



Epoch 8/10:  97%|█████████▋| 2131/2208 [02:04<00:05, 12.89it/s][A
Epoch 8/10:  97%|█████████▋| 2134/2208 [02:04<00:05, 14.68it/s][A
Epoch 8/10:  97%|█████████▋| 2137/2208 [02:05<00:04, 16.10it/s][A
Epoch 8/10:  97%|█████████▋| 2140/2208 [02:05<00:03, 17.29it/s][A
Epoch 8/10:  97%|█████████▋| 2143/2208 [02:05<00:03, 18.32it/s][A
Epoch 8/10:  97%|█████████▋| 2146/2208 [02:05<00:03, 19.10it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  97%|█████████▋| 2152/2208 [02:06<00:05, 10.73it/s][A
Epoch 8/10:  98%|█████████▊| 2155/2208 [02:06<00:04, 12.64it/s][A

Batch 2150: Training loss = 0.0609, Training accuracy = 0.9564, F1 = 0.9563



Epoch 8/10:  98%|█████████▊| 2158/2208 [02:06<00:03, 14.45it/s][A
Epoch 8/10:  98%|█████████▊| 2161/2208 [02:06<00:02, 15.95it/s][A
Epoch 8/10:  98%|█████████▊| 2164/2208 [02:06<00:02, 17.15it/s][A
Epoch 8/10:  98%|█████████▊| 2167/2208 [02:06<00:02, 18.13it/s][A
Epoch 8/10:  98%|█████████▊| 2170/2208 [02:07<00:02, 18.79it/s][A
Epoch 8/10:  98%|█████████▊| 2173/2208 [02:07<00:01, 19.52it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10:  99%|█████████▊| 2179/2208 [02:07<00:02, 12.82it/s][A

Batch 2175: Training loss = 0.1658, Training accuracy = 0.9564, F1 = 0.9564



Epoch 8/10:  99%|█████████▉| 2182/2208 [02:08<00:01, 14.55it/s][A
Epoch 8/10:  99%|█████████▉| 2185/2208 [02:08<00:01, 16.15it/s][A
Epoch 8/10:  99%|█████████▉| 2188/2208 [02:08<00:01, 17.41it/s][A
Epoch 8/10:  99%|█████████▉| 2191/2208 [02:08<00:00, 18.34it/s][A
Epoch 8/10:  99%|█████████▉| 2194/2208 [02:08<00:00, 19.15it/s][A
Epoch 8/10: 100%|█████████▉| 2197/2208 [02:08<00:00, 19.78it/s][A
  with torch.cuda.amp.autocast():

Epoch 8/10: 100%|█████████▉| 2203/2208 [02:09<00:00, 10.57it/s][A

Batch 2200: Training loss = 0.1152, Training accuracy = 0.9565, F1 = 0.9564



Epoch 8/10: 100%|█████████▉| 2206/2208 [02:09<00:00, 12.53it/s][A
                                                               [A


Epoch 8 Training Metrics:
Loss: 0.1317
Accuracy: 0.9565
F1 Score: 0.9564
Precision: 0.9564
Recall: 0.9565

Starting validation...



Validation:   0%|          | 0/552 [00:00<?, ?it/s][A
Validation:   0%|          | 1/552 [00:01<14:51,  1.62s/it][A
Validation:   1%|          | 3/552 [00:01<04:13,  2.17it/s][A
Validation:   1%|          | 5/552 [00:01<02:17,  3.97it/s][A
Validation:   1%|▏         | 7/552 [00:01<01:31,  5.94it/s][A
Validation:   2%|▏         | 9/552 [00:02<01:07,  8.00it/s][A
Validation:   2%|▏         | 11/552 [00:02<00:54,  9.99it/s][A
Validation:   2%|▏         | 13/552 [00:02<00:45, 11.85it/s][A
Validation:   3%|▎         | 15/552 [00:02<00:39, 13.44it/s][A
Validation:   3%|▎         | 17/552 [00:02<00:36, 14.81it/s][A
Validation:   3%|▎         | 19/552 [00:02<00:33, 15.84it/s][A
Validation:   4%|▍         | 21/552 [00:02<00:31, 16.71it/s][A
Validation:   4%|▍         | 23/552 [00:02<00:36, 14.68it/s][A
Validation:   5%|▍         | 25/552 [00:02<00:33, 15.74it/s][A
Validation:   5%|▍         | 27/552 [00:03<00:32, 16.35it/s][A
Validation:   5%|▌         | 29/552 [00:03<00:30, 17.


Epoch 8 Validation Metrics:
Loss: 0.1403
Accuracy: 0.9574
F1 Score: 0.9573
Precision: 0.9588
Recall: 0.9574


Training epochs:  80%|████████  | 8/10 [21:32<05:24, 162.13s/it]


Starting epoch 9/10



  with torch.cuda.amp.autocast():

  with torch.cuda.amp.autocast():

Epoch 9/10:   0%|          | 3/2208 [00:01<17:40,  2.08it/s]  [A

Batch 0: Training loss = 0.1039, Training accuracy = 0.9453, F1 = 0.9453



Epoch 9/10:   0%|          | 6/2208 [00:01<07:57,  4.61it/s][A
Epoch 9/10:   0%|          | 9/2208 [00:02<05:01,  7.30it/s][A
Epoch 9/10:   1%|          | 12/2208 [00:02<03:42,  9.87it/s][A
Epoch 9/10:   1%|          | 14/2208 [00:02<03:12, 11.39it/s][A
Epoch 9/10:   1%|          | 16/2208 [00:02<02:51, 12.76it/s][A
Epoch 9/10:   1%|          | 18/2208 [00:02<02:39, 13.73it/s][A
Epoch 9/10:   1%|          | 20/2208 [00:02<02:27, 14.79it/s][A
Epoch 9/10:   1%|          | 22/2208 [00:02<02:19, 15.66it/s][A
Epoch 9/10:   1%|          | 24/2208 [00:02<02:17, 15.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:   1%|▏         | 28/2208 [00:03<02:13, 16.32it/s][A

Batch 25: Training loss = 0.1348, Training accuracy = 0.9537, F1 = 0.9537



Epoch 9/10:   1%|▏         | 30/2208 [00:03<02:18, 15.75it/s][A
Epoch 9/10:   1%|▏         | 33/2208 [00:03<02:06, 17.18it/s][A
Epoch 9/10:   2%|▏         | 36/2208 [00:03<01:57, 18.43it/s][A
Epoch 9/10:   2%|▏         | 38/2208 [00:03<01:55, 18.74it/s][A
Epoch 9/10:   2%|▏         | 41/2208 [00:03<02:00, 17.95it/s][A
Epoch 9/10:   2%|▏         | 44/2208 [00:04<01:53, 18.99it/s][A
Epoch 9/10:   2%|▏         | 47/2208 [00:04<01:50, 19.54it/s][A
Epoch 9/10:   2%|▏         | 49/2208 [00:04<02:01, 17.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:   2%|▏         | 53/2208 [00:04<02:10, 16.46it/s][A

Batch 50: Training loss = 0.2394, Training accuracy = 0.9580, F1 = 0.9579



Epoch 9/10:   3%|▎         | 56/2208 [00:04<02:00, 17.87it/s][A
Epoch 9/10:   3%|▎         | 58/2208 [00:04<01:57, 18.36it/s][A
Epoch 9/10:   3%|▎         | 61/2208 [00:05<02:08, 16.75it/s][A
Epoch 9/10:   3%|▎         | 64/2208 [00:05<01:59, 17.90it/s][A
Epoch 9/10:   3%|▎         | 67/2208 [00:05<01:53, 18.81it/s][A
Epoch 9/10:   3%|▎         | 69/2208 [00:05<01:53, 18.89it/s][A
Epoch 9/10:   3%|▎         | 72/2208 [00:05<01:48, 19.76it/s][A
Epoch 9/10:   3%|▎         | 74/2208 [00:05<01:52, 18.89it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:   4%|▎         | 78/2208 [00:05<01:52, 18.96it/s][A

Batch 75: Training loss = 0.2012, Training accuracy = 0.9570, F1 = 0.9569



Epoch 9/10:   4%|▎         | 81/2208 [00:06<01:56, 18.20it/s][A
Epoch 9/10:   4%|▍         | 84/2208 [00:06<01:50, 19.15it/s][A
Epoch 9/10:   4%|▍         | 87/2208 [00:06<01:47, 19.77it/s][A
Epoch 9/10:   4%|▍         | 89/2208 [00:06<02:02, 17.31it/s][A
Epoch 9/10:   4%|▍         | 92/2208 [00:06<01:54, 18.45it/s][A
Epoch 9/10:   4%|▍         | 94/2208 [00:06<01:56, 18.13it/s][A
Epoch 9/10:   4%|▍         | 97/2208 [00:06<02:05, 16.89it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:   5%|▍         | 102/2208 [00:07<02:04, 16.89it/s][A
Epoch 9/10:   5%|▍         | 105/2208 [00:07<01:55, 18.16it/s][A

Batch 100: Training loss = 0.1328, Training accuracy = 0.9582, F1 = 0.9581



Epoch 9/10:   5%|▍         | 108/2208 [00:07<01:50, 19.02it/s][A
Epoch 9/10:   5%|▌         | 111/2208 [00:07<01:47, 19.53it/s][A
Epoch 9/10:   5%|▌         | 113/2208 [00:07<01:47, 19.49it/s][A
Epoch 9/10:   5%|▌         | 116/2208 [00:07<01:43, 20.19it/s][A
Epoch 9/10:   5%|▌         | 119/2208 [00:08<01:57, 17.74it/s][A
Epoch 9/10:   6%|▌         | 122/2208 [00:08<01:51, 18.72it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:   6%|▌         | 127/2208 [00:08<01:52, 18.55it/s][A
Epoch 9/10:   6%|▌         | 130/2208 [00:08<01:47, 19.37it/s][A

Batch 125: Training loss = 0.1090, Training accuracy = 0.9581, F1 = 0.9581



Epoch 9/10:   6%|▌         | 133/2208 [00:08<01:43, 19.98it/s][A
Epoch 9/10:   6%|▌         | 136/2208 [00:08<01:41, 20.42it/s][A
Epoch 9/10:   6%|▋         | 139/2208 [00:09<01:41, 20.37it/s][A
Epoch 9/10:   6%|▋         | 142/2208 [00:09<01:40, 20.46it/s][A
Epoch 9/10:   7%|▋         | 145/2208 [00:09<01:39, 20.67it/s][A
Epoch 9/10:   7%|▋         | 148/2208 [00:09<01:42, 20.19it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:   7%|▋         | 154/2208 [00:09<01:51, 18.37it/s][A

Batch 150: Training loss = 0.0721, Training accuracy = 0.9591, F1 = 0.9590



Epoch 9/10:   7%|▋         | 156/2208 [00:10<01:49, 18.71it/s][A
Epoch 9/10:   7%|▋         | 159/2208 [00:10<01:45, 19.46it/s][A
Epoch 9/10:   7%|▋         | 162/2208 [00:10<01:44, 19.56it/s][A
Epoch 9/10:   7%|▋         | 165/2208 [00:10<01:41, 20.11it/s][A
Epoch 9/10:   8%|▊         | 168/2208 [00:10<01:51, 18.30it/s][A
Epoch 9/10:   8%|▊         | 170/2208 [00:10<01:49, 18.59it/s][A
Epoch 9/10:   8%|▊         | 173/2208 [00:10<01:45, 19.35it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:   8%|▊         | 177/2208 [00:11<02:05, 16.19it/s][A
Epoch 9/10:   8%|▊         | 180/2208 [00:11<01:54, 17.76it/s][A

Batch 175: Training loss = 0.0626, Training accuracy = 0.9589, F1 = 0.9589



Epoch 9/10:   8%|▊         | 183/2208 [00:11<01:47, 18.83it/s][A
Epoch 9/10:   8%|▊         | 186/2208 [00:11<01:48, 18.72it/s][A
Epoch 9/10:   9%|▊         | 189/2208 [00:11<01:44, 19.40it/s][A
Epoch 9/10:   9%|▊         | 191/2208 [00:11<01:45, 19.14it/s][A
Epoch 9/10:   9%|▉         | 194/2208 [00:12<01:44, 19.28it/s][A
Epoch 9/10:   9%|▉         | 197/2208 [00:12<01:41, 19.89it/s][A
Epoch 9/10:   9%|▉         | 199/2208 [00:12<01:43, 19.32it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:   9%|▉         | 203/2208 [00:12<01:50, 18.22it/s][A

Batch 200: Training loss = 0.2210, Training accuracy = 0.9595, F1 = 0.9594



Epoch 9/10:   9%|▉         | 206/2208 [00:12<01:49, 18.27it/s][A
Epoch 9/10:   9%|▉         | 209/2208 [00:12<01:44, 19.18it/s][A
Epoch 9/10:  10%|▉         | 212/2208 [00:12<01:40, 19.78it/s][A
Epoch 9/10:  10%|▉         | 214/2208 [00:13<01:49, 18.14it/s][A
Epoch 9/10:  10%|▉         | 217/2208 [00:13<01:44, 19.11it/s][A
Epoch 9/10:  10%|▉         | 220/2208 [00:13<01:41, 19.51it/s][A
Epoch 9/10:  10%|█         | 223/2208 [00:13<01:39, 19.91it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  10%|█         | 229/2208 [00:13<01:45, 18.73it/s][A

Batch 225: Training loss = 0.1012, Training accuracy = 0.9595, F1 = 0.9595



Epoch 9/10:  10%|█         | 231/2208 [00:14<01:49, 18.05it/s][A
Epoch 9/10:  11%|█         | 233/2208 [00:14<01:51, 17.71it/s][A
Epoch 9/10:  11%|█         | 235/2208 [00:14<01:51, 17.71it/s][A
Epoch 9/10:  11%|█         | 238/2208 [00:14<01:50, 17.84it/s][A
Epoch 9/10:  11%|█         | 241/2208 [00:14<01:44, 18.90it/s][A
Epoch 9/10:  11%|█         | 243/2208 [00:14<01:51, 17.58it/s][A
Epoch 9/10:  11%|█         | 246/2208 [00:14<01:49, 17.86it/s][A
Epoch 9/10:  11%|█▏        | 249/2208 [00:15<01:45, 18.63it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  11%|█▏        | 253/2208 [00:15<01:55, 16.91it/s][A

Batch 250: Training loss = 0.1927, Training accuracy = 0.9594, F1 = 0.9594



Epoch 9/10:  12%|█▏        | 255/2208 [00:15<01:51, 17.57it/s][A
Epoch 9/10:  12%|█▏        | 258/2208 [00:15<01:44, 18.67it/s][A
Epoch 9/10:  12%|█▏        | 261/2208 [00:15<01:40, 19.29it/s][A
Epoch 9/10:  12%|█▏        | 263/2208 [00:15<01:40, 19.32it/s][A
Epoch 9/10:  12%|█▏        | 265/2208 [00:15<01:42, 18.99it/s][A
Epoch 9/10:  12%|█▏        | 267/2208 [00:16<01:54, 17.00it/s][A
Epoch 9/10:  12%|█▏        | 269/2208 [00:16<01:55, 16.85it/s][A
Epoch 9/10:  12%|█▏        | 271/2208 [00:16<01:49, 17.62it/s][A
Epoch 9/10:  12%|█▏        | 274/2208 [00:16<01:42, 18.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  13%|█▎        | 279/2208 [00:16<01:50, 17.42it/s][A

Batch 275: Training loss = 0.1133, Training accuracy = 0.9592, F1 = 0.9592



Epoch 9/10:  13%|█▎        | 282/2208 [00:16<01:43, 18.57it/s][A
Epoch 9/10:  13%|█▎        | 285/2208 [00:17<01:47, 17.81it/s][A
Epoch 9/10:  13%|█▎        | 288/2208 [00:17<01:42, 18.76it/s][A
Epoch 9/10:  13%|█▎        | 290/2208 [00:17<01:42, 18.64it/s][A
Epoch 9/10:  13%|█▎        | 293/2208 [00:17<01:52, 17.03it/s][A
Epoch 9/10:  13%|█▎        | 296/2208 [00:17<01:45, 18.15it/s][A
Epoch 9/10:  13%|█▎        | 298/2208 [00:17<01:55, 16.49it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  14%|█▍        | 304/2208 [00:18<01:49, 17.32it/s][A

Batch 300: Training loss = 0.0875, Training accuracy = 0.9593, F1 = 0.9593



Epoch 9/10:  14%|█▍        | 306/2208 [00:18<01:47, 17.63it/s][A
Epoch 9/10:  14%|█▍        | 308/2208 [00:18<01:45, 18.09it/s][A
Epoch 9/10:  14%|█▍        | 310/2208 [00:18<01:42, 18.46it/s][A
Epoch 9/10:  14%|█▍        | 313/2208 [00:18<01:51, 17.06it/s][A
Epoch 9/10:  14%|█▍        | 316/2208 [00:18<01:43, 18.23it/s][A
Epoch 9/10:  14%|█▍        | 319/2208 [00:18<01:38, 19.09it/s][A
Epoch 9/10:  15%|█▍        | 322/2208 [00:19<01:35, 19.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  15%|█▍        | 328/2208 [00:19<01:50, 17.08it/s][A

Batch 325: Training loss = 0.1740, Training accuracy = 0.9593, F1 = 0.9593



Epoch 9/10:  15%|█▍        | 331/2208 [00:19<01:43, 18.22it/s][A
Epoch 9/10:  15%|█▌        | 334/2208 [00:19<01:38, 19.04it/s][A
Epoch 9/10:  15%|█▌        | 337/2208 [00:19<01:40, 18.66it/s][A
Epoch 9/10:  15%|█▌        | 340/2208 [00:20<01:36, 19.41it/s][A
Epoch 9/10:  15%|█▌        | 342/2208 [00:20<01:41, 18.43it/s][A
Epoch 9/10:  16%|█▌        | 344/2208 [00:20<01:39, 18.75it/s][A
Epoch 9/10:  16%|█▌        | 347/2208 [00:20<01:35, 19.51it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  16%|█▌        | 353/2208 [00:20<01:47, 17.24it/s][A

Batch 350: Training loss = 0.0747, Training accuracy = 0.9593, F1 = 0.9593



Epoch 9/10:  16%|█▌        | 356/2208 [00:20<01:41, 18.33it/s][A
Epoch 9/10:  16%|█▋        | 359/2208 [00:21<01:36, 19.22it/s][A
Epoch 9/10:  16%|█▋        | 362/2208 [00:21<01:33, 19.68it/s][A
Epoch 9/10:  17%|█▋        | 365/2208 [00:21<01:31, 20.04it/s][A
Epoch 9/10:  17%|█▋        | 368/2208 [00:21<01:30, 20.42it/s][A
Epoch 9/10:  17%|█▋        | 371/2208 [00:21<01:28, 20.66it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  17%|█▋        | 377/2208 [00:21<01:41, 18.11it/s][A
Epoch 9/10:  17%|█▋        | 379/2208 [00:22<01:42, 17.87it/s][A

Batch 375: Training loss = 0.2076, Training accuracy = 0.9590, F1 = 0.9589



Epoch 9/10:  17%|█▋        | 382/2208 [00:22<01:36, 18.86it/s][A
Epoch 9/10:  17%|█▋        | 385/2208 [00:22<01:33, 19.53it/s][A
Epoch 9/10:  18%|█▊        | 388/2208 [00:22<01:30, 20.16it/s][A
Epoch 9/10:  18%|█▊        | 391/2208 [00:22<01:29, 20.35it/s][A
Epoch 9/10:  18%|█▊        | 394/2208 [00:22<01:33, 19.49it/s][A
Epoch 9/10:  18%|█▊        | 397/2208 [00:22<01:30, 19.96it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  18%|█▊        | 403/2208 [00:23<01:45, 17.14it/s][A

Batch 400: Training loss = 0.1541, Training accuracy = 0.9590, F1 = 0.9590



Epoch 9/10:  18%|█▊        | 406/2208 [00:23<01:39, 18.16it/s][A
Epoch 9/10:  18%|█▊        | 408/2208 [00:23<01:37, 18.52it/s][A
Epoch 9/10:  19%|█▊        | 411/2208 [00:23<01:32, 19.33it/s][A
Epoch 9/10:  19%|█▊        | 413/2208 [00:23<01:33, 19.18it/s][A
Epoch 9/10:  19%|█▉        | 416/2208 [00:23<01:30, 19.73it/s][A
Epoch 9/10:  19%|█▉        | 419/2208 [00:24<01:28, 20.30it/s][A
Epoch 9/10:  19%|█▉        | 422/2208 [00:24<01:27, 20.36it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  19%|█▉        | 427/2208 [00:24<01:52, 15.89it/s][A
Epoch 9/10:  19%|█▉        | 430/2208 [00:24<01:42, 17.33it/s][A

Batch 425: Training loss = 0.1280, Training accuracy = 0.9590, F1 = 0.9589



Epoch 9/10:  20%|█▉        | 433/2208 [00:24<01:36, 18.45it/s][A
Epoch 9/10:  20%|█▉        | 436/2208 [00:25<01:31, 19.31it/s][A
Epoch 9/10:  20%|█▉        | 439/2208 [00:25<01:29, 19.84it/s][A
Epoch 9/10:  20%|██        | 442/2208 [00:25<01:27, 20.20it/s][A
Epoch 9/10:  20%|██        | 445/2208 [00:25<01:26, 20.43it/s][A
Epoch 9/10:  20%|██        | 448/2208 [00:25<01:25, 20.52it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  21%|██        | 454/2208 [00:26<01:38, 17.77it/s][A

Batch 450: Training loss = 0.2486, Training accuracy = 0.9585, F1 = 0.9584



Epoch 9/10:  21%|██        | 457/2208 [00:26<01:33, 18.71it/s][A
Epoch 9/10:  21%|██        | 459/2208 [00:26<01:32, 18.83it/s][A
Epoch 9/10:  21%|██        | 462/2208 [00:26<01:29, 19.60it/s][A
Epoch 9/10:  21%|██        | 465/2208 [00:26<01:26, 20.14it/s][A
Epoch 9/10:  21%|██        | 468/2208 [00:26<01:25, 20.25it/s][A
Epoch 9/10:  21%|██▏       | 471/2208 [00:26<01:24, 20.45it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  22%|██▏       | 477/2208 [00:27<01:38, 17.59it/s][A
Epoch 9/10:  22%|██▏       | 480/2208 [00:27<01:33, 18.57it/s][A

Batch 475: Training loss = 0.0934, Training accuracy = 0.9582, F1 = 0.9581



Epoch 9/10:  22%|██▏       | 483/2208 [00:27<01:29, 19.33it/s][A
Epoch 9/10:  22%|██▏       | 486/2208 [00:27<01:26, 19.86it/s][A
Epoch 9/10:  22%|██▏       | 489/2208 [00:27<01:24, 20.25it/s][A
Epoch 9/10:  22%|██▏       | 492/2208 [00:27<01:23, 20.61it/s][A
Epoch 9/10:  22%|██▏       | 495/2208 [00:28<01:22, 20.86it/s][A
Epoch 9/10:  23%|██▎       | 498/2208 [00:28<01:21, 20.93it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  23%|██▎       | 504/2208 [00:28<01:32, 18.39it/s][A

Batch 500: Training loss = 0.1659, Training accuracy = 0.9583, F1 = 0.9583



Epoch 9/10:  23%|██▎       | 507/2208 [00:28<01:28, 19.18it/s][A
Epoch 9/10:  23%|██▎       | 510/2208 [00:28<01:26, 19.64it/s][A
Epoch 9/10:  23%|██▎       | 513/2208 [00:29<01:24, 20.02it/s][A
Epoch 9/10:  23%|██▎       | 516/2208 [00:29<01:28, 19.07it/s][A
Epoch 9/10:  23%|██▎       | 518/2208 [00:29<01:31, 18.51it/s][A
Epoch 9/10:  24%|██▎       | 521/2208 [00:29<01:27, 19.31it/s][A
Epoch 9/10:  24%|██▎       | 523/2208 [00:29<01:39, 17.00it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  24%|██▍       | 529/2208 [00:30<01:43, 16.25it/s][A

Batch 525: Training loss = 0.1214, Training accuracy = 0.9585, F1 = 0.9584



Epoch 9/10:  24%|██▍       | 532/2208 [00:30<01:35, 17.52it/s][A
Epoch 9/10:  24%|██▍       | 535/2208 [00:30<01:30, 18.52it/s][A
Epoch 9/10:  24%|██▍       | 538/2208 [00:30<01:26, 19.23it/s][A
Epoch 9/10:  25%|██▍       | 541/2208 [00:30<01:34, 17.66it/s][A
Epoch 9/10:  25%|██▍       | 544/2208 [00:30<01:30, 18.49it/s][A
Epoch 9/10:  25%|██▍       | 546/2208 [00:30<01:33, 17.72it/s][A
Epoch 9/10:  25%|██▍       | 549/2208 [00:31<01:32, 18.03it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  25%|██▌       | 554/2208 [00:31<01:45, 15.72it/s][A

Batch 550: Training loss = 0.2106, Training accuracy = 0.9585, F1 = 0.9585



Epoch 9/10:  25%|██▌       | 557/2208 [00:31<01:35, 17.27it/s][A
Epoch 9/10:  25%|██▌       | 560/2208 [00:31<01:30, 18.30it/s][A
Epoch 9/10:  25%|██▌       | 563/2208 [00:31<01:26, 19.09it/s][A
Epoch 9/10:  26%|██▌       | 566/2208 [00:32<01:23, 19.59it/s][A
Epoch 9/10:  26%|██▌       | 569/2208 [00:32<01:26, 18.96it/s][A
Epoch 9/10:  26%|██▌       | 571/2208 [00:32<01:29, 18.37it/s][A
Epoch 9/10:  26%|██▌       | 573/2208 [00:32<01:28, 18.38it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  26%|██▌       | 577/2208 [00:32<02:07, 12.76it/s][A
Epoch 9/10:  26%|██▋       | 580/2208 [00:32<01:48, 14.96it/s][A

Batch 575: Training loss = 0.0888, Training accuracy = 0.9587, F1 = 0.9586



Epoch 9/10:  26%|██▋       | 583/2208 [00:33<01:38, 16.54it/s][A
Epoch 9/10:  26%|██▋       | 585/2208 [00:33<01:34, 17.18it/s][A
Epoch 9/10:  27%|██▋       | 588/2208 [00:33<01:28, 18.35it/s][A
Epoch 9/10:  27%|██▋       | 591/2208 [00:33<01:24, 19.16it/s][A
Epoch 9/10:  27%|██▋       | 594/2208 [00:33<01:21, 19.78it/s][A
Epoch 9/10:  27%|██▋       | 597/2208 [00:33<01:19, 20.22it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  27%|██▋       | 603/2208 [00:34<01:42, 15.72it/s][A

Batch 600: Training loss = 0.1667, Training accuracy = 0.9587, F1 = 0.9587



Epoch 9/10:  27%|██▋       | 606/2208 [00:34<01:33, 17.07it/s][A
Epoch 9/10:  28%|██▊       | 609/2208 [00:34<01:28, 18.05it/s][A
Epoch 9/10:  28%|██▊       | 612/2208 [00:34<01:24, 18.79it/s][A
Epoch 9/10:  28%|██▊       | 615/2208 [00:34<01:22, 19.41it/s][A
Epoch 9/10:  28%|██▊       | 618/2208 [00:34<01:19, 19.88it/s][A
Epoch 9/10:  28%|██▊       | 621/2208 [00:35<01:18, 20.21it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  28%|██▊       | 627/2208 [00:35<01:33, 16.96it/s][A
Epoch 9/10:  29%|██▊       | 630/2208 [00:35<01:27, 18.07it/s][A

Batch 625: Training loss = 0.1496, Training accuracy = 0.9586, F1 = 0.9585



Epoch 9/10:  29%|██▊       | 633/2208 [00:35<01:23, 18.96it/s][A
Epoch 9/10:  29%|██▉       | 636/2208 [00:35<01:20, 19.60it/s][A
Epoch 9/10:  29%|██▉       | 639/2208 [00:36<01:17, 20.15it/s][A
Epoch 9/10:  29%|██▉       | 642/2208 [00:36<01:16, 20.41it/s][A
Epoch 9/10:  29%|██▉       | 645/2208 [00:36<01:16, 20.49it/s][A
Epoch 9/10:  29%|██▉       | 648/2208 [00:36<01:15, 20.57it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  30%|██▉       | 654/2208 [00:36<01:27, 17.69it/s][A

Batch 650: Training loss = 0.0695, Training accuracy = 0.9587, F1 = 0.9587



Epoch 9/10:  30%|██▉       | 657/2208 [00:37<01:23, 18.60it/s][A
Epoch 9/10:  30%|██▉       | 660/2208 [00:37<01:20, 19.34it/s][A
Epoch 9/10:  30%|███       | 663/2208 [00:37<01:18, 19.80it/s][A
Epoch 9/10:  30%|███       | 666/2208 [00:37<01:16, 20.13it/s][A
Epoch 9/10:  30%|███       | 669/2208 [00:37<01:15, 20.48it/s][A
Epoch 9/10:  30%|███       | 672/2208 [00:37<01:14, 20.71it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  31%|███       | 678/2208 [00:38<01:35, 15.98it/s][A

Batch 675: Training loss = 0.1013, Training accuracy = 0.9590, F1 = 0.9590



Epoch 9/10:  31%|███       | 681/2208 [00:38<01:28, 17.27it/s][A
Epoch 9/10:  31%|███       | 684/2208 [00:38<01:23, 18.29it/s][A
Epoch 9/10:  31%|███       | 687/2208 [00:38<01:20, 18.99it/s][A
Epoch 9/10:  31%|███▏      | 690/2208 [00:38<01:17, 19.57it/s][A
Epoch 9/10:  31%|███▏      | 693/2208 [00:38<01:15, 20.12it/s][A
Epoch 9/10:  32%|███▏      | 696/2208 [00:39<01:13, 20.46it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  32%|███▏      | 702/2208 [00:39<01:32, 16.26it/s][A
Epoch 9/10:  32%|███▏      | 705/2208 [00:39<01:26, 17.45it/s][A

Batch 700: Training loss = 0.1037, Training accuracy = 0.9589, F1 = 0.9589



Epoch 9/10:  32%|███▏      | 708/2208 [00:39<01:21, 18.32it/s][A
Epoch 9/10:  32%|███▏      | 711/2208 [00:39<01:18, 19.14it/s][A
Epoch 9/10:  32%|███▏      | 714/2208 [00:39<01:15, 19.70it/s][A
Epoch 9/10:  32%|███▏      | 717/2208 [00:40<01:13, 20.24it/s][A
Epoch 9/10:  33%|███▎      | 720/2208 [00:40<01:12, 20.45it/s][A
Epoch 9/10:  33%|███▎      | 723/2208 [00:40<01:11, 20.69it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  33%|███▎      | 729/2208 [00:40<01:24, 17.47it/s][A

Batch 725: Training loss = 0.0855, Training accuracy = 0.9589, F1 = 0.9589



Epoch 9/10:  33%|███▎      | 732/2208 [00:40<01:19, 18.48it/s][A
Epoch 9/10:  33%|███▎      | 735/2208 [00:41<01:16, 19.19it/s][A
Epoch 9/10:  33%|███▎      | 738/2208 [00:41<01:14, 19.73it/s][A
Epoch 9/10:  34%|███▎      | 741/2208 [00:41<01:13, 20.09it/s][A
Epoch 9/10:  34%|███▎      | 744/2208 [00:41<01:11, 20.51it/s][A
Epoch 9/10:  34%|███▍      | 747/2208 [00:41<01:10, 20.66it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  34%|███▍      | 753/2208 [00:42<01:31, 15.98it/s][A

Batch 750: Training loss = 0.2297, Training accuracy = 0.9589, F1 = 0.9589



Epoch 9/10:  34%|███▍      | 756/2208 [00:42<01:23, 17.30it/s][A
Epoch 9/10:  34%|███▍      | 759/2208 [00:42<01:19, 18.29it/s][A
Epoch 9/10:  35%|███▍      | 762/2208 [00:42<01:16, 18.99it/s][A
Epoch 9/10:  35%|███▍      | 764/2208 [00:42<01:15, 19.14it/s][A
Epoch 9/10:  35%|███▍      | 767/2208 [00:42<01:12, 19.90it/s][A
Epoch 9/10:  35%|███▍      | 770/2208 [00:42<01:10, 20.38it/s][A
Epoch 9/10:  35%|███▌      | 773/2208 [00:43<01:10, 20.33it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  35%|███▌      | 779/2208 [00:43<01:31, 15.68it/s][A

Batch 775: Training loss = 0.0939, Training accuracy = 0.9589, F1 = 0.9589



Epoch 9/10:  35%|███▌      | 782/2208 [00:43<01:23, 17.08it/s][A
Epoch 9/10:  36%|███▌      | 785/2208 [00:43<01:18, 18.18it/s][A
Epoch 9/10:  36%|███▌      | 788/2208 [00:43<01:14, 19.01it/s][A
Epoch 9/10:  36%|███▌      | 791/2208 [00:44<01:21, 17.28it/s][A
Epoch 9/10:  36%|███▌      | 793/2208 [00:44<01:19, 17.80it/s][A
Epoch 9/10:  36%|███▌      | 795/2208 [00:44<01:24, 16.68it/s][A
Epoch 9/10:  36%|███▌      | 798/2208 [00:44<01:25, 16.53it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  36%|███▋      | 804/2208 [00:45<01:38, 14.29it/s][A

Batch 800: Training loss = 0.1057, Training accuracy = 0.9587, F1 = 0.9587



Epoch 9/10:  37%|███▋      | 807/2208 [00:45<01:28, 15.90it/s][A
Epoch 9/10:  37%|███▋      | 810/2208 [00:45<01:21, 17.14it/s][A
Epoch 9/10:  37%|███▋      | 813/2208 [00:45<01:16, 18.20it/s][A
Epoch 9/10:  37%|███▋      | 816/2208 [00:45<01:13, 18.95it/s][A
Epoch 9/10:  37%|███▋      | 818/2208 [00:45<01:24, 16.37it/s][A
Epoch 9/10:  37%|███▋      | 821/2208 [00:46<01:18, 17.72it/s][A
Epoch 9/10:  37%|███▋      | 824/2208 [00:46<01:14, 18.60it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  38%|███▊      | 829/2208 [00:46<01:37, 14.09it/s][A

Batch 825: Training loss = 0.0520, Training accuracy = 0.9588, F1 = 0.9587



Epoch 9/10:  38%|███▊      | 832/2208 [00:46<01:27, 15.79it/s][A
Epoch 9/10:  38%|███▊      | 835/2208 [00:46<01:19, 17.19it/s][A
Epoch 9/10:  38%|███▊      | 838/2208 [00:47<01:14, 18.29it/s][A
Epoch 9/10:  38%|███▊      | 841/2208 [00:47<01:11, 19.00it/s][A
Epoch 9/10:  38%|███▊      | 844/2208 [00:47<01:18, 17.46it/s][A
Epoch 9/10:  38%|███▊      | 847/2208 [00:47<01:13, 18.49it/s][A
Epoch 9/10:  38%|███▊      | 849/2208 [00:47<01:14, 18.28it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  39%|███▊      | 854/2208 [00:48<01:28, 15.33it/s][A

Batch 850: Training loss = 0.2679, Training accuracy = 0.9587, F1 = 0.9587



Epoch 9/10:  39%|███▉      | 857/2208 [00:48<01:20, 16.81it/s][A
Epoch 9/10:  39%|███▉      | 860/2208 [00:48<01:15, 17.92it/s][A
Epoch 9/10:  39%|███▉      | 863/2208 [00:48<01:11, 18.85it/s][A
Epoch 9/10:  39%|███▉      | 866/2208 [00:48<01:08, 19.59it/s][A
Epoch 9/10:  39%|███▉      | 869/2208 [00:48<01:06, 20.10it/s][A
Epoch 9/10:  39%|███▉      | 872/2208 [00:48<01:05, 20.33it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  40%|███▉      | 878/2208 [00:49<01:27, 15.22it/s][A

Batch 875: Training loss = 0.1428, Training accuracy = 0.9587, F1 = 0.9587



Epoch 9/10:  40%|███▉      | 881/2208 [00:49<01:19, 16.72it/s][A
Epoch 9/10:  40%|████      | 884/2208 [00:49<01:14, 17.81it/s][A
Epoch 9/10:  40%|████      | 887/2208 [00:49<01:10, 18.70it/s][A
Epoch 9/10:  40%|████      | 890/2208 [00:49<01:08, 19.34it/s][A
Epoch 9/10:  40%|████      | 893/2208 [00:50<01:05, 19.96it/s][A
Epoch 9/10:  41%|████      | 896/2208 [00:50<01:04, 20.31it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  41%|████      | 902/2208 [00:50<01:30, 14.35it/s][A
Epoch 9/10:  41%|████      | 905/2208 [00:50<01:21, 15.98it/s][A

Batch 900: Training loss = 0.0969, Training accuracy = 0.9587, F1 = 0.9587



Epoch 9/10:  41%|████      | 908/2208 [00:51<01:15, 17.26it/s][A
Epoch 9/10:  41%|████▏     | 911/2208 [00:51<01:10, 18.29it/s][A
Epoch 9/10:  41%|████▏     | 914/2208 [00:51<01:08, 19.00it/s][A
Epoch 9/10:  42%|████▏     | 917/2208 [00:51<01:05, 19.59it/s][A
Epoch 9/10:  42%|████▏     | 920/2208 [00:51<01:03, 20.14it/s][A
Epoch 9/10:  42%|████▏     | 923/2208 [00:51<01:02, 20.50it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  42%|████▏     | 929/2208 [00:52<01:21, 15.75it/s][A

Batch 925: Training loss = 0.0890, Training accuracy = 0.9587, F1 = 0.9587



Epoch 9/10:  42%|████▏     | 932/2208 [00:52<01:14, 17.10it/s][A
Epoch 9/10:  42%|████▏     | 935/2208 [00:52<01:09, 18.22it/s][A
Epoch 9/10:  42%|████▏     | 938/2208 [00:52<01:06, 19.02it/s][A
Epoch 9/10:  43%|████▎     | 941/2208 [00:52<01:04, 19.62it/s][A
Epoch 9/10:  43%|████▎     | 944/2208 [00:52<01:03, 19.96it/s][A
Epoch 9/10:  43%|████▎     | 947/2208 [00:53<01:01, 20.34it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  43%|████▎     | 953/2208 [00:53<01:25, 14.71it/s][A

Batch 950: Training loss = 0.0619, Training accuracy = 0.9589, F1 = 0.9588



Epoch 9/10:  43%|████▎     | 956/2208 [00:53<01:17, 16.10it/s][A
Epoch 9/10:  43%|████▎     | 959/2208 [00:53<01:11, 17.43it/s][A
Epoch 9/10:  44%|████▎     | 962/2208 [00:54<01:07, 18.46it/s][A
Epoch 9/10:  44%|████▎     | 965/2208 [00:54<01:04, 19.17it/s][A
Epoch 9/10:  44%|████▍     | 968/2208 [00:54<01:02, 19.78it/s][A
Epoch 9/10:  44%|████▍     | 971/2208 [00:54<01:00, 20.29it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  44%|████▍     | 977/2208 [00:54<01:24, 14.59it/s][A
Epoch 9/10:  44%|████▍     | 980/2208 [00:55<01:16, 16.13it/s][A

Batch 975: Training loss = 0.1051, Training accuracy = 0.9588, F1 = 0.9588



Epoch 9/10:  45%|████▍     | 983/2208 [00:55<01:10, 17.49it/s][A
Epoch 9/10:  45%|████▍     | 986/2208 [00:55<01:06, 18.43it/s][A
Epoch 9/10:  45%|████▍     | 989/2208 [00:55<01:03, 19.20it/s][A
Epoch 9/10:  45%|████▍     | 992/2208 [00:55<01:01, 19.74it/s][A
Epoch 9/10:  45%|████▌     | 995/2208 [00:55<01:00, 20.21it/s][A
Epoch 9/10:  45%|████▌     | 998/2208 [00:55<00:59, 20.41it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  45%|████▌     | 1004/2208 [00:56<01:15, 15.97it/s][A

Batch 1000: Training loss = 0.1047, Training accuracy = 0.9588, F1 = 0.9587



Epoch 9/10:  46%|████▌     | 1007/2208 [00:56<01:09, 17.34it/s][A
Epoch 9/10:  46%|████▌     | 1010/2208 [00:56<01:05, 18.41it/s][A
Epoch 9/10:  46%|████▌     | 1013/2208 [00:56<01:02, 19.12it/s][A
Epoch 9/10:  46%|████▌     | 1016/2208 [00:56<01:00, 19.81it/s][A
Epoch 9/10:  46%|████▌     | 1019/2208 [00:57<00:58, 20.16it/s][A
Epoch 9/10:  46%|████▋     | 1022/2208 [00:57<01:03, 18.75it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  47%|████▋     | 1027/2208 [00:57<01:28, 13.39it/s][A
Epoch 9/10:  47%|████▋     | 1030/2208 [00:57<01:17, 15.26it/s][A

Batch 1025: Training loss = 0.1632, Training accuracy = 0.9589, F1 = 0.9588



Epoch 9/10:  47%|████▋     | 1033/2208 [00:58<01:10, 16.74it/s][A
Epoch 9/10:  47%|████▋     | 1036/2208 [00:58<01:05, 17.82it/s][A
Epoch 9/10:  47%|████▋     | 1039/2208 [00:58<01:02, 18.58it/s][A
Epoch 9/10:  47%|████▋     | 1042/2208 [00:58<01:00, 19.34it/s][A
Epoch 9/10:  47%|████▋     | 1045/2208 [00:58<00:58, 19.93it/s][A
Epoch 9/10:  47%|████▋     | 1048/2208 [00:58<01:06, 17.49it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  48%|████▊     | 1054/2208 [00:59<01:18, 14.68it/s][A

Batch 1050: Training loss = 0.0340, Training accuracy = 0.9590, F1 = 0.9589



Epoch 9/10:  48%|████▊     | 1057/2208 [00:59<01:11, 16.13it/s][A
Epoch 9/10:  48%|████▊     | 1060/2208 [00:59<01:06, 17.37it/s][A
Epoch 9/10:  48%|████▊     | 1063/2208 [00:59<01:02, 18.25it/s][A
Epoch 9/10:  48%|████▊     | 1065/2208 [00:59<01:05, 17.53it/s][A
Epoch 9/10:  48%|████▊     | 1068/2208 [01:00<01:04, 17.63it/s][A
Epoch 9/10:  48%|████▊     | 1070/2208 [01:00<01:04, 17.65it/s][A
Epoch 9/10:  49%|████▊     | 1072/2208 [01:00<01:03, 17.84it/s][A
Epoch 9/10:  49%|████▊     | 1074/2208 [01:00<01:04, 17.48it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  49%|████▉     | 1079/2208 [01:00<01:30, 12.44it/s][A

Batch 1075: Training loss = 0.0748, Training accuracy = 0.9591, F1 = 0.9591



Epoch 9/10:  49%|████▉     | 1082/2208 [01:01<01:17, 14.47it/s][A
Epoch 9/10:  49%|████▉     | 1084/2208 [01:01<01:12, 15.47it/s][A
Epoch 9/10:  49%|████▉     | 1087/2208 [01:01<01:05, 17.00it/s][A
Epoch 9/10:  49%|████▉     | 1090/2208 [01:01<01:01, 18.06it/s][A
Epoch 9/10:  50%|████▉     | 1093/2208 [01:01<00:59, 18.79it/s][A
Epoch 9/10:  50%|████▉     | 1096/2208 [01:01<00:57, 19.48it/s][A
Epoch 9/10:  50%|████▉     | 1099/2208 [01:02<01:03, 17.50it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  50%|█████     | 1104/2208 [01:02<01:18, 14.13it/s][A

Batch 1100: Training loss = 0.1642, Training accuracy = 0.9591, F1 = 0.9591



Epoch 9/10:  50%|█████     | 1107/2208 [01:02<01:09, 15.82it/s][A
Epoch 9/10:  50%|█████     | 1110/2208 [01:02<01:03, 17.19it/s][A
Epoch 9/10:  50%|█████     | 1113/2208 [01:02<00:59, 18.29it/s][A
Epoch 9/10:  51%|█████     | 1116/2208 [01:03<00:57, 19.06it/s][A
Epoch 9/10:  51%|█████     | 1119/2208 [01:03<00:55, 19.70it/s][A
Epoch 9/10:  51%|█████     | 1122/2208 [01:03<00:54, 20.01it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  51%|█████     | 1128/2208 [01:03<01:21, 13.18it/s][A

Batch 1125: Training loss = 0.1346, Training accuracy = 0.9592, F1 = 0.9592



Epoch 9/10:  51%|█████     | 1131/2208 [01:04<01:12, 14.96it/s][A
Epoch 9/10:  51%|█████▏    | 1134/2208 [01:04<01:05, 16.45it/s][A
Epoch 9/10:  51%|█████▏    | 1137/2208 [01:04<01:00, 17.56it/s][A
Epoch 9/10:  52%|█████▏    | 1140/2208 [01:04<00:57, 18.48it/s][A
Epoch 9/10:  52%|█████▏    | 1143/2208 [01:04<00:55, 19.30it/s][A
Epoch 9/10:  52%|█████▏    | 1146/2208 [01:04<00:53, 19.87it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  52%|█████▏    | 1152/2208 [01:05<01:16, 13.75it/s][A
Epoch 9/10:  52%|█████▏    | 1155/2208 [01:05<01:08, 15.43it/s][A

Batch 1150: Training loss = 0.1219, Training accuracy = 0.9593, F1 = 0.9593



Epoch 9/10:  52%|█████▏    | 1158/2208 [01:05<01:02, 16.78it/s][A
Epoch 9/10:  53%|█████▎    | 1161/2208 [01:05<00:58, 18.04it/s][A
Epoch 9/10:  53%|█████▎    | 1164/2208 [01:05<00:55, 18.97it/s][A
Epoch 9/10:  53%|█████▎    | 1167/2208 [01:05<00:52, 19.69it/s][A
Epoch 9/10:  53%|█████▎    | 1170/2208 [01:06<00:52, 19.87it/s][A
Epoch 9/10:  53%|█████▎    | 1173/2208 [01:06<00:54, 19.11it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  53%|█████▎    | 1177/2208 [01:06<01:20, 12.77it/s][A
Epoch 9/10:  53%|█████▎    | 1180/2208 [01:06<01:09, 14.88it/s][A

Batch 1175: Training loss = 0.1166, Training accuracy = 0.9594, F1 = 0.9593



Epoch 9/10:  54%|█████▎    | 1183/2208 [01:06<01:02, 16.37it/s][A
Epoch 9/10:  54%|█████▎    | 1186/2208 [01:07<00:57, 17.68it/s][A
Epoch 9/10:  54%|█████▍    | 1188/2208 [01:07<00:56, 18.15it/s][A
Epoch 9/10:  54%|█████▍    | 1191/2208 [01:07<00:53, 19.02it/s][A
Epoch 9/10:  54%|█████▍    | 1194/2208 [01:07<00:51, 19.57it/s][A
Epoch 9/10:  54%|█████▍    | 1197/2208 [01:07<00:50, 20.12it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  54%|█████▍    | 1203/2208 [01:08<01:13, 13.68it/s][A

Batch 1200: Training loss = 0.0918, Training accuracy = 0.9593, F1 = 0.9593



Epoch 9/10:  55%|█████▍    | 1206/2208 [01:08<01:05, 15.40it/s][A
Epoch 9/10:  55%|█████▍    | 1209/2208 [01:08<00:59, 16.80it/s][A
Epoch 9/10:  55%|█████▍    | 1212/2208 [01:08<00:55, 17.92it/s][A
Epoch 9/10:  55%|█████▌    | 1215/2208 [01:08<00:53, 18.68it/s][A
Epoch 9/10:  55%|█████▌    | 1218/2208 [01:08<00:51, 19.38it/s][A
Epoch 9/10:  55%|█████▌    | 1221/2208 [01:09<00:49, 19.78it/s][A
Epoch 9/10:  55%|█████▌    | 1224/2208 [01:09<00:51, 19.24it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  56%|█████▌    | 1229/2208 [01:09<01:07, 14.45it/s][A

Batch 1225: Training loss = 0.1888, Training accuracy = 0.9592, F1 = 0.9592



Epoch 9/10:  56%|█████▌    | 1232/2208 [01:09<01:00, 16.15it/s][A
Epoch 9/10:  56%|█████▌    | 1235/2208 [01:09<00:55, 17.39it/s][A
Epoch 9/10:  56%|█████▌    | 1238/2208 [01:10<00:52, 18.37it/s][A
Epoch 9/10:  56%|█████▌    | 1241/2208 [01:10<00:50, 19.13it/s][A
Epoch 9/10:  56%|█████▋    | 1244/2208 [01:10<00:48, 19.80it/s][A
Epoch 9/10:  56%|█████▋    | 1247/2208 [01:10<00:47, 20.29it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  57%|█████▋    | 1253/2208 [01:11<01:09, 13.76it/s][A

Batch 1250: Training loss = 0.1684, Training accuracy = 0.9592, F1 = 0.9592



Epoch 9/10:  57%|█████▋    | 1256/2208 [01:11<01:01, 15.49it/s][A
Epoch 9/10:  57%|█████▋    | 1259/2208 [01:11<00:56, 16.85it/s][A
Epoch 9/10:  57%|█████▋    | 1262/2208 [01:11<00:52, 17.89it/s][A
Epoch 9/10:  57%|█████▋    | 1265/2208 [01:11<00:50, 18.80it/s][A
Epoch 9/10:  57%|█████▋    | 1268/2208 [01:11<00:50, 18.74it/s][A
Epoch 9/10:  58%|█████▊    | 1271/2208 [01:11<00:48, 19.31it/s][A
Epoch 9/10:  58%|█████▊    | 1274/2208 [01:12<00:48, 19.42it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  58%|█████▊    | 1279/2208 [01:12<01:08, 13.56it/s][A

Batch 1275: Training loss = 0.2309, Training accuracy = 0.9594, F1 = 0.9593



Epoch 9/10:  58%|█████▊    | 1282/2208 [01:12<01:00, 15.30it/s][A
Epoch 9/10:  58%|█████▊    | 1285/2208 [01:12<00:55, 16.72it/s][A
Epoch 9/10:  58%|█████▊    | 1288/2208 [01:13<00:51, 17.91it/s][A
Epoch 9/10:  58%|█████▊    | 1291/2208 [01:13<00:48, 18.75it/s][A
Epoch 9/10:  59%|█████▊    | 1294/2208 [01:13<00:48, 18.89it/s][A
Epoch 9/10:  59%|█████▊    | 1296/2208 [01:13<00:53, 17.18it/s][A
Epoch 9/10:  59%|█████▉    | 1299/2208 [01:13<00:50, 18.14it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  59%|█████▉    | 1304/2208 [01:14<01:06, 13.63it/s][A

Batch 1300: Training loss = 0.1062, Training accuracy = 0.9593, F1 = 0.9593



Epoch 9/10:  59%|█████▉    | 1307/2208 [01:14<00:58, 15.40it/s][A
Epoch 9/10:  59%|█████▉    | 1310/2208 [01:14<00:53, 16.88it/s][A
Epoch 9/10:  59%|█████▉    | 1313/2208 [01:14<00:49, 18.01it/s][A
Epoch 9/10:  60%|█████▉    | 1315/2208 [01:14<00:49, 17.99it/s][A
Epoch 9/10:  60%|█████▉    | 1318/2208 [01:14<00:46, 18.99it/s][A
Epoch 9/10:  60%|█████▉    | 1320/2208 [01:15<00:53, 16.52it/s][A
Epoch 9/10:  60%|█████▉    | 1323/2208 [01:15<00:56, 15.62it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  60%|██████    | 1329/2208 [01:15<01:10, 12.54it/s][A

Batch 1325: Training loss = 0.2370, Training accuracy = 0.9594, F1 = 0.9593



Epoch 9/10:  60%|██████    | 1332/2208 [01:15<01:00, 14.38it/s][A
Epoch 9/10:  60%|██████    | 1335/2208 [01:16<00:54, 15.91it/s][A
Epoch 9/10:  61%|██████    | 1338/2208 [01:16<00:50, 17.09it/s][A
Epoch 9/10:  61%|██████    | 1341/2208 [01:16<00:47, 18.21it/s][A
Epoch 9/10:  61%|██████    | 1343/2208 [01:16<00:50, 17.25it/s][A
Epoch 9/10:  61%|██████    | 1346/2208 [01:16<00:47, 18.31it/s][A
Epoch 9/10:  61%|██████    | 1349/2208 [01:16<00:45, 19.04it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  61%|██████▏   | 1354/2208 [01:17<01:01, 13.92it/s][A

Batch 1350: Training loss = 0.1994, Training accuracy = 0.9594, F1 = 0.9594



Epoch 9/10:  61%|██████▏   | 1357/2208 [01:17<00:54, 15.68it/s][A
Epoch 9/10:  62%|██████▏   | 1360/2208 [01:17<00:49, 16.98it/s][A
Epoch 9/10:  62%|██████▏   | 1363/2208 [01:17<00:46, 18.09it/s][A
Epoch 9/10:  62%|██████▏   | 1366/2208 [01:17<00:44, 18.90it/s][A
Epoch 9/10:  62%|██████▏   | 1369/2208 [01:18<00:43, 19.47it/s][A
Epoch 9/10:  62%|██████▏   | 1372/2208 [01:18<00:41, 19.96it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  62%|██████▏   | 1378/2208 [01:18<01:04, 12.90it/s][A

Batch 1375: Training loss = 0.0932, Training accuracy = 0.9594, F1 = 0.9594



Epoch 9/10:  63%|██████▎   | 1381/2208 [01:18<00:56, 14.67it/s][A
Epoch 9/10:  63%|██████▎   | 1384/2208 [01:19<00:51, 16.09it/s][A
Epoch 9/10:  63%|██████▎   | 1386/2208 [01:19<00:48, 16.80it/s][A
Epoch 9/10:  63%|██████▎   | 1388/2208 [01:19<00:47, 17.43it/s][A
Epoch 9/10:  63%|██████▎   | 1391/2208 [01:19<00:44, 18.51it/s][A
Epoch 9/10:  63%|██████▎   | 1394/2208 [01:19<00:42, 19.23it/s][A
Epoch 9/10:  63%|██████▎   | 1397/2208 [01:19<00:40, 19.94it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  64%|██████▎   | 1403/2208 [01:20<01:02, 12.98it/s][A

Batch 1400: Training loss = 0.0995, Training accuracy = 0.9593, F1 = 0.9592



Epoch 9/10:  64%|██████▎   | 1406/2208 [01:20<00:54, 14.77it/s][A
Epoch 9/10:  64%|██████▍   | 1409/2208 [01:20<00:49, 16.30it/s][A
Epoch 9/10:  64%|██████▍   | 1412/2208 [01:20<00:45, 17.54it/s][A
Epoch 9/10:  64%|██████▍   | 1415/2208 [01:20<00:42, 18.53it/s][A
Epoch 9/10:  64%|██████▍   | 1418/2208 [01:20<00:41, 19.26it/s][A
Epoch 9/10:  64%|██████▍   | 1421/2208 [01:21<00:39, 19.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  65%|██████▍   | 1427/2208 [01:21<01:04, 12.20it/s][A
Epoch 9/10:  65%|██████▍   | 1430/2208 [01:21<00:55, 13.99it/s][A

Batch 1425: Training loss = 0.0484, Training accuracy = 0.9593, F1 = 0.9593



Epoch 9/10:  65%|██████▍   | 1433/2208 [01:22<00:49, 15.68it/s][A
Epoch 9/10:  65%|██████▌   | 1436/2208 [01:22<00:45, 17.10it/s][A
Epoch 9/10:  65%|██████▌   | 1439/2208 [01:22<00:42, 18.21it/s][A
Epoch 9/10:  65%|██████▌   | 1442/2208 [01:22<00:40, 19.06it/s][A
Epoch 9/10:  65%|██████▌   | 1445/2208 [01:22<00:38, 19.81it/s][A
Epoch 9/10:  66%|██████▌   | 1448/2208 [01:22<00:37, 20.31it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  66%|██████▌   | 1454/2208 [01:23<00:51, 14.54it/s][A

Batch 1450: Training loss = 0.0907, Training accuracy = 0.9594, F1 = 0.9594



Epoch 9/10:  66%|██████▌   | 1457/2208 [01:23<00:46, 16.08it/s][A
Epoch 9/10:  66%|██████▌   | 1460/2208 [01:23<00:43, 17.25it/s][A
Epoch 9/10:  66%|██████▋   | 1463/2208 [01:23<00:40, 18.28it/s][A
Epoch 9/10:  66%|██████▋   | 1466/2208 [01:23<00:39, 18.97it/s][A
Epoch 9/10:  67%|██████▋   | 1469/2208 [01:23<00:37, 19.68it/s][A
Epoch 9/10:  67%|██████▋   | 1472/2208 [01:24<00:36, 20.20it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  67%|██████▋   | 1478/2208 [01:24<00:56, 12.81it/s][A

Batch 1475: Training loss = 0.0804, Training accuracy = 0.9595, F1 = 0.9594



Epoch 9/10:  67%|██████▋   | 1481/2208 [01:24<00:49, 14.60it/s][A
Epoch 9/10:  67%|██████▋   | 1484/2208 [01:24<00:44, 16.18it/s][A
Epoch 9/10:  67%|██████▋   | 1487/2208 [01:25<00:41, 17.42it/s][A
Epoch 9/10:  67%|██████▋   | 1490/2208 [01:25<00:39, 18.37it/s][A
Epoch 9/10:  68%|██████▊   | 1493/2208 [01:25<00:37, 19.09it/s][A
Epoch 9/10:  68%|██████▊   | 1496/2208 [01:25<00:35, 19.80it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  68%|██████▊   | 1502/2208 [01:26<00:55, 12.66it/s][A
Epoch 9/10:  68%|██████▊   | 1505/2208 [01:26<00:48, 14.48it/s][A

Batch 1500: Training loss = 0.1681, Training accuracy = 0.9596, F1 = 0.9596



Epoch 9/10:  68%|██████▊   | 1508/2208 [01:26<00:43, 16.04it/s][A
Epoch 9/10:  68%|██████▊   | 1511/2208 [01:26<00:40, 17.22it/s][A
Epoch 9/10:  69%|██████▊   | 1514/2208 [01:26<00:38, 18.17it/s][A
Epoch 9/10:  69%|██████▊   | 1517/2208 [01:26<00:36, 18.89it/s][A
Epoch 9/10:  69%|██████▉   | 1520/2208 [01:26<00:35, 19.57it/s][A
Epoch 9/10:  69%|██████▉   | 1523/2208 [01:27<00:35, 19.33it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  69%|██████▉   | 1529/2208 [01:27<00:52, 12.92it/s][A

Batch 1525: Training loss = 0.1201, Training accuracy = 0.9597, F1 = 0.9597



Epoch 9/10:  69%|██████▉   | 1532/2208 [01:27<00:46, 14.56it/s][A
Epoch 9/10:  69%|██████▉   | 1534/2208 [01:28<00:43, 15.49it/s][A
Epoch 9/10:  70%|██████▉   | 1537/2208 [01:28<00:39, 16.99it/s][A
Epoch 9/10:  70%|██████▉   | 1540/2208 [01:28<00:37, 18.05it/s][A
Epoch 9/10:  70%|██████▉   | 1543/2208 [01:28<00:35, 18.99it/s][A
Epoch 9/10:  70%|███████   | 1546/2208 [01:28<00:33, 19.47it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  70%|███████   | 1552/2208 [01:29<00:54, 12.00it/s][A
Epoch 9/10:  70%|███████   | 1555/2208 [01:29<00:47, 13.85it/s][A

Batch 1550: Training loss = 0.0320, Training accuracy = 0.9597, F1 = 0.9597



Epoch 9/10:  71%|███████   | 1558/2208 [01:29<00:42, 15.43it/s][A
Epoch 9/10:  71%|███████   | 1561/2208 [01:29<00:38, 16.72it/s][A
Epoch 9/10:  71%|███████   | 1564/2208 [01:29<00:36, 17.85it/s][A
Epoch 9/10:  71%|███████   | 1567/2208 [01:29<00:34, 18.65it/s][A
Epoch 9/10:  71%|███████   | 1570/2208 [01:30<00:33, 19.31it/s][A
Epoch 9/10:  71%|███████   | 1573/2208 [01:30<00:32, 19.70it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  72%|███████▏  | 1579/2208 [01:30<00:45, 13.85it/s][A

Batch 1575: Training loss = 0.0316, Training accuracy = 0.9598, F1 = 0.9597



Epoch 9/10:  72%|███████▏  | 1582/2208 [01:31<00:40, 15.48it/s][A
Epoch 9/10:  72%|███████▏  | 1585/2208 [01:31<00:37, 16.82it/s][A
Epoch 9/10:  72%|███████▏  | 1588/2208 [01:31<00:34, 17.95it/s][A
Epoch 9/10:  72%|███████▏  | 1591/2208 [01:31<00:32, 18.71it/s][A
Epoch 9/10:  72%|███████▏  | 1594/2208 [01:31<00:33, 18.07it/s][A
Epoch 9/10:  72%|███████▏  | 1597/2208 [01:31<00:32, 18.92it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  73%|███████▎  | 1603/2208 [01:32<00:49, 12.15it/s][A

Batch 1600: Training loss = 0.0807, Training accuracy = 0.9598, F1 = 0.9598



Epoch 9/10:  73%|███████▎  | 1606/2208 [01:32<00:42, 14.01it/s][A
Epoch 9/10:  73%|███████▎  | 1609/2208 [01:32<00:38, 15.56it/s][A
Epoch 9/10:  73%|███████▎  | 1612/2208 [01:32<00:35, 16.92it/s][A
Epoch 9/10:  73%|███████▎  | 1615/2208 [01:32<00:32, 18.03it/s][A
Epoch 9/10:  73%|███████▎  | 1618/2208 [01:33<00:31, 18.77it/s][A
Epoch 9/10:  73%|███████▎  | 1621/2208 [01:33<00:30, 19.48it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  74%|███████▎  | 1627/2208 [01:33<00:48, 12.06it/s][A
Epoch 9/10:  74%|███████▍  | 1630/2208 [01:33<00:41, 13.95it/s][A

Batch 1625: Training loss = 0.0520, Training accuracy = 0.9599, F1 = 0.9598



Epoch 9/10:  74%|███████▍  | 1633/2208 [01:34<00:37, 15.54it/s][A
Epoch 9/10:  74%|███████▍  | 1636/2208 [01:34<00:33, 16.91it/s][A
Epoch 9/10:  74%|███████▍  | 1639/2208 [01:34<00:31, 17.97it/s][A
Epoch 9/10:  74%|███████▍  | 1642/2208 [01:34<00:29, 18.93it/s][A
Epoch 9/10:  75%|███████▍  | 1645/2208 [01:34<00:28, 19.70it/s][A
Epoch 9/10:  75%|███████▍  | 1648/2208 [01:34<00:27, 20.16it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  75%|███████▍  | 1654/2208 [01:35<00:41, 13.48it/s][A

Batch 1650: Training loss = 0.0953, Training accuracy = 0.9598, F1 = 0.9598



Epoch 9/10:  75%|███████▌  | 1657/2208 [01:35<00:36, 15.20it/s][A
Epoch 9/10:  75%|███████▌  | 1659/2208 [01:35<00:34, 15.99it/s][A
Epoch 9/10:  75%|███████▌  | 1662/2208 [01:35<00:31, 17.38it/s][A
Epoch 9/10:  75%|███████▌  | 1665/2208 [01:36<00:29, 18.36it/s][A
Epoch 9/10:  76%|███████▌  | 1668/2208 [01:36<00:28, 19.21it/s][A
Epoch 9/10:  76%|███████▌  | 1671/2208 [01:36<00:27, 19.78it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  76%|███████▌  | 1677/2208 [01:36<00:43, 12.19it/s][A
Epoch 9/10:  76%|███████▌  | 1680/2208 [01:37<00:37, 14.03it/s][A

Batch 1675: Training loss = 0.0688, Training accuracy = 0.9599, F1 = 0.9599



Epoch 9/10:  76%|███████▌  | 1683/2208 [01:37<00:33, 15.66it/s][A
Epoch 9/10:  76%|███████▋  | 1686/2208 [01:37<00:30, 17.04it/s][A
Epoch 9/10:  76%|███████▋  | 1689/2208 [01:37<00:28, 18.08it/s][A
Epoch 9/10:  77%|███████▋  | 1692/2208 [01:37<00:27, 18.93it/s][A
Epoch 9/10:  77%|███████▋  | 1695/2208 [01:37<00:26, 19.56it/s][A
Epoch 9/10:  77%|███████▋  | 1698/2208 [01:37<00:25, 20.14it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  77%|███████▋  | 1704/2208 [01:38<00:36, 13.81it/s][A

Batch 1700: Training loss = 0.1245, Training accuracy = 0.9600, F1 = 0.9599



Epoch 9/10:  77%|███████▋  | 1707/2208 [01:38<00:32, 15.49it/s][A
Epoch 9/10:  77%|███████▋  | 1710/2208 [01:38<00:29, 16.86it/s][A
Epoch 9/10:  78%|███████▊  | 1713/2208 [01:38<00:27, 18.10it/s][A
Epoch 9/10:  78%|███████▊  | 1716/2208 [01:39<00:25, 18.95it/s][A
Epoch 9/10:  78%|███████▊  | 1719/2208 [01:39<00:24, 19.67it/s][A
Epoch 9/10:  78%|███████▊  | 1722/2208 [01:39<00:24, 20.10it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  78%|███████▊  | 1728/2208 [01:40<00:41, 11.53it/s][A

Batch 1725: Training loss = 0.1124, Training accuracy = 0.9600, F1 = 0.9599



Epoch 9/10:  78%|███████▊  | 1731/2208 [01:40<00:35, 13.37it/s][A
Epoch 9/10:  79%|███████▊  | 1734/2208 [01:40<00:31, 14.96it/s][A
Epoch 9/10:  79%|███████▊  | 1737/2208 [01:40<00:28, 16.48it/s][A
Epoch 9/10:  79%|███████▉  | 1740/2208 [01:40<00:26, 17.59it/s][A
Epoch 9/10:  79%|███████▉  | 1743/2208 [01:40<00:25, 18.51it/s][A
Epoch 9/10:  79%|███████▉  | 1746/2208 [01:40<00:23, 19.29it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  79%|███████▉  | 1752/2208 [01:41<00:40, 11.14it/s][A
Epoch 9/10:  79%|███████▉  | 1755/2208 [01:41<00:34, 13.06it/s][A

Batch 1750: Training loss = 0.1268, Training accuracy = 0.9600, F1 = 0.9599



Epoch 9/10:  80%|███████▉  | 1758/2208 [01:41<00:30, 14.69it/s][A
Epoch 9/10:  80%|███████▉  | 1761/2208 [01:41<00:27, 16.12it/s][A
Epoch 9/10:  80%|███████▉  | 1764/2208 [01:42<00:25, 17.37it/s][A
Epoch 9/10:  80%|████████  | 1767/2208 [01:42<00:23, 18.45it/s][A
Epoch 9/10:  80%|████████  | 1770/2208 [01:42<00:24, 17.83it/s][A
Epoch 9/10:  80%|████████  | 1773/2208 [01:42<00:23, 18.61it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  81%|████████  | 1779/2208 [01:43<00:34, 12.44it/s][A

Batch 1775: Training loss = 0.1004, Training accuracy = 0.9600, F1 = 0.9600



Epoch 9/10:  81%|████████  | 1782/2208 [01:43<00:30, 14.18it/s][A
Epoch 9/10:  81%|████████  | 1785/2208 [01:43<00:26, 15.76it/s][A
Epoch 9/10:  81%|████████  | 1788/2208 [01:43<00:24, 16.96it/s][A
Epoch 9/10:  81%|████████  | 1791/2208 [01:43<00:23, 17.94it/s][A
Epoch 9/10:  81%|████████▏ | 1794/2208 [01:44<00:22, 18.70it/s][A
Epoch 9/10:  81%|████████▏ | 1797/2208 [01:44<00:22, 18.38it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  82%|████████▏ | 1802/2208 [01:44<00:39, 10.16it/s][A
Epoch 9/10:  82%|████████▏ | 1805/2208 [01:44<00:33, 12.20it/s][A

Batch 1800: Training loss = 0.1699, Training accuracy = 0.9601, F1 = 0.9600



Epoch 9/10:  82%|████████▏ | 1808/2208 [01:45<00:28, 14.05it/s][A
Epoch 9/10:  82%|████████▏ | 1811/2208 [01:45<00:25, 15.68it/s][A
Epoch 9/10:  82%|████████▏ | 1814/2208 [01:45<00:23, 17.07it/s][A
Epoch 9/10:  82%|████████▏ | 1816/2208 [01:45<00:22, 17.35it/s][A
Epoch 9/10:  82%|████████▏ | 1819/2208 [01:45<00:21, 18.51it/s][A
Epoch 9/10:  82%|████████▏ | 1821/2208 [01:45<00:21, 17.84it/s][A
Epoch 9/10:  83%|████████▎ | 1824/2208 [01:45<00:20, 18.84it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  83%|████████▎ | 1829/2208 [01:46<00:31, 12.16it/s][A

Batch 1825: Training loss = 0.0517, Training accuracy = 0.9600, F1 = 0.9600



Epoch 9/10:  83%|████████▎ | 1832/2208 [01:46<00:26, 14.21it/s][A
Epoch 9/10:  83%|████████▎ | 1835/2208 [01:46<00:23, 15.97it/s][A
Epoch 9/10:  83%|████████▎ | 1838/2208 [01:46<00:21, 17.19it/s][A
Epoch 9/10:  83%|████████▎ | 1841/2208 [01:47<00:20, 18.24it/s][A
Epoch 9/10:  84%|████████▎ | 1844/2208 [01:47<00:19, 19.07it/s][A
Epoch 9/10:  84%|████████▎ | 1847/2208 [01:47<00:18, 19.60it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  84%|████████▍ | 1853/2208 [01:48<00:31, 11.27it/s][A

Batch 1850: Training loss = 0.0408, Training accuracy = 0.9601, F1 = 0.9600



Epoch 9/10:  84%|████████▍ | 1856/2208 [01:48<00:26, 13.17it/s][A
Epoch 9/10:  84%|████████▍ | 1859/2208 [01:48<00:23, 14.90it/s][A
Epoch 9/10:  84%|████████▍ | 1862/2208 [01:48<00:21, 16.37it/s][A
Epoch 9/10:  84%|████████▍ | 1865/2208 [01:48<00:19, 17.58it/s][A
Epoch 9/10:  85%|████████▍ | 1868/2208 [01:48<00:18, 18.47it/s][A
Epoch 9/10:  85%|████████▍ | 1871/2208 [01:48<00:17, 19.14it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  85%|████████▌ | 1877/2208 [01:49<00:29, 11.20it/s][A
Epoch 9/10:  85%|████████▌ | 1880/2208 [01:49<00:24, 13.13it/s][A

Batch 1875: Training loss = 0.1730, Training accuracy = 0.9601, F1 = 0.9601



Epoch 9/10:  85%|████████▌ | 1883/2208 [01:49<00:21, 14.84it/s][A
Epoch 9/10:  85%|████████▌ | 1886/2208 [01:50<00:19, 16.33it/s][A
Epoch 9/10:  86%|████████▌ | 1889/2208 [01:50<00:18, 17.44it/s][A
Epoch 9/10:  86%|████████▌ | 1892/2208 [01:50<00:17, 18.52it/s][A
Epoch 9/10:  86%|████████▌ | 1895/2208 [01:50<00:16, 19.21it/s][A
Epoch 9/10:  86%|████████▌ | 1898/2208 [01:50<00:15, 19.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  86%|████████▌ | 1904/2208 [01:51<00:23, 12.83it/s][A

Batch 1900: Training loss = 0.1537, Training accuracy = 0.9601, F1 = 0.9601



Epoch 9/10:  86%|████████▋ | 1907/2208 [01:51<00:20, 14.59it/s][A
Epoch 9/10:  87%|████████▋ | 1910/2208 [01:51<00:18, 16.03it/s][A
Epoch 9/10:  87%|████████▋ | 1913/2208 [01:51<00:17, 17.22it/s][A
Epoch 9/10:  87%|████████▋ | 1916/2208 [01:51<00:16, 18.13it/s][A
Epoch 9/10:  87%|████████▋ | 1919/2208 [01:52<00:15, 18.93it/s][A
Epoch 9/10:  87%|████████▋ | 1922/2208 [01:52<00:14, 19.58it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  87%|████████▋ | 1928/2208 [01:52<00:25, 11.15it/s][A

Batch 1925: Training loss = 0.1584, Training accuracy = 0.9601, F1 = 0.9601



Epoch 9/10:  87%|████████▋ | 1931/2208 [01:52<00:21, 13.01it/s][A
Epoch 9/10:  88%|████████▊ | 1934/2208 [01:53<00:18, 14.71it/s][A
Epoch 9/10:  88%|████████▊ | 1937/2208 [01:53<00:16, 16.12it/s][A
Epoch 9/10:  88%|████████▊ | 1940/2208 [01:53<00:15, 17.33it/s][A
Epoch 9/10:  88%|████████▊ | 1943/2208 [01:53<00:14, 18.32it/s][A
Epoch 9/10:  88%|████████▊ | 1946/2208 [01:53<00:13, 19.06it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  88%|████████▊ | 1952/2208 [01:54<00:22, 11.19it/s][A
Epoch 9/10:  89%|████████▊ | 1955/2208 [01:54<00:19, 13.10it/s][A

Batch 1950: Training loss = 0.1477, Training accuracy = 0.9602, F1 = 0.9601



Epoch 9/10:  89%|████████▊ | 1958/2208 [01:54<00:16, 14.85it/s][A
Epoch 9/10:  89%|████████▉ | 1961/2208 [01:54<00:15, 16.25it/s][A
Epoch 9/10:  89%|████████▉ | 1964/2208 [01:54<00:14, 17.40it/s][A
Epoch 9/10:  89%|████████▉ | 1967/2208 [01:55<00:13, 18.37it/s][A
Epoch 9/10:  89%|████████▉ | 1970/2208 [01:55<00:12, 19.24it/s][A
Epoch 9/10:  89%|████████▉ | 1973/2208 [01:55<00:11, 19.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  90%|████████▉ | 1979/2208 [01:56<00:17, 12.96it/s][A

Batch 1975: Training loss = 0.1847, Training accuracy = 0.9602, F1 = 0.9601



Epoch 9/10:  90%|████████▉ | 1982/2208 [01:56<00:15, 14.73it/s][A
Epoch 9/10:  90%|████████▉ | 1985/2208 [01:56<00:13, 16.22it/s][A
Epoch 9/10:  90%|█████████ | 1988/2208 [01:56<00:12, 17.35it/s][A
Epoch 9/10:  90%|█████████ | 1991/2208 [01:56<00:12, 17.78it/s][A
Epoch 9/10:  90%|█████████ | 1993/2208 [01:56<00:13, 15.75it/s][A
Epoch 9/10:  90%|█████████ | 1996/2208 [01:56<00:12, 17.15it/s][A
Epoch 9/10:  90%|█████████ | 1998/2208 [01:57<00:12, 17.48it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  91%|█████████ | 2004/2208 [01:57<00:17, 11.88it/s][A

Batch 2000: Training loss = 0.0610, Training accuracy = 0.9602, F1 = 0.9602



Epoch 9/10:  91%|█████████ | 2007/2208 [01:57<00:14, 13.85it/s][A
Epoch 9/10:  91%|█████████ | 2010/2208 [01:58<00:12, 15.57it/s][A
Epoch 9/10:  91%|█████████ | 2013/2208 [01:58<00:11, 17.00it/s][A
Epoch 9/10:  91%|█████████▏| 2016/2208 [01:58<00:10, 17.98it/s][A
Epoch 9/10:  91%|█████████▏| 2019/2208 [01:58<00:10, 18.68it/s][A
Epoch 9/10:  92%|█████████▏| 2022/2208 [01:58<00:09, 19.32it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  92%|█████████▏| 2028/2208 [01:59<00:16, 10.98it/s][A

Batch 2025: Training loss = 0.2183, Training accuracy = 0.9602, F1 = 0.9602



Epoch 9/10:  92%|█████████▏| 2031/2208 [01:59<00:13, 12.89it/s][A
Epoch 9/10:  92%|█████████▏| 2034/2208 [01:59<00:11, 14.59it/s][A
Epoch 9/10:  92%|█████████▏| 2037/2208 [01:59<00:10, 16.13it/s][A
Epoch 9/10:  92%|█████████▏| 2040/2208 [01:59<00:09, 17.47it/s][A
Epoch 9/10:  93%|█████████▎| 2043/2208 [02:00<00:09, 16.95it/s][A
Epoch 9/10:  93%|█████████▎| 2046/2208 [02:00<00:09, 17.99it/s][A
Epoch 9/10:  93%|█████████▎| 2048/2208 [02:00<00:08, 18.35it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  93%|█████████▎| 2054/2208 [02:01<00:12, 12.23it/s][A

Batch 2050: Training loss = 0.0702, Training accuracy = 0.9602, F1 = 0.9601



Epoch 9/10:  93%|█████████▎| 2057/2208 [02:01<00:10, 14.07it/s][A
Epoch 9/10:  93%|█████████▎| 2060/2208 [02:01<00:09, 15.72it/s][A
Epoch 9/10:  93%|█████████▎| 2063/2208 [02:01<00:08, 17.03it/s][A
Epoch 9/10:  94%|█████████▎| 2066/2208 [02:01<00:07, 18.05it/s][A
Epoch 9/10:  94%|█████████▎| 2069/2208 [02:01<00:07, 17.82it/s][A
Epoch 9/10:  94%|█████████▍| 2071/2208 [02:01<00:07, 17.84it/s][A
Epoch 9/10:  94%|█████████▍| 2073/2208 [02:02<00:08, 16.84it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  94%|█████████▍| 2079/2208 [02:02<00:11, 11.52it/s][A

Batch 2075: Training loss = 0.0327, Training accuracy = 0.9603, F1 = 0.9602



Epoch 9/10:  94%|█████████▍| 2082/2208 [02:02<00:09, 13.47it/s][A
Epoch 9/10:  94%|█████████▍| 2085/2208 [02:03<00:08, 15.25it/s][A
Epoch 9/10:  95%|█████████▍| 2088/2208 [02:03<00:07, 16.65it/s][A
Epoch 9/10:  95%|█████████▍| 2091/2208 [02:03<00:06, 17.87it/s][A
Epoch 9/10:  95%|█████████▍| 2094/2208 [02:03<00:06, 18.66it/s][A
Epoch 9/10:  95%|█████████▍| 2097/2208 [02:03<00:05, 19.43it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  95%|█████████▌| 2103/2208 [02:04<00:09, 10.51it/s][A

Batch 2100: Training loss = 0.1684, Training accuracy = 0.9602, F1 = 0.9602



Epoch 9/10:  95%|█████████▌| 2106/2208 [02:04<00:08, 12.42it/s][A
Epoch 9/10:  96%|█████████▌| 2109/2208 [02:04<00:06, 14.19it/s][A
Epoch 9/10:  96%|█████████▌| 2112/2208 [02:04<00:06, 15.65it/s][A
Epoch 9/10:  96%|█████████▌| 2115/2208 [02:04<00:05, 16.91it/s][A
Epoch 9/10:  96%|█████████▌| 2118/2208 [02:05<00:04, 18.02it/s][A
Epoch 9/10:  96%|█████████▌| 2121/2208 [02:05<00:04, 18.81it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  96%|█████████▋| 2127/2208 [02:05<00:07, 10.71it/s][A
Epoch 9/10:  96%|█████████▋| 2130/2208 [02:06<00:06, 12.65it/s][A

Batch 2125: Training loss = 0.0484, Training accuracy = 0.9603, F1 = 0.9603



Epoch 9/10:  97%|█████████▋| 2133/2208 [02:06<00:05, 14.40it/s][A
Epoch 9/10:  97%|█████████▋| 2136/2208 [02:06<00:04, 15.94it/s][A
Epoch 9/10:  97%|█████████▋| 2139/2208 [02:06<00:03, 17.26it/s][A
Epoch 9/10:  97%|█████████▋| 2142/2208 [02:06<00:03, 18.39it/s][A
Epoch 9/10:  97%|█████████▋| 2145/2208 [02:06<00:03, 19.14it/s][A
Epoch 9/10:  97%|█████████▋| 2148/2208 [02:06<00:03, 19.66it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  98%|█████████▊| 2154/2208 [02:07<00:04, 12.22it/s][A

Batch 2150: Training loss = 0.0760, Training accuracy = 0.9603, F1 = 0.9603



Epoch 9/10:  98%|█████████▊| 2157/2208 [02:07<00:03, 14.05it/s][A
Epoch 9/10:  98%|█████████▊| 2160/2208 [02:07<00:03, 15.57it/s][A
Epoch 9/10:  98%|█████████▊| 2163/2208 [02:08<00:02, 16.90it/s][A
Epoch 9/10:  98%|█████████▊| 2166/2208 [02:08<00:02, 17.99it/s][A
Epoch 9/10:  98%|█████████▊| 2169/2208 [02:08<00:02, 18.78it/s][A
Epoch 9/10:  98%|█████████▊| 2172/2208 [02:08<00:01, 19.35it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10:  99%|█████████▊| 2178/2208 [02:09<00:03,  9.81it/s][A

Batch 2175: Training loss = 0.2032, Training accuracy = 0.9604, F1 = 0.9604



Epoch 9/10:  99%|█████████▉| 2181/2208 [02:09<00:02, 11.74it/s][A
Epoch 9/10:  99%|█████████▉| 2184/2208 [02:09<00:01, 13.61it/s][A
Epoch 9/10:  99%|█████████▉| 2187/2208 [02:09<00:01, 15.25it/s][A
Epoch 9/10:  99%|█████████▉| 2190/2208 [02:09<00:01, 16.64it/s][A
Epoch 9/10:  99%|█████████▉| 2193/2208 [02:10<00:00, 17.74it/s][A
Epoch 9/10:  99%|█████████▉| 2196/2208 [02:10<00:00, 18.62it/s][A
  with torch.cuda.amp.autocast():

Epoch 9/10: 100%|█████████▉| 2202/2208 [02:10<00:00, 10.53it/s][A
Epoch 9/10: 100%|█████████▉| 2205/2208 [02:11<00:00, 12.47it/s][A

Batch 2200: Training loss = 0.1309, Training accuracy = 0.9604, F1 = 0.9604



Epoch 9/10: 100%|██████████| 2208/2208 [02:11<00:00, 14.31it/s][A
                                                               [A


Epoch 9 Training Metrics:
Loss: 0.1205
Accuracy: 0.9604
F1 Score: 0.9604
Precision: 0.9604
Recall: 0.9604

Starting validation...



Validation:   0%|          | 0/552 [00:00<?, ?it/s][A
Validation:   0%|          | 1/552 [00:01<14:46,  1.61s/it][A
Validation:   0%|          | 2/552 [00:01<06:40,  1.37it/s][A
Validation:   1%|          | 4/552 [00:01<02:47,  3.28it/s][A
Validation:   1%|          | 6/552 [00:01<01:41,  5.36it/s][A
Validation:   1%|▏         | 8/552 [00:02<01:12,  7.51it/s][A
Validation:   2%|▏         | 10/552 [00:02<00:56,  9.61it/s][A
Validation:   2%|▏         | 12/552 [00:02<00:46, 11.54it/s][A
Validation:   3%|▎         | 14/552 [00:02<00:40, 13.26it/s][A
Validation:   3%|▎         | 16/552 [00:02<00:36, 14.73it/s][A
Validation:   3%|▎         | 18/552 [00:02<00:33, 15.76it/s][A
Validation:   4%|▎         | 20/552 [00:02<00:31, 16.63it/s][A
Validation:   4%|▍         | 22/552 [00:02<00:30, 17.26it/s][A
Validation:   4%|▍         | 24/552 [00:02<00:29, 17.67it/s][A
Validation:   5%|▍         | 26/552 [00:02<00:29, 18.04it/s][A
Validation:   5%|▌         | 28/552 [00:03<00:28, 18.


Epoch 9 Validation Metrics:
Loss: 0.1427
Accuracy: 0.9560
F1 Score: 0.9558
Precision: 0.9576
Recall: 0.9560

Starting epoch 10/10



  with torch.cuda.amp.autocast():

  with torch.cuda.amp.autocast():

Epoch 10/10:   0%|          | 3/2208 [00:01<17:45,  2.07it/s]  [A

Batch 0: Training loss = 0.0572, Training accuracy = 0.9688, F1 = 0.9688



Epoch 10/10:   0%|          | 5/2208 [00:02<10:28,  3.50it/s][A
Epoch 10/10:   0%|          | 8/2208 [00:02<05:53,  6.22it/s][A
Epoch 10/10:   0%|          | 11/2208 [00:02<04:06,  8.90it/s][A
Epoch 10/10:   1%|          | 14/2208 [00:02<03:12, 11.37it/s][A
Epoch 10/10:   1%|          | 17/2208 [00:02<02:41, 13.60it/s][A
Epoch 10/10:   1%|          | 20/2208 [00:02<02:22, 15.41it/s][A
Epoch 10/10:   1%|          | 23/2208 [00:02<02:09, 16.89it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:   1%|▏         | 29/2208 [00:03<01:59, 18.20it/s][A

Batch 25: Training loss = 0.0517, Training accuracy = 0.9642, F1 = 0.9641



Epoch 10/10:   1%|▏         | 32/2208 [00:03<01:54, 19.01it/s][A
Epoch 10/10:   2%|▏         | 35/2208 [00:03<01:50, 19.60it/s][A
Epoch 10/10:   2%|▏         | 38/2208 [00:03<01:54, 19.02it/s][A
Epoch 10/10:   2%|▏         | 41/2208 [00:03<02:01, 17.84it/s][A
Epoch 10/10:   2%|▏         | 44/2208 [00:03<01:55, 18.75it/s][A
Epoch 10/10:   2%|▏         | 47/2208 [00:04<01:51, 19.31it/s][A
Epoch 10/10:   2%|▏         | 49/2208 [00:04<02:12, 16.27it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:   2%|▏         | 54/2208 [00:04<02:01, 17.73it/s][A

Batch 50: Training loss = 0.1138, Training accuracy = 0.9622, F1 = 0.9621



Epoch 10/10:   3%|▎         | 57/2208 [00:04<01:54, 18.76it/s][A
Epoch 10/10:   3%|▎         | 60/2208 [00:04<01:50, 19.42it/s][A
Epoch 10/10:   3%|▎         | 63/2208 [00:04<01:47, 19.98it/s][A
Epoch 10/10:   3%|▎         | 66/2208 [00:05<01:45, 20.33it/s][A
Epoch 10/10:   3%|▎         | 69/2208 [00:05<01:44, 20.52it/s][A
Epoch 10/10:   3%|▎         | 72/2208 [00:05<01:42, 20.77it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:   4%|▎         | 78/2208 [00:05<01:45, 20.15it/s][A

Batch 75: Training loss = 0.1628, Training accuracy = 0.9608, F1 = 0.9608



Epoch 10/10:   4%|▎         | 81/2208 [00:05<01:45, 20.22it/s][A
Epoch 10/10:   4%|▍         | 84/2208 [00:06<01:43, 20.56it/s][A
Epoch 10/10:   4%|▍         | 87/2208 [00:06<01:43, 20.45it/s][A
Epoch 10/10:   4%|▍         | 90/2208 [00:06<01:42, 20.76it/s][A
Epoch 10/10:   4%|▍         | 93/2208 [00:06<01:42, 20.72it/s][A
Epoch 10/10:   4%|▍         | 96/2208 [00:06<01:41, 20.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:   5%|▍         | 102/2208 [00:06<01:45, 19.98it/s][A
Epoch 10/10:   5%|▍         | 105/2208 [00:07<01:43, 20.37it/s][A

Batch 100: Training loss = 0.0745, Training accuracy = 0.9619, F1 = 0.9619



Epoch 10/10:   5%|▍         | 108/2208 [00:07<01:42, 20.47it/s][A
Epoch 10/10:   5%|▌         | 111/2208 [00:07<01:42, 20.47it/s][A
Epoch 10/10:   5%|▌         | 114/2208 [00:07<01:46, 19.73it/s][A
Epoch 10/10:   5%|▌         | 117/2208 [00:07<01:44, 20.00it/s][A
Epoch 10/10:   5%|▌         | 120/2208 [00:07<01:50, 18.89it/s][A
Epoch 10/10:   6%|▌         | 123/2208 [00:07<01:46, 19.54it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:   6%|▌         | 128/2208 [00:08<01:52, 18.49it/s][A

Batch 125: Training loss = 0.0901, Training accuracy = 0.9627, F1 = 0.9627



Epoch 10/10:   6%|▌         | 131/2208 [00:08<01:48, 19.18it/s][A
Epoch 10/10:   6%|▌         | 133/2208 [00:08<01:47, 19.23it/s][A
Epoch 10/10:   6%|▌         | 136/2208 [00:08<01:44, 19.74it/s][A
Epoch 10/10:   6%|▋         | 139/2208 [00:08<01:42, 20.26it/s][A
Epoch 10/10:   6%|▋         | 142/2208 [00:08<01:41, 20.40it/s][A
Epoch 10/10:   7%|▋         | 145/2208 [00:09<01:43, 19.85it/s][A
Epoch 10/10:   7%|▋         | 148/2208 [00:09<01:41, 20.30it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:   7%|▋         | 154/2208 [00:09<01:49, 18.68it/s][A

Batch 150: Training loss = 0.0569, Training accuracy = 0.9642, F1 = 0.9641



Epoch 10/10:   7%|▋         | 157/2208 [00:09<01:57, 17.41it/s][A
Epoch 10/10:   7%|▋         | 160/2208 [00:09<01:51, 18.29it/s][A
Epoch 10/10:   7%|▋         | 162/2208 [00:10<01:58, 17.29it/s][A
Epoch 10/10:   7%|▋         | 165/2208 [00:10<02:00, 16.91it/s][A
Epoch 10/10:   8%|▊         | 168/2208 [00:10<01:53, 18.01it/s][A
Epoch 10/10:   8%|▊         | 171/2208 [00:10<01:47, 18.88it/s][A
Epoch 10/10:   8%|▊         | 174/2208 [00:10<01:49, 18.55it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:   8%|▊         | 178/2208 [00:10<01:58, 17.12it/s][A

Batch 175: Training loss = 0.0657, Training accuracy = 0.9638, F1 = 0.9637



Epoch 10/10:   8%|▊         | 181/2208 [00:11<01:52, 18.06it/s][A
Epoch 10/10:   8%|▊         | 183/2208 [00:11<01:49, 18.48it/s][A
Epoch 10/10:   8%|▊         | 185/2208 [00:11<01:49, 18.49it/s][A
Epoch 10/10:   9%|▊         | 188/2208 [00:11<01:45, 19.13it/s][A
Epoch 10/10:   9%|▊         | 190/2208 [00:11<01:55, 17.54it/s][A
Epoch 10/10:   9%|▊         | 193/2208 [00:11<01:48, 18.60it/s][A
Epoch 10/10:   9%|▉         | 196/2208 [00:11<01:43, 19.35it/s][A
Epoch 10/10:   9%|▉         | 198/2208 [00:11<01:44, 19.22it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:   9%|▉         | 204/2208 [00:12<01:45, 19.08it/s][A

Batch 200: Training loss = 0.1930, Training accuracy = 0.9632, F1 = 0.9631



Epoch 10/10:   9%|▉         | 207/2208 [00:12<01:41, 19.64it/s][A
Epoch 10/10:  10%|▉         | 210/2208 [00:12<01:40, 19.94it/s][A
Epoch 10/10:  10%|▉         | 212/2208 [00:12<01:46, 18.81it/s][A
Epoch 10/10:  10%|▉         | 214/2208 [00:12<01:44, 19.05it/s][A
Epoch 10/10:  10%|▉         | 216/2208 [00:12<01:51, 17.94it/s][A
Epoch 10/10:  10%|▉         | 219/2208 [00:13<01:55, 17.26it/s][A
Epoch 10/10:  10%|█         | 222/2208 [00:13<01:48, 18.29it/s][A
Epoch 10/10:  10%|█         | 224/2208 [00:13<01:59, 16.62it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  10%|█         | 228/2208 [00:13<02:02, 16.11it/s][A

Batch 225: Training loss = 0.0674, Training accuracy = 0.9632, F1 = 0.9632



Epoch 10/10:  10%|█         | 231/2208 [00:13<01:51, 17.67it/s][A
Epoch 10/10:  11%|█         | 233/2208 [00:13<01:48, 18.13it/s][A
Epoch 10/10:  11%|█         | 235/2208 [00:14<01:46, 18.58it/s][A
Epoch 10/10:  11%|█         | 237/2208 [00:14<01:45, 18.62it/s][A
Epoch 10/10:  11%|█         | 240/2208 [00:14<01:44, 18.85it/s][A
Epoch 10/10:  11%|█         | 243/2208 [00:14<01:44, 18.87it/s][A
Epoch 10/10:  11%|█         | 246/2208 [00:14<01:42, 19.11it/s][A
Epoch 10/10:  11%|█         | 248/2208 [00:14<01:59, 16.34it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  12%|█▏        | 254/2208 [00:15<01:54, 17.10it/s][A

Batch 250: Training loss = 0.3048, Training accuracy = 0.9631, F1 = 0.9630



Epoch 10/10:  12%|█▏        | 257/2208 [00:15<01:46, 18.24it/s][A
Epoch 10/10:  12%|█▏        | 260/2208 [00:15<01:42, 18.98it/s][A
Epoch 10/10:  12%|█▏        | 263/2208 [00:15<01:47, 18.16it/s][A
Epoch 10/10:  12%|█▏        | 266/2208 [00:15<01:41, 19.05it/s][A
Epoch 10/10:  12%|█▏        | 269/2208 [00:15<01:39, 19.53it/s][A
Epoch 10/10:  12%|█▏        | 271/2208 [00:16<01:43, 18.65it/s][A
Epoch 10/10:  12%|█▏        | 274/2208 [00:16<01:39, 19.37it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  13%|█▎        | 278/2208 [00:16<01:54, 16.87it/s][A

Batch 275: Training loss = 0.0490, Training accuracy = 0.9632, F1 = 0.9631



Epoch 10/10:  13%|█▎        | 281/2208 [00:16<01:46, 18.06it/s][A
Epoch 10/10:  13%|█▎        | 284/2208 [00:16<01:41, 19.00it/s][A
Epoch 10/10:  13%|█▎        | 287/2208 [00:16<01:37, 19.69it/s][A
Epoch 10/10:  13%|█▎        | 290/2208 [00:17<01:35, 20.04it/s][A
Epoch 10/10:  13%|█▎        | 293/2208 [00:17<01:37, 19.61it/s][A
Epoch 10/10:  13%|█▎        | 296/2208 [00:17<01:34, 20.13it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  14%|█▎        | 302/2208 [00:17<01:43, 18.50it/s][A
Epoch 10/10:  14%|█▍        | 304/2208 [00:17<01:44, 18.19it/s][A

Batch 300: Training loss = 0.0991, Training accuracy = 0.9631, F1 = 0.9630



Epoch 10/10:  14%|█▍        | 307/2208 [00:17<01:47, 17.71it/s][A
Epoch 10/10:  14%|█▍        | 310/2208 [00:18<01:41, 18.74it/s][A
Epoch 10/10:  14%|█▍        | 313/2208 [00:18<01:37, 19.47it/s][A
Epoch 10/10:  14%|█▍        | 316/2208 [00:18<01:34, 20.02it/s][A
Epoch 10/10:  14%|█▍        | 319/2208 [00:18<01:32, 20.37it/s][A
Epoch 10/10:  15%|█▍        | 322/2208 [00:18<01:32, 20.48it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  15%|█▍        | 328/2208 [00:19<01:44, 17.92it/s][A

Batch 325: Training loss = 0.0601, Training accuracy = 0.9628, F1 = 0.9627



Epoch 10/10:  15%|█▍        | 331/2208 [00:19<01:40, 18.73it/s][A
Epoch 10/10:  15%|█▌        | 334/2208 [00:19<01:36, 19.35it/s][A
Epoch 10/10:  15%|█▌        | 337/2208 [00:19<01:41, 18.44it/s][A
Epoch 10/10:  15%|█▌        | 340/2208 [00:19<01:37, 19.06it/s][A
Epoch 10/10:  16%|█▌        | 343/2208 [00:19<01:34, 19.65it/s][A
Epoch 10/10:  16%|█▌        | 345/2208 [00:19<01:52, 16.49it/s][A
Epoch 10/10:  16%|█▌        | 348/2208 [00:20<01:44, 17.87it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  16%|█▌        | 354/2208 [00:20<01:43, 17.85it/s][A

Batch 350: Training loss = 0.0751, Training accuracy = 0.9627, F1 = 0.9626



Epoch 10/10:  16%|█▌        | 357/2208 [00:20<01:38, 18.88it/s][A
Epoch 10/10:  16%|█▋        | 360/2208 [00:20<01:35, 19.44it/s][A
Epoch 10/10:  16%|█▋        | 363/2208 [00:20<01:32, 19.84it/s][A
Epoch 10/10:  17%|█▋        | 366/2208 [00:21<01:30, 20.26it/s][A
Epoch 10/10:  17%|█▋        | 369/2208 [00:21<01:29, 20.49it/s][A
Epoch 10/10:  17%|█▋        | 372/2208 [00:21<01:29, 20.52it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  17%|█▋        | 378/2208 [00:21<01:40, 18.26it/s][A

Batch 375: Training loss = 0.2366, Training accuracy = 0.9625, F1 = 0.9625



Epoch 10/10:  17%|█▋        | 381/2208 [00:21<01:35, 19.06it/s][A
Epoch 10/10:  17%|█▋        | 384/2208 [00:21<01:32, 19.71it/s][A
Epoch 10/10:  18%|█▊        | 387/2208 [00:22<01:34, 19.37it/s][A
Epoch 10/10:  18%|█▊        | 390/2208 [00:22<01:30, 20.00it/s][A
Epoch 10/10:  18%|█▊        | 393/2208 [00:22<01:29, 20.30it/s][A
Epoch 10/10:  18%|█▊        | 396/2208 [00:22<01:44, 17.29it/s][A
Epoch 10/10:  18%|█▊        | 399/2208 [00:22<01:39, 18.24it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  18%|█▊        | 404/2208 [00:23<01:45, 17.05it/s][A

Batch 400: Training loss = 0.2540, Training accuracy = 0.9625, F1 = 0.9624



Epoch 10/10:  18%|█▊        | 407/2208 [00:23<01:38, 18.27it/s][A
Epoch 10/10:  19%|█▊        | 410/2208 [00:23<01:34, 19.00it/s][A
Epoch 10/10:  19%|█▊        | 412/2208 [00:23<01:34, 19.08it/s][A
Epoch 10/10:  19%|█▉        | 415/2208 [00:23<01:31, 19.57it/s][A
Epoch 10/10:  19%|█▉        | 418/2208 [00:23<01:28, 20.19it/s][A
Epoch 10/10:  19%|█▉        | 421/2208 [00:23<01:27, 20.45it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  19%|█▉        | 427/2208 [00:24<01:44, 17.11it/s][A
Epoch 10/10:  19%|█▉        | 430/2208 [00:24<01:36, 18.34it/s][A

Batch 425: Training loss = 0.1154, Training accuracy = 0.9627, F1 = 0.9627



Epoch 10/10:  20%|█▉        | 433/2208 [00:24<01:32, 19.13it/s][A
Epoch 10/10:  20%|█▉        | 436/2208 [00:24<01:29, 19.75it/s][A
Epoch 10/10:  20%|█▉        | 439/2208 [00:24<01:33, 18.88it/s][A
Epoch 10/10:  20%|█▉        | 441/2208 [00:25<01:39, 17.68it/s][A
Epoch 10/10:  20%|██        | 443/2208 [00:25<01:41, 17.41it/s][A
Epoch 10/10:  20%|██        | 445/2208 [00:25<01:49, 16.10it/s][A
Epoch 10/10:  20%|██        | 448/2208 [00:25<01:41, 17.36it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  21%|██        | 454/2208 [00:25<01:42, 17.17it/s][A

Batch 450: Training loss = 0.0694, Training accuracy = 0.9628, F1 = 0.9628



Epoch 10/10:  21%|██        | 456/2208 [00:25<01:38, 17.74it/s][A
Epoch 10/10:  21%|██        | 459/2208 [00:26<01:33, 18.63it/s][A
Epoch 10/10:  21%|██        | 461/2208 [00:26<01:37, 18.01it/s][A
Epoch 10/10:  21%|██        | 464/2208 [00:26<01:37, 17.90it/s][A
Epoch 10/10:  21%|██        | 467/2208 [00:26<01:32, 18.84it/s][A
Epoch 10/10:  21%|██        | 469/2208 [00:26<01:36, 18.04it/s][A
Epoch 10/10:  21%|██▏       | 472/2208 [00:26<01:39, 17.37it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  22%|██▏       | 477/2208 [00:27<01:49, 15.83it/s][A
Epoch 10/10:  22%|██▏       | 480/2208 [00:27<01:40, 17.26it/s][A

Batch 475: Training loss = 0.0739, Training accuracy = 0.9626, F1 = 0.9626



Epoch 10/10:  22%|██▏       | 483/2208 [00:27<01:33, 18.40it/s][A
Epoch 10/10:  22%|██▏       | 485/2208 [00:27<01:40, 17.23it/s][A
Epoch 10/10:  22%|██▏       | 487/2208 [00:27<01:36, 17.83it/s][A
Epoch 10/10:  22%|██▏       | 490/2208 [00:27<01:31, 18.88it/s][A
Epoch 10/10:  22%|██▏       | 492/2208 [00:27<01:35, 18.03it/s][A
Epoch 10/10:  22%|██▏       | 495/2208 [00:28<01:30, 19.00it/s][A
Epoch 10/10:  23%|██▎       | 497/2208 [00:28<01:29, 19.21it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  23%|██▎       | 502/2208 [00:28<01:58, 14.40it/s][A
Epoch 10/10:  23%|██▎       | 505/2208 [00:28<01:45, 16.20it/s][A

Batch 500: Training loss = 0.1128, Training accuracy = 0.9629, F1 = 0.9628



Epoch 10/10:  23%|██▎       | 508/2208 [00:28<01:36, 17.58it/s][A
Epoch 10/10:  23%|██▎       | 511/2208 [00:28<01:31, 18.51it/s][A
Epoch 10/10:  23%|██▎       | 513/2208 [00:29<01:30, 18.74it/s][A
Epoch 10/10:  23%|██▎       | 516/2208 [00:29<01:27, 19.39it/s][A
Epoch 10/10:  24%|██▎       | 519/2208 [00:29<01:25, 19.78it/s][A
Epoch 10/10:  24%|██▎       | 522/2208 [00:29<01:26, 19.40it/s][A
Epoch 10/10:  24%|██▎       | 524/2208 [00:29<01:35, 17.71it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  24%|██▍       | 529/2208 [00:30<01:40, 16.66it/s][A

Batch 525: Training loss = 0.0704, Training accuracy = 0.9631, F1 = 0.9630



Epoch 10/10:  24%|██▍       | 532/2208 [00:30<01:33, 17.88it/s][A
Epoch 10/10:  24%|██▍       | 535/2208 [00:30<01:28, 18.81it/s][A
Epoch 10/10:  24%|██▍       | 538/2208 [00:30<01:25, 19.49it/s][A
Epoch 10/10:  24%|██▍       | 540/2208 [00:30<01:25, 19.50it/s][A
Epoch 10/10:  25%|██▍       | 543/2208 [00:30<01:23, 19.92it/s][A
Epoch 10/10:  25%|██▍       | 546/2208 [00:30<01:21, 20.42it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  25%|██▌       | 552/2208 [00:31<01:36, 17.16it/s][A
Epoch 10/10:  25%|██▌       | 555/2208 [00:31<01:30, 18.30it/s][A

Batch 550: Training loss = 0.1368, Training accuracy = 0.9633, F1 = 0.9633



Epoch 10/10:  25%|██▌       | 558/2208 [00:31<01:26, 19.03it/s][A
Epoch 10/10:  25%|██▌       | 561/2208 [00:31<01:23, 19.64it/s][A
Epoch 10/10:  26%|██▌       | 564/2208 [00:31<01:21, 20.08it/s][A
Epoch 10/10:  26%|██▌       | 567/2208 [00:31<01:20, 20.45it/s][A
Epoch 10/10:  26%|██▌       | 570/2208 [00:32<01:19, 20.55it/s][A
Epoch 10/10:  26%|██▌       | 573/2208 [00:32<01:18, 20.80it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  26%|██▌       | 579/2208 [00:32<01:30, 18.07it/s][A

Batch 575: Training loss = 0.1345, Training accuracy = 0.9636, F1 = 0.9636



Epoch 10/10:  26%|██▋       | 582/2208 [00:32<01:25, 18.96it/s][A
Epoch 10/10:  26%|██▋       | 585/2208 [00:32<01:23, 19.54it/s][A
Epoch 10/10:  27%|██▋       | 588/2208 [00:33<01:21, 20.00it/s][A
Epoch 10/10:  27%|██▋       | 591/2208 [00:33<01:19, 20.31it/s][A
Epoch 10/10:  27%|██▋       | 594/2208 [00:33<01:18, 20.54it/s][A
Epoch 10/10:  27%|██▋       | 597/2208 [00:33<01:17, 20.85it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  27%|██▋       | 603/2208 [00:33<01:36, 16.68it/s][A

Batch 600: Training loss = 0.1719, Training accuracy = 0.9637, F1 = 0.9636



Epoch 10/10:  27%|██▋       | 606/2208 [00:34<01:29, 17.89it/s][A
Epoch 10/10:  28%|██▊       | 609/2208 [00:34<01:25, 18.71it/s][A
Epoch 10/10:  28%|██▊       | 612/2208 [00:34<01:22, 19.38it/s][A
Epoch 10/10:  28%|██▊       | 615/2208 [00:34<01:19, 19.92it/s][A
Epoch 10/10:  28%|██▊       | 618/2208 [00:34<01:18, 20.14it/s][A
Epoch 10/10:  28%|██▊       | 621/2208 [00:34<01:17, 20.40it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  28%|██▊       | 627/2208 [00:35<01:39, 15.83it/s][A
Epoch 10/10:  29%|██▊       | 630/2208 [00:35<01:32, 17.14it/s][A

Batch 625: Training loss = 0.1042, Training accuracy = 0.9634, F1 = 0.9634



Epoch 10/10:  29%|██▊       | 633/2208 [00:35<01:26, 18.19it/s][A
Epoch 10/10:  29%|██▉       | 636/2208 [00:35<01:22, 19.03it/s][A
Epoch 10/10:  29%|██▉       | 639/2208 [00:35<01:20, 19.60it/s][A
Epoch 10/10:  29%|██▉       | 642/2208 [00:35<01:17, 20.19it/s][A
Epoch 10/10:  29%|██▉       | 645/2208 [00:35<01:16, 20.55it/s][A
Epoch 10/10:  29%|██▉       | 648/2208 [00:36<01:16, 20.50it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  30%|██▉       | 654/2208 [00:36<01:27, 17.68it/s][A

Batch 650: Training loss = 0.0831, Training accuracy = 0.9637, F1 = 0.9637



Epoch 10/10:  30%|██▉       | 657/2208 [00:36<01:23, 18.52it/s][A
Epoch 10/10:  30%|██▉       | 660/2208 [00:36<01:19, 19.36it/s][A
Epoch 10/10:  30%|███       | 663/2208 [00:36<01:17, 19.92it/s][A
Epoch 10/10:  30%|███       | 666/2208 [00:37<01:15, 20.34it/s][A
Epoch 10/10:  30%|███       | 669/2208 [00:37<01:14, 20.76it/s][A
Epoch 10/10:  30%|███       | 672/2208 [00:37<01:13, 20.90it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  31%|███       | 678/2208 [00:37<01:38, 15.52it/s][A

Batch 675: Training loss = 0.1081, Training accuracy = 0.9637, F1 = 0.9637



Epoch 10/10:  31%|███       | 681/2208 [00:37<01:30, 16.93it/s][A
Epoch 10/10:  31%|███       | 684/2208 [00:38<01:25, 17.92it/s][A
Epoch 10/10:  31%|███       | 687/2208 [00:38<01:21, 18.70it/s][A
Epoch 10/10:  31%|███▏      | 690/2208 [00:38<01:17, 19.50it/s][A
Epoch 10/10:  31%|███▏      | 693/2208 [00:38<01:15, 19.98it/s][A
Epoch 10/10:  32%|███▏      | 696/2208 [00:38<01:14, 20.32it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  32%|███▏      | 702/2208 [00:39<01:34, 15.94it/s][A
Epoch 10/10:  32%|███▏      | 705/2208 [00:39<01:26, 17.29it/s][A

Batch 700: Training loss = 0.1198, Training accuracy = 0.9637, F1 = 0.9636



Epoch 10/10:  32%|███▏      | 708/2208 [00:39<01:22, 18.28it/s][A
Epoch 10/10:  32%|███▏      | 711/2208 [00:39<01:18, 19.01it/s][A
Epoch 10/10:  32%|███▏      | 714/2208 [00:39<01:15, 19.67it/s][A
Epoch 10/10:  32%|███▏      | 717/2208 [00:39<01:14, 20.14it/s][A
Epoch 10/10:  33%|███▎      | 720/2208 [00:39<01:12, 20.40it/s][A
Epoch 10/10:  33%|███▎      | 723/2208 [00:40<01:18, 18.83it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  33%|███▎      | 727/2208 [00:40<01:45, 14.10it/s][A
Epoch 10/10:  33%|███▎      | 729/2208 [00:40<01:37, 15.18it/s][A

Batch 725: Training loss = 0.0734, Training accuracy = 0.9636, F1 = 0.9636



Epoch 10/10:  33%|███▎      | 732/2208 [00:40<01:27, 16.82it/s][A
Epoch 10/10:  33%|███▎      | 735/2208 [00:40<01:21, 18.02it/s][A
Epoch 10/10:  33%|███▎      | 738/2208 [00:41<01:18, 18.77it/s][A
Epoch 10/10:  34%|███▎      | 740/2208 [00:41<01:17, 18.97it/s][A
Epoch 10/10:  34%|███▎      | 743/2208 [00:41<01:15, 19.48it/s][A
Epoch 10/10:  34%|███▍      | 746/2208 [00:41<01:13, 19.89it/s][A
Epoch 10/10:  34%|███▍      | 749/2208 [00:41<01:19, 18.42it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  34%|███▍      | 754/2208 [00:42<01:30, 16.12it/s][A

Batch 750: Training loss = 0.0505, Training accuracy = 0.9636, F1 = 0.9635



Epoch 10/10:  34%|███▍      | 757/2208 [00:42<01:23, 17.44it/s][A
Epoch 10/10:  34%|███▍      | 760/2208 [00:42<01:18, 18.45it/s][A
Epoch 10/10:  35%|███▍      | 763/2208 [00:42<01:15, 19.12it/s][A
Epoch 10/10:  35%|███▍      | 765/2208 [00:42<01:15, 19.24it/s][A
Epoch 10/10:  35%|███▍      | 768/2208 [00:42<01:12, 19.76it/s][A
Epoch 10/10:  35%|███▍      | 771/2208 [00:42<01:16, 18.83it/s][A
Epoch 10/10:  35%|███▌      | 774/2208 [00:43<01:13, 19.43it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  35%|███▌      | 779/2208 [00:43<01:27, 16.31it/s][A

Batch 775: Training loss = 0.1969, Training accuracy = 0.9635, F1 = 0.9635



Epoch 10/10:  35%|███▌      | 782/2208 [00:43<01:21, 17.49it/s][A
Epoch 10/10:  36%|███▌      | 785/2208 [00:43<01:17, 18.47it/s][A
Epoch 10/10:  36%|███▌      | 788/2208 [00:43<01:13, 19.24it/s][A
Epoch 10/10:  36%|███▌      | 791/2208 [00:44<01:19, 17.75it/s][A
Epoch 10/10:  36%|███▌      | 793/2208 [00:44<01:23, 16.96it/s][A
Epoch 10/10:  36%|███▌      | 796/2208 [00:44<01:20, 17.53it/s][A
Epoch 10/10:  36%|███▌      | 799/2208 [00:44<01:16, 18.44it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  36%|███▋      | 804/2208 [00:44<01:29, 15.73it/s][A

Batch 800: Training loss = 0.0479, Training accuracy = 0.9636, F1 = 0.9636



Epoch 10/10:  37%|███▋      | 807/2208 [00:45<01:21, 17.12it/s][A
Epoch 10/10:  37%|███▋      | 809/2208 [00:45<01:19, 17.69it/s][A
Epoch 10/10:  37%|███▋      | 812/2208 [00:45<01:14, 18.63it/s][A
Epoch 10/10:  37%|███▋      | 815/2208 [00:45<01:11, 19.37it/s][A
Epoch 10/10:  37%|███▋      | 818/2208 [00:45<01:09, 19.93it/s][A
Epoch 10/10:  37%|███▋      | 821/2208 [00:45<01:08, 20.35it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  37%|███▋      | 827/2208 [00:46<01:30, 15.21it/s][A
Epoch 10/10:  38%|███▊      | 830/2208 [00:46<01:22, 16.71it/s][A

Batch 825: Training loss = 0.1155, Training accuracy = 0.9637, F1 = 0.9637



Epoch 10/10:  38%|███▊      | 833/2208 [00:46<01:16, 17.90it/s][A
Epoch 10/10:  38%|███▊      | 836/2208 [00:46<01:13, 18.79it/s][A
Epoch 10/10:  38%|███▊      | 839/2208 [00:46<01:09, 19.60it/s][A
Epoch 10/10:  38%|███▊      | 842/2208 [00:46<01:08, 20.04it/s][A
Epoch 10/10:  38%|███▊      | 845/2208 [00:46<01:06, 20.45it/s][A
Epoch 10/10:  38%|███▊      | 848/2208 [00:47<01:05, 20.68it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  39%|███▊      | 854/2208 [00:47<01:21, 16.61it/s][A

Batch 850: Training loss = 0.0722, Training accuracy = 0.9635, F1 = 0.9635



Epoch 10/10:  39%|███▉      | 857/2208 [00:47<01:16, 17.77it/s][A
Epoch 10/10:  39%|███▉      | 860/2208 [00:47<01:11, 18.73it/s][A
Epoch 10/10:  39%|███▉      | 863/2208 [00:48<01:09, 19.35it/s][A
Epoch 10/10:  39%|███▉      | 866/2208 [00:48<01:07, 19.80it/s][A
Epoch 10/10:  39%|███▉      | 869/2208 [00:48<01:05, 20.32it/s][A
Epoch 10/10:  39%|███▉      | 872/2208 [00:48<01:05, 20.43it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  40%|███▉      | 878/2208 [00:48<01:31, 14.47it/s][A

Batch 875: Training loss = 0.0617, Training accuracy = 0.9635, F1 = 0.9635



Epoch 10/10:  40%|███▉      | 881/2208 [00:49<01:22, 16.04it/s][A
Epoch 10/10:  40%|████      | 884/2208 [00:49<01:16, 17.27it/s][A
Epoch 10/10:  40%|████      | 887/2208 [00:49<01:12, 18.32it/s][A
Epoch 10/10:  40%|████      | 890/2208 [00:49<01:09, 18.90it/s][A
Epoch 10/10:  40%|████      | 893/2208 [00:49<01:07, 19.47it/s][A
Epoch 10/10:  41%|████      | 896/2208 [00:49<01:05, 20.09it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  41%|████      | 902/2208 [00:50<01:24, 15.42it/s][A
Epoch 10/10:  41%|████      | 905/2208 [00:50<01:17, 16.85it/s][A

Batch 900: Training loss = 0.0809, Training accuracy = 0.9634, F1 = 0.9634



Epoch 10/10:  41%|████      | 908/2208 [00:50<01:12, 17.95it/s][A
Epoch 10/10:  41%|████▏     | 911/2208 [00:50<01:09, 18.79it/s][A
Epoch 10/10:  41%|████▏     | 914/2208 [00:50<01:06, 19.47it/s][A
Epoch 10/10:  42%|████▏     | 917/2208 [00:50<01:05, 19.85it/s][A
Epoch 10/10:  42%|████▏     | 920/2208 [00:51<01:03, 20.22it/s][A
Epoch 10/10:  42%|████▏     | 923/2208 [00:51<01:02, 20.47it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  42%|████▏     | 929/2208 [00:51<01:17, 16.42it/s][A

Batch 925: Training loss = 0.0935, Training accuracy = 0.9633, F1 = 0.9633



Epoch 10/10:  42%|████▏     | 932/2208 [00:51<01:12, 17.66it/s][A
Epoch 10/10:  42%|████▏     | 935/2208 [00:51<01:08, 18.60it/s][A
Epoch 10/10:  42%|████▏     | 938/2208 [00:52<01:05, 19.28it/s][A
Epoch 10/10:  43%|████▎     | 941/2208 [00:52<01:04, 19.75it/s][A
Epoch 10/10:  43%|████▎     | 944/2208 [00:52<01:02, 20.25it/s][A
Epoch 10/10:  43%|████▎     | 947/2208 [00:52<01:01, 20.57it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  43%|████▎     | 953/2208 [00:53<01:22, 15.18it/s][A

Batch 950: Training loss = 0.0979, Training accuracy = 0.9634, F1 = 0.9634



Epoch 10/10:  43%|████▎     | 956/2208 [00:53<01:14, 16.70it/s][A
Epoch 10/10:  43%|████▎     | 959/2208 [00:53<01:10, 17.77it/s][A
Epoch 10/10:  44%|████▎     | 962/2208 [00:53<01:06, 18.66it/s][A
Epoch 10/10:  44%|████▎     | 965/2208 [00:53<01:04, 19.31it/s][A
Epoch 10/10:  44%|████▍     | 968/2208 [00:53<01:03, 19.67it/s][A
Epoch 10/10:  44%|████▍     | 971/2208 [00:53<01:01, 20.10it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  44%|████▍     | 977/2208 [00:54<01:23, 14.71it/s][A
Epoch 10/10:  44%|████▍     | 980/2208 [00:54<01:15, 16.20it/s][A

Batch 975: Training loss = 0.1134, Training accuracy = 0.9634, F1 = 0.9634



Epoch 10/10:  45%|████▍     | 983/2208 [00:54<01:10, 17.32it/s][A
Epoch 10/10:  45%|████▍     | 986/2208 [00:54<01:07, 18.12it/s][A
Epoch 10/10:  45%|████▍     | 989/2208 [00:54<01:04, 18.80it/s][A
Epoch 10/10:  45%|████▍     | 992/2208 [00:55<01:02, 19.50it/s][A
Epoch 10/10:  45%|████▌     | 995/2208 [00:55<01:00, 19.94it/s][A
Epoch 10/10:  45%|████▌     | 998/2208 [00:55<00:59, 20.30it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  45%|████▌     | 1004/2208 [00:55<01:17, 15.63it/s][A

Batch 1000: Training loss = 0.1267, Training accuracy = 0.9635, F1 = 0.9635



Epoch 10/10:  46%|████▌     | 1007/2208 [00:55<01:10, 16.95it/s][A
Epoch 10/10:  46%|████▌     | 1010/2208 [00:56<01:06, 18.10it/s][A
Epoch 10/10:  46%|████▌     | 1013/2208 [00:56<01:03, 18.97it/s][A
Epoch 10/10:  46%|████▌     | 1016/2208 [00:56<01:01, 19.47it/s][A
Epoch 10/10:  46%|████▌     | 1019/2208 [00:56<01:06, 17.77it/s][A
Epoch 10/10:  46%|████▋     | 1022/2208 [00:56<01:03, 18.55it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  47%|████▋     | 1027/2208 [00:57<01:30, 13.00it/s][A
Epoch 10/10:  47%|████▋     | 1030/2208 [00:57<01:18, 14.92it/s][A

Batch 1025: Training loss = 0.1134, Training accuracy = 0.9635, F1 = 0.9635



Epoch 10/10:  47%|████▋     | 1033/2208 [00:57<01:10, 16.56it/s][A
Epoch 10/10:  47%|████▋     | 1036/2208 [00:57<01:05, 17.78it/s][A
Epoch 10/10:  47%|████▋     | 1039/2208 [00:57<01:08, 16.97it/s][A
Epoch 10/10:  47%|████▋     | 1042/2208 [00:57<01:04, 17.95it/s][A
Epoch 10/10:  47%|████▋     | 1044/2208 [00:58<01:05, 17.67it/s][A
Epoch 10/10:  47%|████▋     | 1047/2208 [00:58<01:04, 17.98it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  48%|████▊     | 1052/2208 [00:58<01:45, 10.99it/s][A
Epoch 10/10:  48%|████▊     | 1055/2208 [00:58<01:27, 13.13it/s][A

Batch 1050: Training loss = 0.1083, Training accuracy = 0.9637, F1 = 0.9636



Epoch 10/10:  48%|████▊     | 1058/2208 [00:59<01:17, 14.93it/s][A
Epoch 10/10:  48%|████▊     | 1061/2208 [00:59<01:09, 16.43it/s][A
Epoch 10/10:  48%|████▊     | 1064/2208 [00:59<01:04, 17.69it/s][A
Epoch 10/10:  48%|████▊     | 1067/2208 [00:59<01:01, 18.63it/s][A
Epoch 10/10:  48%|████▊     | 1070/2208 [00:59<00:58, 19.46it/s][A
Epoch 10/10:  49%|████▊     | 1073/2208 [00:59<00:57, 19.85it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  49%|████▉     | 1079/2208 [01:00<01:11, 15.79it/s][A

Batch 1075: Training loss = 0.0418, Training accuracy = 0.9638, F1 = 0.9637



Epoch 10/10:  49%|████▉     | 1082/2208 [01:00<01:05, 17.21it/s][A
Epoch 10/10:  49%|████▉     | 1085/2208 [01:00<01:01, 18.24it/s][A
Epoch 10/10:  49%|████▉     | 1088/2208 [01:00<00:59, 18.95it/s][A
Epoch 10/10:  49%|████▉     | 1091/2208 [01:00<00:57, 19.40it/s][A
Epoch 10/10:  50%|████▉     | 1094/2208 [01:01<00:56, 19.77it/s][A
Epoch 10/10:  50%|████▉     | 1097/2208 [01:01<00:55, 20.01it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  50%|████▉     | 1103/2208 [01:01<01:18, 14.12it/s][A

Batch 1100: Training loss = 0.0518, Training accuracy = 0.9638, F1 = 0.9638



Epoch 10/10:  50%|█████     | 1106/2208 [01:01<01:09, 15.76it/s][A
Epoch 10/10:  50%|█████     | 1109/2208 [01:01<01:04, 17.06it/s][A
Epoch 10/10:  50%|█████     | 1112/2208 [01:02<01:00, 18.03it/s][A
Epoch 10/10:  50%|█████     | 1115/2208 [01:02<00:58, 18.83it/s][A
Epoch 10/10:  51%|█████     | 1118/2208 [01:02<00:55, 19.51it/s][A
Epoch 10/10:  51%|█████     | 1121/2208 [01:02<00:54, 19.91it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  51%|█████     | 1127/2208 [01:03<01:15, 14.25it/s][A
Epoch 10/10:  51%|█████     | 1130/2208 [01:03<01:08, 15.73it/s][A

Batch 1125: Training loss = 0.2274, Training accuracy = 0.9638, F1 = 0.9638



Epoch 10/10:  51%|█████▏    | 1133/2208 [01:03<01:02, 17.10it/s][A
Epoch 10/10:  51%|█████▏    | 1136/2208 [01:03<00:58, 18.20it/s][A
Epoch 10/10:  52%|█████▏    | 1139/2208 [01:03<00:56, 19.06it/s][A
Epoch 10/10:  52%|█████▏    | 1142/2208 [01:03<00:54, 19.58it/s][A
Epoch 10/10:  52%|█████▏    | 1145/2208 [01:03<00:53, 19.99it/s][A
Epoch 10/10:  52%|█████▏    | 1148/2208 [01:04<00:52, 20.18it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  52%|█████▏    | 1154/2208 [01:04<01:10, 15.03it/s][A

Batch 1150: Training loss = 0.1258, Training accuracy = 0.9637, F1 = 0.9637



Epoch 10/10:  52%|█████▏    | 1157/2208 [01:04<01:03, 16.54it/s][A
Epoch 10/10:  53%|█████▎    | 1160/2208 [01:04<00:59, 17.65it/s][A
Epoch 10/10:  53%|█████▎    | 1163/2208 [01:05<00:56, 18.57it/s][A
Epoch 10/10:  53%|█████▎    | 1166/2208 [01:05<00:54, 19.25it/s][A
Epoch 10/10:  53%|█████▎    | 1169/2208 [01:05<00:52, 19.66it/s][A
Epoch 10/10:  53%|█████▎    | 1172/2208 [01:05<00:51, 20.12it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  53%|█████▎    | 1178/2208 [01:06<01:22, 12.54it/s][A

Batch 1175: Training loss = 0.1186, Training accuracy = 0.9635, F1 = 0.9635



Epoch 10/10:  53%|█████▎    | 1181/2208 [01:06<01:11, 14.37it/s][A
Epoch 10/10:  54%|█████▎    | 1184/2208 [01:06<01:03, 16.01it/s][A
Epoch 10/10:  54%|█████▎    | 1186/2208 [01:06<01:01, 16.72it/s][A
Epoch 10/10:  54%|█████▍    | 1189/2208 [01:06<00:57, 17.87it/s][A
Epoch 10/10:  54%|█████▍    | 1192/2208 [01:06<00:54, 18.77it/s][A
Epoch 10/10:  54%|█████▍    | 1195/2208 [01:06<00:51, 19.55it/s][A
Epoch 10/10:  54%|█████▍    | 1198/2208 [01:06<00:50, 20.00it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  55%|█████▍    | 1204/2208 [01:07<01:08, 14.70it/s][A

Batch 1200: Training loss = 0.1728, Training accuracy = 0.9635, F1 = 0.9635



Epoch 10/10:  55%|█████▍    | 1207/2208 [01:07<01:01, 16.25it/s][A
Epoch 10/10:  55%|█████▍    | 1210/2208 [01:07<00:57, 17.42it/s][A
Epoch 10/10:  55%|█████▍    | 1213/2208 [01:07<00:54, 18.41it/s][A
Epoch 10/10:  55%|█████▌    | 1216/2208 [01:08<00:52, 19.06it/s][A
Epoch 10/10:  55%|█████▌    | 1219/2208 [01:08<00:50, 19.60it/s][A
Epoch 10/10:  55%|█████▌    | 1222/2208 [01:08<00:49, 20.06it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  56%|█████▌    | 1228/2208 [01:08<01:14, 13.21it/s][A

Batch 1225: Training loss = 0.2096, Training accuracy = 0.9635, F1 = 0.9635



Epoch 10/10:  56%|█████▌    | 1231/2208 [01:09<01:05, 14.90it/s][A
Epoch 10/10:  56%|█████▌    | 1234/2208 [01:09<01:00, 16.23it/s][A
Epoch 10/10:  56%|█████▌    | 1237/2208 [01:09<00:55, 17.37it/s][A
Epoch 10/10:  56%|█████▌    | 1240/2208 [01:09<00:52, 18.35it/s][A
Epoch 10/10:  56%|█████▋    | 1243/2208 [01:09<00:50, 19.01it/s][A
Epoch 10/10:  56%|█████▋    | 1246/2208 [01:09<00:49, 19.48it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  57%|█████▋    | 1252/2208 [01:10<01:19, 12.08it/s][A
Epoch 10/10:  57%|█████▋    | 1255/2208 [01:10<01:08, 13.93it/s][A

Batch 1250: Training loss = 0.1878, Training accuracy = 0.9634, F1 = 0.9634



Epoch 10/10:  57%|█████▋    | 1258/2208 [01:10<01:01, 15.54it/s][A
Epoch 10/10:  57%|█████▋    | 1261/2208 [01:10<00:55, 16.93it/s][A
Epoch 10/10:  57%|█████▋    | 1264/2208 [01:10<00:52, 18.00it/s][A
Epoch 10/10:  57%|█████▋    | 1267/2208 [01:11<00:50, 18.76it/s][A
Epoch 10/10:  58%|█████▊    | 1270/2208 [01:11<00:48, 19.39it/s][A
Epoch 10/10:  58%|█████▊    | 1273/2208 [01:11<00:47, 19.73it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  58%|█████▊    | 1279/2208 [01:11<01:03, 14.54it/s][A

Batch 1275: Training loss = 0.2077, Training accuracy = 0.9635, F1 = 0.9634



Epoch 10/10:  58%|█████▊    | 1282/2208 [01:12<00:57, 16.05it/s][A
Epoch 10/10:  58%|█████▊    | 1285/2208 [01:12<00:53, 17.26it/s][A
Epoch 10/10:  58%|█████▊    | 1288/2208 [01:12<00:50, 18.22it/s][A
Epoch 10/10:  58%|█████▊    | 1291/2208 [01:12<00:48, 18.93it/s][A
Epoch 10/10:  59%|█████▊    | 1294/2208 [01:12<00:50, 18.02it/s][A
Epoch 10/10:  59%|█████▊    | 1297/2208 [01:12<00:48, 18.77it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  59%|█████▉    | 1303/2208 [01:13<01:23, 10.80it/s][A

Batch 1300: Training loss = 0.1407, Training accuracy = 0.9635, F1 = 0.9635



Epoch 10/10:  59%|█████▉    | 1306/2208 [01:13<01:10, 12.72it/s][A
Epoch 10/10:  59%|█████▉    | 1309/2208 [01:13<01:02, 14.50it/s][A
Epoch 10/10:  59%|█████▉    | 1312/2208 [01:14<00:55, 16.00it/s][A
Epoch 10/10:  60%|█████▉    | 1315/2208 [01:14<00:52, 17.16it/s][A
Epoch 10/10:  60%|█████▉    | 1318/2208 [01:14<00:48, 18.24it/s][A
Epoch 10/10:  60%|█████▉    | 1321/2208 [01:14<00:46, 19.06it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  60%|██████    | 1327/2208 [01:15<01:07, 13.07it/s][A
Epoch 10/10:  60%|██████    | 1330/2208 [01:15<00:59, 14.84it/s][A

Batch 1325: Training loss = 0.0786, Training accuracy = 0.9634, F1 = 0.9634



Epoch 10/10:  60%|██████    | 1333/2208 [01:15<00:53, 16.23it/s][A
Epoch 10/10:  61%|██████    | 1336/2208 [01:15<00:49, 17.44it/s][A
Epoch 10/10:  61%|██████    | 1339/2208 [01:15<00:47, 18.36it/s][A
Epoch 10/10:  61%|██████    | 1342/2208 [01:15<00:45, 19.17it/s][A
Epoch 10/10:  61%|██████    | 1345/2208 [01:15<00:43, 19.76it/s][A
Epoch 10/10:  61%|██████    | 1348/2208 [01:15<00:43, 19.96it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  61%|██████▏   | 1354/2208 [01:16<00:57, 14.79it/s][A

Batch 1350: Training loss = 0.1156, Training accuracy = 0.9634, F1 = 0.9634



Epoch 10/10:  61%|██████▏   | 1357/2208 [01:16<00:52, 16.31it/s][A
Epoch 10/10:  62%|██████▏   | 1360/2208 [01:16<00:48, 17.51it/s][A
Epoch 10/10:  62%|██████▏   | 1363/2208 [01:16<00:45, 18.44it/s][A
Epoch 10/10:  62%|██████▏   | 1366/2208 [01:17<00:43, 19.19it/s][A
Epoch 10/10:  62%|██████▏   | 1369/2208 [01:17<00:42, 19.85it/s][A
Epoch 10/10:  62%|██████▏   | 1372/2208 [01:17<00:41, 20.09it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  62%|██████▏   | 1378/2208 [01:17<01:05, 12.72it/s][A

Batch 1375: Training loss = 0.1575, Training accuracy = 0.9633, F1 = 0.9633



Epoch 10/10:  63%|██████▎   | 1381/2208 [01:18<00:56, 14.52it/s][A
Epoch 10/10:  63%|██████▎   | 1384/2208 [01:18<00:51, 16.09it/s][A
Epoch 10/10:  63%|██████▎   | 1387/2208 [01:18<00:47, 17.31it/s][A
Epoch 10/10:  63%|██████▎   | 1390/2208 [01:18<00:44, 18.25it/s][A
Epoch 10/10:  63%|██████▎   | 1393/2208 [01:18<00:42, 19.03it/s][A
Epoch 10/10:  63%|██████▎   | 1396/2208 [01:18<00:41, 19.63it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  63%|██████▎   | 1402/2208 [01:19<01:02, 12.90it/s][A
Epoch 10/10:  64%|██████▎   | 1405/2208 [01:19<00:54, 14.70it/s][A

Batch 1400: Training loss = 0.0778, Training accuracy = 0.9633, F1 = 0.9633



Epoch 10/10:  64%|██████▍   | 1408/2208 [01:19<00:49, 16.27it/s][A
Epoch 10/10:  64%|██████▍   | 1411/2208 [01:19<00:45, 17.46it/s][A
Epoch 10/10:  64%|██████▍   | 1414/2208 [01:19<00:42, 18.49it/s][A
Epoch 10/10:  64%|██████▍   | 1417/2208 [01:20<00:41, 19.23it/s][A
Epoch 10/10:  64%|██████▍   | 1420/2208 [01:20<00:39, 19.74it/s][A
Epoch 10/10:  64%|██████▍   | 1423/2208 [01:20<00:39, 20.06it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  65%|██████▍   | 1429/2208 [01:21<00:55, 13.99it/s][A

Batch 1425: Training loss = 0.0926, Training accuracy = 0.9634, F1 = 0.9634



Epoch 10/10:  65%|██████▍   | 1432/2208 [01:21<00:49, 15.66it/s][A
Epoch 10/10:  65%|██████▍   | 1435/2208 [01:21<00:45, 16.99it/s][A
Epoch 10/10:  65%|██████▌   | 1438/2208 [01:21<00:42, 18.03it/s][A
Epoch 10/10:  65%|██████▌   | 1441/2208 [01:21<00:40, 18.93it/s][A
Epoch 10/10:  65%|██████▌   | 1444/2208 [01:21<00:39, 19.48it/s][A
Epoch 10/10:  66%|██████▌   | 1447/2208 [01:21<00:38, 19.94it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  66%|██████▌   | 1453/2208 [01:22<00:59, 12.62it/s][A

Batch 1450: Training loss = 0.1314, Training accuracy = 0.9634, F1 = 0.9634



Epoch 10/10:  66%|██████▌   | 1456/2208 [01:22<00:52, 14.43it/s][A
Epoch 10/10:  66%|██████▌   | 1459/2208 [01:22<00:46, 16.00it/s][A
Epoch 10/10:  66%|██████▌   | 1462/2208 [01:22<00:43, 17.22it/s][A
Epoch 10/10:  66%|██████▋   | 1465/2208 [01:23<00:40, 18.19it/s][A
Epoch 10/10:  66%|██████▋   | 1468/2208 [01:23<00:39, 18.90it/s][A
Epoch 10/10:  67%|██████▋   | 1471/2208 [01:23<00:37, 19.59it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  67%|██████▋   | 1477/2208 [01:23<01:00, 11.99it/s][A
Epoch 10/10:  67%|██████▋   | 1480/2208 [01:24<00:52, 13.86it/s][A

Batch 1475: Training loss = 0.1136, Training accuracy = 0.9635, F1 = 0.9635



Epoch 10/10:  67%|██████▋   | 1483/2208 [01:24<00:47, 15.41it/s][A
Epoch 10/10:  67%|██████▋   | 1486/2208 [01:24<00:43, 16.73it/s][A
Epoch 10/10:  67%|██████▋   | 1489/2208 [01:24<00:40, 17.79it/s][A
Epoch 10/10:  68%|██████▊   | 1492/2208 [01:24<00:39, 18.36it/s][A
Epoch 10/10:  68%|██████▊   | 1495/2208 [01:24<00:37, 19.03it/s][A
Epoch 10/10:  68%|██████▊   | 1498/2208 [01:25<00:44, 16.00it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  68%|██████▊   | 1504/2208 [01:25<00:54, 12.96it/s][A

Batch 1500: Training loss = 0.1293, Training accuracy = 0.9635, F1 = 0.9635



Epoch 10/10:  68%|██████▊   | 1507/2208 [01:25<00:47, 14.70it/s][A
Epoch 10/10:  68%|██████▊   | 1510/2208 [01:25<00:43, 16.16it/s][A
Epoch 10/10:  69%|██████▊   | 1513/2208 [01:26<00:40, 17.35it/s][A
Epoch 10/10:  69%|██████▊   | 1516/2208 [01:26<00:38, 18.19it/s][A
Epoch 10/10:  69%|██████▉   | 1518/2208 [01:26<00:37, 18.44it/s][A
Epoch 10/10:  69%|██████▉   | 1520/2208 [01:26<00:38, 17.80it/s][A
Epoch 10/10:  69%|██████▉   | 1523/2208 [01:26<00:36, 18.71it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  69%|██████▉   | 1527/2208 [01:27<01:12,  9.42it/s][A
Epoch 10/10:  69%|██████▉   | 1530/2208 [01:27<00:57, 11.78it/s][A

Batch 1525: Training loss = 0.1623, Training accuracy = 0.9635, F1 = 0.9635



Epoch 10/10:  69%|██████▉   | 1532/2208 [01:27<00:51, 13.14it/s][A
Epoch 10/10:  70%|██████▉   | 1535/2208 [01:27<00:44, 15.13it/s][A
Epoch 10/10:  70%|██████▉   | 1538/2208 [01:27<00:39, 16.79it/s][A
Epoch 10/10:  70%|██████▉   | 1541/2208 [01:27<00:37, 18.00it/s][A
Epoch 10/10:  70%|██████▉   | 1544/2208 [01:28<00:34, 18.97it/s][A
Epoch 10/10:  70%|███████   | 1547/2208 [01:28<00:34, 19.15it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  70%|███████   | 1553/2208 [01:28<00:55, 11.86it/s][A

Batch 1550: Training loss = 0.1333, Training accuracy = 0.9636, F1 = 0.9636



Epoch 10/10:  70%|███████   | 1556/2208 [01:28<00:47, 13.75it/s][A
Epoch 10/10:  71%|███████   | 1559/2208 [01:29<00:42, 15.42it/s][A
Epoch 10/10:  71%|███████   | 1562/2208 [01:29<00:38, 16.67it/s][A
Epoch 10/10:  71%|███████   | 1565/2208 [01:29<00:36, 17.77it/s][A
Epoch 10/10:  71%|███████   | 1568/2208 [01:29<00:34, 18.62it/s][A
Epoch 10/10:  71%|███████   | 1571/2208 [01:29<00:32, 19.33it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  71%|███████▏  | 1577/2208 [01:30<00:53, 11.78it/s][A
Epoch 10/10:  72%|███████▏  | 1580/2208 [01:30<00:45, 13.65it/s][A

Batch 1575: Training loss = 0.1479, Training accuracy = 0.9636, F1 = 0.9636



Epoch 10/10:  72%|███████▏  | 1583/2208 [01:30<00:40, 15.32it/s][A
Epoch 10/10:  72%|███████▏  | 1586/2208 [01:30<00:37, 16.77it/s][A
Epoch 10/10:  72%|███████▏  | 1589/2208 [01:30<00:34, 17.94it/s][A
Epoch 10/10:  72%|███████▏  | 1592/2208 [01:30<00:32, 18.77it/s][A
Epoch 10/10:  72%|███████▏  | 1595/2208 [01:31<00:31, 19.54it/s][A
Epoch 10/10:  72%|███████▏  | 1598/2208 [01:31<00:30, 20.09it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  73%|███████▎  | 1604/2208 [01:31<00:43, 13.99it/s][A

Batch 1600: Training loss = 0.1218, Training accuracy = 0.9636, F1 = 0.9636



Epoch 10/10:  73%|███████▎  | 1607/2208 [01:32<00:38, 15.61it/s][A
Epoch 10/10:  73%|███████▎  | 1610/2208 [01:32<00:35, 16.91it/s][A
Epoch 10/10:  73%|███████▎  | 1613/2208 [01:32<00:32, 18.13it/s][A
Epoch 10/10:  73%|███████▎  | 1616/2208 [01:32<00:31, 18.82it/s][A
Epoch 10/10:  73%|███████▎  | 1619/2208 [01:32<00:30, 19.45it/s][A
Epoch 10/10:  73%|███████▎  | 1622/2208 [01:32<00:29, 19.98it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  74%|███████▎  | 1628/2208 [01:33<00:47, 12.25it/s][A

Batch 1625: Training loss = 0.1212, Training accuracy = 0.9636, F1 = 0.9635



Epoch 10/10:  74%|███████▍  | 1631/2208 [01:33<00:40, 14.09it/s][A
Epoch 10/10:  74%|███████▍  | 1634/2208 [01:33<00:36, 15.64it/s][A
Epoch 10/10:  74%|███████▍  | 1637/2208 [01:33<00:33, 16.96it/s][A
Epoch 10/10:  74%|███████▍  | 1640/2208 [01:33<00:31, 17.98it/s][A
Epoch 10/10:  74%|███████▍  | 1643/2208 [01:34<00:29, 18.86it/s][A
Epoch 10/10:  75%|███████▍  | 1646/2208 [01:34<00:28, 19.60it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  75%|███████▍  | 1652/2208 [01:34<00:47, 11.82it/s][A
Epoch 10/10:  75%|███████▍  | 1655/2208 [01:34<00:40, 13.70it/s][A

Batch 1650: Training loss = 0.1150, Training accuracy = 0.9635, F1 = 0.9635



Epoch 10/10:  75%|███████▌  | 1658/2208 [01:35<00:35, 15.36it/s][A
Epoch 10/10:  75%|███████▌  | 1661/2208 [01:35<00:32, 16.72it/s][A
Epoch 10/10:  75%|███████▌  | 1664/2208 [01:35<00:30, 17.90it/s][A
Epoch 10/10:  75%|███████▌  | 1667/2208 [01:35<00:28, 18.69it/s][A
Epoch 10/10:  76%|███████▌  | 1670/2208 [01:35<00:27, 19.44it/s][A
Epoch 10/10:  76%|███████▌  | 1673/2208 [01:35<00:26, 19.97it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  76%|███████▌  | 1679/2208 [01:36<00:38, 13.87it/s][A

Batch 1675: Training loss = 0.1172, Training accuracy = 0.9636, F1 = 0.9636



Epoch 10/10:  76%|███████▌  | 1682/2208 [01:36<00:33, 15.55it/s][A
Epoch 10/10:  76%|███████▋  | 1685/2208 [01:36<00:31, 16.82it/s][A
Epoch 10/10:  76%|███████▋  | 1688/2208 [01:36<00:28, 17.95it/s][A
Epoch 10/10:  77%|███████▋  | 1691/2208 [01:36<00:27, 18.85it/s][A
Epoch 10/10:  77%|███████▋  | 1694/2208 [01:37<00:26, 19.54it/s][A
Epoch 10/10:  77%|███████▋  | 1697/2208 [01:37<00:25, 20.07it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  77%|███████▋  | 1703/2208 [01:37<00:43, 11.56it/s][A

Batch 1700: Training loss = 0.1183, Training accuracy = 0.9636, F1 = 0.9636



Epoch 10/10:  77%|███████▋  | 1706/2208 [01:38<00:37, 13.43it/s][A
Epoch 10/10:  77%|███████▋  | 1709/2208 [01:38<00:33, 15.09it/s][A
Epoch 10/10:  78%|███████▊  | 1712/2208 [01:38<00:30, 16.52it/s][A
Epoch 10/10:  78%|███████▊  | 1715/2208 [01:38<00:29, 16.71it/s][A
Epoch 10/10:  78%|███████▊  | 1717/2208 [01:38<00:28, 17.32it/s][A
Epoch 10/10:  78%|███████▊  | 1720/2208 [01:38<00:26, 18.45it/s][A
Epoch 10/10:  78%|███████▊  | 1723/2208 [01:38<00:29, 16.65it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  78%|███████▊  | 1729/2208 [01:39<00:37, 12.71it/s][A

Batch 1725: Training loss = 0.0380, Training accuracy = 0.9638, F1 = 0.9638



Epoch 10/10:  78%|███████▊  | 1732/2208 [01:39<00:32, 14.49it/s][A
Epoch 10/10:  79%|███████▊  | 1735/2208 [01:39<00:29, 16.00it/s][A
Epoch 10/10:  79%|███████▊  | 1738/2208 [01:40<00:27, 17.20it/s][A
Epoch 10/10:  79%|███████▉  | 1741/2208 [01:40<00:25, 18.24it/s][A
Epoch 10/10:  79%|███████▉  | 1743/2208 [01:40<00:26, 17.42it/s][A
Epoch 10/10:  79%|███████▉  | 1746/2208 [01:40<00:24, 18.51it/s][A
Epoch 10/10:  79%|███████▉  | 1749/2208 [01:40<00:23, 19.18it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  79%|███████▉  | 1754/2208 [01:41<00:39, 11.56it/s][A

Batch 1750: Training loss = 0.1630, Training accuracy = 0.9638, F1 = 0.9638



Epoch 10/10:  80%|███████▉  | 1757/2208 [01:41<00:33, 13.57it/s][A
Epoch 10/10:  80%|███████▉  | 1760/2208 [01:41<00:29, 15.30it/s][A
Epoch 10/10:  80%|███████▉  | 1762/2208 [01:41<00:27, 16.10it/s][A
Epoch 10/10:  80%|███████▉  | 1764/2208 [01:41<00:26, 16.88it/s][A
Epoch 10/10:  80%|███████▉  | 1766/2208 [01:41<00:25, 17.57it/s][A
Epoch 10/10:  80%|████████  | 1768/2208 [01:42<00:24, 18.15it/s][A
Epoch 10/10:  80%|████████  | 1771/2208 [01:42<00:24, 17.99it/s][A
Epoch 10/10:  80%|████████  | 1774/2208 [01:42<00:22, 19.16it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  81%|████████  | 1779/2208 [01:42<00:36, 11.88it/s][A

Batch 1775: Training loss = 0.0851, Training accuracy = 0.9638, F1 = 0.9638



Epoch 10/10:  81%|████████  | 1782/2208 [01:43<00:30, 13.95it/s][A
Epoch 10/10:  81%|████████  | 1785/2208 [01:43<00:27, 15.63it/s][A
Epoch 10/10:  81%|████████  | 1788/2208 [01:43<00:24, 17.04it/s][A
Epoch 10/10:  81%|████████  | 1791/2208 [01:43<00:22, 18.17it/s][A
Epoch 10/10:  81%|████████▏ | 1794/2208 [01:43<00:21, 19.06it/s][A
Epoch 10/10:  81%|████████▏ | 1797/2208 [01:43<00:20, 19.68it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  82%|████████▏ | 1803/2208 [01:44<00:35, 11.30it/s][A

Batch 1800: Training loss = 0.1231, Training accuracy = 0.9639, F1 = 0.9639



Epoch 10/10:  82%|████████▏ | 1806/2208 [01:44<00:30, 13.22it/s][A
Epoch 10/10:  82%|████████▏ | 1809/2208 [01:44<00:26, 14.94it/s][A
Epoch 10/10:  82%|████████▏ | 1812/2208 [01:44<00:24, 16.39it/s][A
Epoch 10/10:  82%|████████▏ | 1815/2208 [01:45<00:22, 17.65it/s][A
Epoch 10/10:  82%|████████▏ | 1818/2208 [01:45<00:20, 18.58it/s][A
Epoch 10/10:  82%|████████▏ | 1821/2208 [01:45<00:20, 19.27it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  83%|████████▎ | 1827/2208 [01:46<00:33, 11.37it/s][A
Epoch 10/10:  83%|████████▎ | 1830/2208 [01:46<00:28, 13.27it/s][A

Batch 1825: Training loss = 0.1206, Training accuracy = 0.9638, F1 = 0.9638



Epoch 10/10:  83%|████████▎ | 1833/2208 [01:46<00:25, 14.94it/s][A
Epoch 10/10:  83%|████████▎ | 1836/2208 [01:46<00:22, 16.36it/s][A
Epoch 10/10:  83%|████████▎ | 1839/2208 [01:46<00:20, 17.67it/s][A
Epoch 10/10:  83%|████████▎ | 1842/2208 [01:46<00:19, 18.66it/s][A
Epoch 10/10:  84%|████████▎ | 1845/2208 [01:46<00:18, 19.29it/s][A
Epoch 10/10:  84%|████████▎ | 1848/2208 [01:47<00:18, 19.93it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  84%|████████▍ | 1854/2208 [01:47<00:26, 13.53it/s][A

Batch 1850: Training loss = 0.1544, Training accuracy = 0.9638, F1 = 0.9638



Epoch 10/10:  84%|████████▍ | 1857/2208 [01:47<00:23, 15.22it/s][A
Epoch 10/10:  84%|████████▍ | 1860/2208 [01:47<00:20, 16.60it/s][A
Epoch 10/10:  84%|████████▍ | 1863/2208 [01:48<00:19, 17.71it/s][A
Epoch 10/10:  85%|████████▍ | 1866/2208 [01:48<00:18, 18.56it/s][A
Epoch 10/10:  85%|████████▍ | 1869/2208 [01:48<00:17, 19.30it/s][A
Epoch 10/10:  85%|████████▍ | 1872/2208 [01:48<00:16, 19.80it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  85%|████████▌ | 1878/2208 [01:49<00:29, 11.23it/s][A

Batch 1875: Training loss = 0.0876, Training accuracy = 0.9638, F1 = 0.9638



Epoch 10/10:  85%|████████▌ | 1881/2208 [01:49<00:24, 13.08it/s][A
Epoch 10/10:  85%|████████▌ | 1884/2208 [01:49<00:21, 14.75it/s][A
Epoch 10/10:  85%|████████▌ | 1887/2208 [01:49<00:19, 16.20it/s][A
Epoch 10/10:  86%|████████▌ | 1890/2208 [01:49<00:18, 17.49it/s][A
Epoch 10/10:  86%|████████▌ | 1893/2208 [01:49<00:17, 18.36it/s][A
Epoch 10/10:  86%|████████▌ | 1896/2208 [01:50<00:16, 19.04it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  86%|████████▌ | 1902/2208 [01:50<00:26, 11.41it/s][A
Epoch 10/10:  86%|████████▋ | 1905/2208 [01:50<00:22, 13.32it/s][A

Batch 1900: Training loss = 0.0713, Training accuracy = 0.9638, F1 = 0.9638



Epoch 10/10:  86%|████████▋ | 1908/2208 [01:50<00:19, 15.01it/s][A
Epoch 10/10:  87%|████████▋ | 1911/2208 [01:51<00:17, 16.52it/s][A
Epoch 10/10:  87%|████████▋ | 1914/2208 [01:51<00:16, 17.64it/s][A
Epoch 10/10:  87%|████████▋ | 1917/2208 [01:51<00:15, 18.53it/s][A
Epoch 10/10:  87%|████████▋ | 1920/2208 [01:51<00:14, 19.30it/s][A
Epoch 10/10:  87%|████████▋ | 1923/2208 [01:51<00:14, 19.92it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  87%|████████▋ | 1929/2208 [01:52<00:21, 13.20it/s][A

Batch 1925: Training loss = 0.1091, Training accuracy = 0.9639, F1 = 0.9639



Epoch 10/10:  88%|████████▊ | 1932/2208 [01:52<00:18, 14.88it/s][A
Epoch 10/10:  88%|████████▊ | 1935/2208 [01:52<00:16, 16.34it/s][A
Epoch 10/10:  88%|████████▊ | 1938/2208 [01:52<00:15, 17.41it/s][A
Epoch 10/10:  88%|████████▊ | 1941/2208 [01:52<00:14, 18.40it/s][A
Epoch 10/10:  88%|████████▊ | 1944/2208 [01:53<00:13, 19.03it/s][A
Epoch 10/10:  88%|████████▊ | 1947/2208 [01:53<00:13, 19.65it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  88%|████████▊ | 1953/2208 [01:53<00:24, 10.52it/s][A

Batch 1950: Training loss = 0.0552, Training accuracy = 0.9640, F1 = 0.9640



Epoch 10/10:  89%|████████▊ | 1956/2208 [01:54<00:20, 12.39it/s][A
Epoch 10/10:  89%|████████▊ | 1959/2208 [01:54<00:17, 14.15it/s][A
Epoch 10/10:  89%|████████▉ | 1961/2208 [01:54<00:16, 15.07it/s][A
Epoch 10/10:  89%|████████▉ | 1963/2208 [01:54<00:15, 16.01it/s][A
Epoch 10/10:  89%|████████▉ | 1966/2208 [01:54<00:13, 17.40it/s][A
Epoch 10/10:  89%|████████▉ | 1969/2208 [01:54<00:12, 18.46it/s][A
Epoch 10/10:  89%|████████▉ | 1972/2208 [01:54<00:13, 17.63it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  90%|████████▉ | 1977/2208 [01:55<00:24,  9.42it/s][A
Epoch 10/10:  90%|████████▉ | 1980/2208 [01:55<00:19, 11.59it/s][A

Batch 1975: Training loss = 0.1262, Training accuracy = 0.9640, F1 = 0.9640



Epoch 10/10:  90%|████████▉ | 1983/2208 [01:55<00:16, 13.54it/s][A
Epoch 10/10:  90%|████████▉ | 1986/2208 [01:56<00:14, 15.25it/s][A
Epoch 10/10:  90%|█████████ | 1989/2208 [01:56<00:13, 16.64it/s][A
Epoch 10/10:  90%|█████████ | 1992/2208 [01:56<00:12, 17.14it/s][A
Epoch 10/10:  90%|█████████ | 1995/2208 [01:56<00:11, 18.18it/s][A
Epoch 10/10:  90%|█████████ | 1998/2208 [01:56<00:11, 18.89it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  91%|█████████ | 2002/2208 [01:57<00:21,  9.48it/s][A
Epoch 10/10:  91%|█████████ | 2005/2208 [01:57<00:17, 11.76it/s][A

Batch 2000: Training loss = 0.0902, Training accuracy = 0.9640, F1 = 0.9640



Epoch 10/10:  91%|█████████ | 2008/2208 [01:57<00:14, 13.78it/s][A
Epoch 10/10:  91%|█████████ | 2011/2208 [01:57<00:12, 15.61it/s][A
Epoch 10/10:  91%|█████████ | 2014/2208 [01:57<00:11, 17.00it/s][A
Epoch 10/10:  91%|█████████▏| 2017/2208 [01:58<00:10, 18.11it/s][A
Epoch 10/10:  91%|█████████▏| 2020/2208 [01:58<00:09, 19.02it/s][A
Epoch 10/10:  92%|█████████▏| 2023/2208 [01:58<00:09, 19.61it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  92%|█████████▏| 2029/2208 [01:58<00:13, 12.89it/s][A

Batch 2025: Training loss = 0.0417, Training accuracy = 0.9641, F1 = 0.9641



Epoch 10/10:  92%|█████████▏| 2032/2208 [01:59<00:12, 14.62it/s][A
Epoch 10/10:  92%|█████████▏| 2035/2208 [01:59<00:10, 16.12it/s][A
Epoch 10/10:  92%|█████████▏| 2038/2208 [01:59<00:09, 17.43it/s][A
Epoch 10/10:  92%|█████████▏| 2041/2208 [01:59<00:09, 18.39it/s][A
Epoch 10/10:  93%|█████████▎| 2044/2208 [01:59<00:08, 19.15it/s][A
Epoch 10/10:  93%|█████████▎| 2047/2208 [01:59<00:08, 19.76it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  93%|█████████▎| 2053/2208 [02:00<00:14, 10.55it/s][A

Batch 2050: Training loss = 0.1322, Training accuracy = 0.9641, F1 = 0.9641



Epoch 10/10:  93%|█████████▎| 2056/2208 [02:00<00:12, 12.43it/s][A
Epoch 10/10:  93%|█████████▎| 2059/2208 [02:00<00:10, 14.24it/s][A
Epoch 10/10:  93%|█████████▎| 2062/2208 [02:01<00:09, 15.79it/s][A
Epoch 10/10:  93%|█████████▎| 2064/2208 [02:01<00:08, 16.50it/s][A
Epoch 10/10:  94%|█████████▎| 2067/2208 [02:01<00:07, 17.70it/s][A
Epoch 10/10:  94%|█████████▍| 2070/2208 [02:01<00:07, 18.60it/s][A
Epoch 10/10:  94%|█████████▍| 2073/2208 [02:01<00:06, 19.42it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  94%|█████████▍| 2079/2208 [02:02<00:10, 12.00it/s][A

Batch 2075: Training loss = 0.0693, Training accuracy = 0.9642, F1 = 0.9642



Epoch 10/10:  94%|█████████▍| 2082/2208 [02:02<00:09, 13.87it/s][A
Epoch 10/10:  94%|█████████▍| 2085/2208 [02:02<00:07, 15.49it/s][A
Epoch 10/10:  95%|█████████▍| 2088/2208 [02:02<00:07, 16.82it/s][A
Epoch 10/10:  95%|█████████▍| 2091/2208 [02:02<00:06, 17.83it/s][A
Epoch 10/10:  95%|█████████▍| 2094/2208 [02:03<00:06, 18.75it/s][A
Epoch 10/10:  95%|█████████▍| 2097/2208 [02:03<00:05, 18.61it/s][A
Epoch 10/10:  95%|█████████▌| 2099/2208 [02:03<00:05, 18.85it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  95%|█████████▌| 2104/2208 [02:03<00:08, 11.56it/s][A

Batch 2100: Training loss = 0.1536, Training accuracy = 0.9642, F1 = 0.9642



Epoch 10/10:  95%|█████████▌| 2107/2208 [02:04<00:07, 13.66it/s][A
Epoch 10/10:  96%|█████████▌| 2109/2208 [02:04<00:06, 14.75it/s][A
Epoch 10/10:  96%|█████████▌| 2112/2208 [02:04<00:05, 16.35it/s][A
Epoch 10/10:  96%|█████████▌| 2115/2208 [02:04<00:05, 17.67it/s][A
Epoch 10/10:  96%|█████████▌| 2118/2208 [02:04<00:04, 18.56it/s][A
Epoch 10/10:  96%|█████████▌| 2121/2208 [02:04<00:04, 19.30it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  96%|█████████▋| 2127/2208 [02:05<00:07, 10.62it/s][A
Epoch 10/10:  96%|█████████▋| 2130/2208 [02:05<00:06, 12.58it/s][A

Batch 2125: Training loss = 0.1831, Training accuracy = 0.9642, F1 = 0.9642



Epoch 10/10:  97%|█████████▋| 2133/2208 [02:05<00:05, 14.35it/s][A
Epoch 10/10:  97%|█████████▋| 2136/2208 [02:05<00:04, 15.94it/s][A
Epoch 10/10:  97%|█████████▋| 2139/2208 [02:06<00:04, 17.24it/s][A
Epoch 10/10:  97%|█████████▋| 2142/2208 [02:06<00:03, 18.33it/s][A
Epoch 10/10:  97%|█████████▋| 2145/2208 [02:06<00:03, 19.12it/s][A
Epoch 10/10:  97%|█████████▋| 2148/2208 [02:06<00:03, 19.63it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  98%|█████████▊| 2154/2208 [02:07<00:04, 11.60it/s][A

Batch 2150: Training loss = 0.0584, Training accuracy = 0.9643, F1 = 0.9642



Epoch 10/10:  98%|█████████▊| 2157/2208 [02:07<00:03, 13.35it/s][A
Epoch 10/10:  98%|█████████▊| 2159/2208 [02:07<00:03, 14.41it/s][A
Epoch 10/10:  98%|█████████▊| 2162/2208 [02:07<00:02, 15.99it/s][A
Epoch 10/10:  98%|█████████▊| 2165/2208 [02:07<00:02, 17.35it/s][A
Epoch 10/10:  98%|█████████▊| 2168/2208 [02:08<00:02, 16.39it/s][A
Epoch 10/10:  98%|█████████▊| 2171/2208 [02:08<00:02, 17.57it/s][A
Epoch 10/10:  98%|█████████▊| 2174/2208 [02:08<00:01, 18.49it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10:  99%|█████████▊| 2179/2208 [02:09<00:02, 10.39it/s][A

Batch 2175: Training loss = 0.1555, Training accuracy = 0.9643, F1 = 0.9642



Epoch 10/10:  99%|█████████▉| 2182/2208 [02:09<00:02, 12.41it/s][A
Epoch 10/10:  99%|█████████▉| 2185/2208 [02:09<00:01, 14.28it/s][A
Epoch 10/10:  99%|█████████▉| 2188/2208 [02:09<00:01, 15.83it/s][A
Epoch 10/10:  99%|█████████▉| 2191/2208 [02:09<00:00, 17.07it/s][A
Epoch 10/10:  99%|█████████▉| 2194/2208 [02:09<00:00, 18.07it/s][A
Epoch 10/10: 100%|█████████▉| 2197/2208 [02:10<00:00, 18.63it/s][A
  with torch.cuda.amp.autocast():

Epoch 10/10: 100%|█████████▉| 2202/2208 [02:10<00:00,  8.97it/s][A
Epoch 10/10: 100%|█████████▉| 2205/2208 [02:10<00:00, 11.10it/s][A

Batch 2200: Training loss = 0.1586, Training accuracy = 0.9643, F1 = 0.9643



Epoch 10/10: 100%|██████████| 2208/2208 [02:11<00:00, 13.15it/s][A
                                                                [A


Epoch 10 Training Metrics:
Loss: 0.1088
Accuracy: 0.9643
F1 Score: 0.9643
Precision: 0.9643
Recall: 0.9643

Starting validation...



Validation:   0%|          | 0/552 [00:00<?, ?it/s][A
Validation:   0%|          | 1/552 [00:01<15:01,  1.64s/it][A
Validation:   1%|          | 3/552 [00:01<04:16,  2.14it/s][A
Validation:   1%|          | 5/552 [00:01<02:19,  3.92it/s][A
Validation:   1%|▏         | 7/552 [00:01<01:32,  5.86it/s][A
Validation:   2%|▏         | 9/552 [00:02<01:08,  7.89it/s][A
Validation:   2%|▏         | 11/552 [00:02<00:54,  9.91it/s][A
Validation:   2%|▏         | 13/552 [00:02<00:46, 11.69it/s][A
Validation:   3%|▎         | 15/552 [00:02<00:40, 13.33it/s][A
Validation:   3%|▎         | 17/552 [00:02<00:36, 14.67it/s][A
Validation:   3%|▎         | 19/552 [00:02<00:33, 15.74it/s][A
Validation:   4%|▍         | 21/552 [00:02<00:31, 16.60it/s][A
Validation:   4%|▍         | 23/552 [00:02<00:30, 17.19it/s][A
Validation:   5%|▍         | 25/552 [00:02<00:29, 17.63it/s][A
Validation:   5%|▍         | 27/552 [00:03<00:29, 18.08it/s][A
Validation:   5%|▌         | 29/552 [00:03<00:28, 18.


Epoch 10 Validation Metrics:
Loss: 0.1286
Accuracy: 0.9610
F1 Score: 0.9609
Precision: 0.9621
Recall: 0.9610


Training epochs: 100%|██████████| 10/10 [27:00<00:00, 162.08s/it]


Saving the model...
Model saved to /content/drive/MyDrive/TKPR221/models/ResNet_Synthetic20241228_141207.pth


  checkpoint = torch.load(model_save_path)


Saved the model to /content/drive/MyDrive/TKPR221/models/ResNet_Synthetic20241228_141207.pth

Starting final testing...





Final Test Metrics:
Loss: 0.1302
Accuracy: 0.9607
F1 Score: 0.9606
Precision: 0.9620
Recall: 0.9607
[neptune] [info   ] Shutting down background jobs, please wait a moment...
[neptune] [info   ] Done!
[neptune] [info   ] Waiting for the remaining 5 operations to synchronize with Neptune. Do not kill this process.
[neptune] [info   ] All 5 operations synced, thanks for waiting!
[neptune] [info   ] Explore the metadata in the Neptune app: https://app.neptune.ai/muguryalcin/TKPR221/e/TKPR-193/metadata


In [None]:
# Per-class evaluation of the most recent test predictions:
# one F1 value per class, followed by sklearn's full text report.
from sklearn.metrics import classification_report

# average=None returns one F1 score per class instead of a single aggregate
class_f1 = f1_score(test_labels, test_preds, average=None)
# Text table with per-class precision / recall / F1 / support
class_report = classification_report(test_labels, test_preds)

print("\nF1 Scores by Class:")
for line in (f"Class {class_idx}: {f1:.4f}" for class_idx, f1 in enumerate(class_f1)):
    print(line)

print("\nDetailed Classification Report:")
print(class_report)



F1 Scores by Class:
Class 0: 0.9217
Class 1: 0.7880
Class 2: 0.7165
Class 3: 0.7206
Class 4: 0.7280
Class 5: 0.8721
Class 6: 0.7201
Class 7: 0.6655
Class 8: 0.8692
Class 9: 0.9622
Class 10: 0.5463
Class 11: 0.7204
Class 12: 0.8230
Class 13: 0.7396
Class 14: 0.7545
Class 15: 0.9854
Class 16: 0.8436
Class 17: 0.8282
Class 18: 0.7140
Class 19: 0.9079
Class 20: 0.8787
Class 21: 0.9041
Class 22: 0.8421
Class 23: 0.6740
Class 24: 0.7706
Class 25: 0.6443
Class 26: 0.5146
Class 27: 0.7025
Class 28: 0.7763
Class 29: 0.7735
Class 30: 0.9076
Class 31: 0.8539
Class 32: 0.7120
Class 33: 0.7628
Class 34: 0.8956
Class 35: 0.8274
Class 36: 0.9734
Class 37: 0.9854
Class 38: 0.9073
Class 39: 0.9133
Class 40: 0.9535
Class 41: 0.9264
Class 42: 0.9045
Class 43: 0.9754
Class 44: 0.9667
Class 45: 0.9042
Class 46: 0.8787
Class 47: 0.9938
Class 48: 0.9664
Class 49: 0.7562
Class 50: 0.9140
Class 51: 0.9732
Class 52: 0.9658
Class 53: 0.9959
Class 54: 0.9896
Class 55: 0.9053
Class 56: 0.9412
Class 57: 0.9388
Cla

## Using CNN Model with SGD Classifier

IF YOU WANT TO TRAIN JUST CNN, DON'T USE THIS PART

This part uses an already-trained CNN to extract features and feeds them into the SGD model. You can use the CNN that you trained in the first part (if so, don't change the model path), or you can use a previously trained model (change the model path to the path of that model on Google Drive).

In [None]:
# Load the CNN model
# return_convolution=True presumably makes the CNN return its convolutional
# features instead of class scores -- TODO confirm against the CNN class definition.
convolution_model = CNN(n_classes,return_convolution=True)
model_path = f'/content/drive/MyDrive/TKPR221/models/{run_name}.pth' # CHANGE THE MODEL NAME ACCORDINGLY FROM DRIVE (EACH MODEL HAS UNIQUE NAME)

# map_location="cpu" lets a checkpoint saved from a GPU load on any runtime;
# load_state_dict then copies the weights into the model wherever it lives.
# NOTE(review): torch.load emits a FutureWarning about `weights_only`; passing
# weights_only=True would silence it but only works if the checkpoint holds
# nothing except tensors/primitives -- verify before enabling.
cnn_checkpoint = torch.load(model_path, map_location="cpu")
convolution_model.load_state_dict(cnn_checkpoint['model_state_dict'])

# The CNN is only used as a frozen feature extractor from here on, so switch
# it to inference mode (affects layers such as dropout / batch-norm, if any).
convolution_model.eval()

# Linear classifier trained incrementally on the CNN features.
# hinge loss => linear SVM objective; elasticnet => mixed L1/L2 penalty.
# Note: max_iter only applies to fit(); each partial_fit call performs a
# single pass over the batch it is given.
sgd_clf = SGDClassifier(
    loss='hinge',
    penalty='elasticnet',
    max_iter=1000,
)


  convolution_model.load_state_dict(torch.load(model_path)['model_state_dict'])


Initializing new run for the Convolutional SGD model

In [None]:
# Initialize Neptune for experiment tracking
import os
from getpass import getpass

# NOTE: this rebinds `run_name`. The model-loading cell builds the CNN
# checkpoint path from `run_name`, so re-running that cell after this one
# would no longer point at the CNN checkpoint.
run_name = f"ConvolutionalML_{time.strftime('%Y%m%d_%H%M%S')}"

# Never paste the API token into the notebook (it would be saved and shared
# with the file). Read it from the NEPTUNE_API_TOKEN environment variable and
# fall back to a hidden interactive prompt when it is not set.
neptune_api_token = os.environ.get("NEPTUNE_API_TOKEN") or getpass("Neptune API token: ")

run = neptune.init_run(
    # DON'T CHANGE THIS
    project="muguryalcin/TKPR221",
    # Token comes from the environment / prompt above, not from source
    api_token=neptune_api_token,
    # Name of the experiment using timestamp to prevent confusion
    name=run_name,
    # Description of the experiment
    description="Using pretrained CNN to extract features and feed them to SGD for traffic sign classification",
    # Tags describing the experiment
    tags=["C+ML","SGDClassifier"]
)

# Read the classifier configuration once instead of once per logged field
sgd_params = sgd_clf.get_params()

# Log the hyperparameters
run["hyperparameters"] = {
    "n_epochs": n_epochs,
    # Classifier Specific Parameters
    "model": {
        "type": "SGDClassifier",
        "loss": sgd_params['loss'],
        "penalty": sgd_params['penalty'],
        "alpha": sgd_params['alpha'],
        "max_iter": sgd_params['max_iter']
    },
    # Dataset Specific Parameters
    "dataset": {
        "batch_size": batch_size,
        # NOTE(review): "total_size" is the length of the *training* dataset object,
        # not train+val+test -- confirm this is the intended meaning.
        "total_size": len(train_dataset),
        "train_size": len(train_df),
        "val_size": len(val_df),
        "test_size": len(test_df),
        "n_classes": len(train_dataset.label_encoder.classes_),
        "image_size": image_size,
        "flattened": True,
        "transformations": str(train_transform)  # Convert transform to string representation
    },
}

[neptune] [info   ] Neptune initialized. Open in the app: https://app.neptune.ai/muguryalcin/TKPR221/e/TKPR-191


Train Loop

In [None]:
# Train the SGD classifier on CNN features, validate after every epoch,
# then evaluate once on the test set. All metrics are logged to Neptune.

# Full label set; partial_fit needs it because a single batch may not contain every class.
# NOTE(review): assumes the loaders yield labels in the same space as
# label_encoder.classes_ -- confirm against the dataset class.
unique_classes = train_dataset.label_encoder.classes_

# Use the feature-extraction CNN that was loaded for this section (not the
# full classifier `model`), on the same device as the batches and in
# inference mode.
feature_extractor = convolution_model.to(device).eval()


def _extract_features(images):
    """Run one image batch through the frozen CNN and return a 2-D NumPy array.

    NOTE(review): assumes the CNN returns a single tensor whose first axis is
    the batch -- confirm against the CNN class definition.
    """
    with torch.no_grad():
        features = feature_extractor(images.to(device)).cpu().numpy()
    # Collapse any remaining axes so sklearn always receives (n_samples, n_features)
    return features.reshape(features.shape[0], -1)


def _weighted_metrics(y_true, y_pred):
    """Return (accuracy, f1, precision, recall), the last three support-weighted.

    zero_division=0 yields the same values as sklearn's default but without the
    undefined-metric warning for classes missing from a small batch.
    """
    return (
        accuracy_score(y_true, y_pred),
        f1_score(y_true, y_pred, average='weighted', zero_division=0),
        precision_score(y_true, y_pred, average='weighted', zero_division=0),
        recall_score(y_true, y_pred, average='weighted', zero_division=0),
    )


def _predict_loader(loader, desc):
    """Predict every batch of `loader` with the current classifier; return (preds, labels) lists."""
    all_preds, all_labels = [], []
    for images, labels in tqdm(loader, desc=desc, leave=False):
        all_preds.extend(sgd_clf.predict(_extract_features(images)))
        all_labels.extend(labels.numpy())
    return all_preds, all_labels


def _log_metrics(split, accuracy, f1, precision, recall):
    """Append one value per metric to the Neptune series under `<split>/...`."""
    run[f"{split}/accuracy"].log(accuracy)
    run[f"{split}/f1"].log(f1)
    run[f"{split}/precision"].log(precision)
    run[f"{split}/recall"].log(recall)


for epoch in tqdm(range(n_epochs), desc="Training epochs"):
    train_preds = []
    train_labels = []
    print(f"\nStarting epoch {epoch+1}/{n_epochs}")

    for i, (images, labels) in enumerate(tqdm(train_loader, desc=f"Epoch {epoch+1}/{n_epochs}", leave=False)):
        # Get CNN features
        features = _extract_features(images)
        labels = labels.numpy()
        # Train SGD on batch
        sgd_clf.partial_fit(features, labels, classes=unique_classes)
        # Predictions are made on the batch the classifier was just updated on,
        # so these training metrics are optimistic by construction.
        preds = sgd_clf.predict(features)
        # Store predictions and labels for metrics
        train_preds.extend(preds)
        train_labels.extend(labels)

        if i % 25 == 0:
            batch_acc, batch_f1, batch_precision, batch_recall = _weighted_metrics(labels, preds)
            print(f"Batch {i}: Training accuracy = {batch_acc:.4f}, F1 = {batch_f1:.4f}, Precision = {batch_precision:.4f}, Recall = {batch_recall:.4f}")

    # Calculate, log and print Train Metrics
    train_accuracy, train_f1, train_precision, train_recall = _weighted_metrics(train_labels, train_preds)
    _log_metrics("train", train_accuracy, train_f1, train_precision, train_recall)
    # accuracy_score returns a fraction in [0, 1]; ':.2%' renders it as a percentage
    print(f"\nEpoch {epoch+1} training accuracy: {train_accuracy:.2%}")
    print(f"Epoch {epoch+1} training F1 score: {train_f1:.4f}")
    print(f"Epoch {epoch+1} training precision: {train_precision:.4f}")
    print(f"Epoch {epoch+1} training recall: {train_recall:.4f}")

    # Validation
    print("\nStarting validation...")
    val_preds, val_labels = _predict_loader(val_loader, "Validation")

    # Calculate, log and print Validation Metrics
    val_accuracy, val_f1, val_precision, val_recall = _weighted_metrics(val_labels, val_preds)
    _log_metrics("validation", val_accuracy, val_f1, val_precision, val_recall)
    print(f"Validation accuracy: {val_accuracy:.2%}")
    print(f"Validation F1 score: {val_f1:.4f}")
    print(f"Validation precision: {val_precision:.4f}")
    print(f"Validation recall: {val_recall:.4f}")

# TEST
print("\nStarting testing...")
test_preds, test_labels = _predict_loader(test_loader, "Testing")

# Calculate, log and print Test Metrics
test_accuracy, test_f1, test_precision, test_recall = _weighted_metrics(test_labels, test_preds)
_log_metrics("test", test_accuracy, test_f1, test_precision, test_recall)
print(f"Test accuracy: {test_accuracy:.2%}")
print(f"Test F1 score: {test_f1:.4f}")
print(f"Test precision: {test_precision:.4f}")
print(f"Test recall: {test_recall:.4f}")

run.stop()

Training epochs:   0%|          | 0/5 [00:00<?, ?it/s]


Starting epoch 1/5



  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))

Epoch 1/5:   0%|          | 1/2208 [00:01<1:07:19,  1.83s/it][A

Batch 0: Training accuracy = 0.0625, F1 = 0.0456, Precision = 0.0448, Recall = 0.0625



Epoch 1/5:   0%|          | 2/2208 [00:02<35:02,  1.05it/s]  [A
Epoch 1/5:   0%|          | 3/2208 [00:02<24:43,  1.49it/s][A
Epoch 1/5:   0%|          | 4/2208 [00:02<20:01,  1.83it/s][A
Epoch 1/5:   0%|          | 5/2208 [00:03<17:43,  2.07it/s][A
Epoch 1/5:   0%|          | 6/2208 [00:03<15:56,  2.30it/s][A
Epoch 1/5:   0%|          | 7/2208 [00:03<15:13,  2.41it/s][A
Epoch 1/5:   0%|          | 8/2208 [00:04<14:21,  2.55it/s][A
Epoch 1/5:   0%|          | 9/2208 [00:04<13:46,  2.66it/s][A
Epoch 1/5:   0%|          | 10/2208 [00:04<13:22,  2.74it/s][A
Epoch 1/5:   0%|          | 11/2208 [00:05<13:23,  2.73it/s][A
Epoch 1/5:   1%|          | 12/2208 [00:05<13:05,  2.80it/s][A
Epoch 1/5:   1%|          | 13/2208 [00:06<12:52,  2.84it/s][A
Epoch 1/5:   1%|          | 14/2208 [00:06<12:44,  2.87it/s][A
Epoch 1/5:   1%|          | 15/2208 [00:06<13:05,  2.79it/s][A
Epoch 1/5:   1%|          | 16/2208 [00:07<13:26,  2.72it/s][A
Epoch 1/5:   1%|          | 17/2208 [00:07<13

Batch 25: Training accuracy = 0.2422, F1 = 0.1660, Precision = 0.1468, Recall = 0.2422



Epoch 1/5:   1%|          | 27/2208 [00:11<13:42,  2.65it/s][A
Epoch 1/5:   1%|▏         | 28/2208 [00:11<13:23,  2.71it/s][A
Epoch 1/5:   1%|▏         | 29/2208 [00:11<13:17,  2.73it/s][A
Epoch 1/5:   1%|▏         | 30/2208 [00:12<13:00,  2.79it/s][A
Epoch 1/5:   1%|▏         | 31/2208 [00:12<12:59,  2.79it/s][A
Epoch 1/5:   1%|▏         | 32/2208 [00:12<13:04,  2.77it/s][A
Epoch 1/5:   1%|▏         | 33/2208 [00:13<13:07,  2.76it/s][A
Epoch 1/5:   2%|▏         | 34/2208 [00:13<13:11,  2.75it/s][A
Epoch 1/5:   2%|▏         | 35/2208 [00:14<13:12,  2.74it/s][A
Epoch 1/5:   2%|▏         | 36/2208 [00:14<13:19,  2.72it/s][A
Epoch 1/5:   2%|▏         | 37/2208 [00:14<13:12,  2.74it/s][A
Epoch 1/5:   2%|▏         | 38/2208 [00:15<13:05,  2.76it/s][A
Epoch 1/5:   2%|▏         | 39/2208 [00:15<13:22,  2.70it/s][A
Epoch 1/5:   2%|▏         | 40/2208 [00:15<13:07,  2.75it/s][A
Epoch 1/5:   2%|▏         | 41/2208 [00:16<12:51,  2.81it/s][A
Epoch 1/5:   2%|▏         | 42/2208 [00

Batch 50: Training accuracy = 0.3203, F1 = 0.2622, Precision = 0.2605, Recall = 0.3203



Epoch 1/5:   2%|▏         | 52/2208 [00:20<12:19,  2.91it/s][A
Epoch 1/5:   2%|▏         | 53/2208 [00:20<12:16,  2.92it/s][A
Epoch 1/5:   2%|▏         | 54/2208 [00:20<12:33,  2.86it/s][A
Epoch 1/5:   2%|▏         | 55/2208 [00:21<12:27,  2.88it/s][A
Epoch 1/5:   3%|▎         | 56/2208 [00:21<12:27,  2.88it/s][A
Epoch 1/5:   3%|▎         | 57/2208 [00:21<12:37,  2.84it/s][A
Epoch 1/5:   3%|▎         | 58/2208 [00:22<13:02,  2.75it/s][A
Epoch 1/5:   3%|▎         | 59/2208 [00:22<13:13,  2.71it/s][A
Epoch 1/5:   3%|▎         | 60/2208 [00:22<13:03,  2.74it/s][A
Epoch 1/5:   3%|▎         | 61/2208 [00:23<13:08,  2.72it/s][A
Epoch 1/5:   3%|▎         | 62/2208 [00:23<12:52,  2.78it/s][A
Epoch 1/5:   3%|▎         | 63/2208 [00:24<13:16,  2.69it/s][A
Epoch 1/5:   3%|▎         | 64/2208 [00:24<12:56,  2.76it/s][A
Epoch 1/5:   3%|▎         | 65/2208 [00:24<12:53,  2.77it/s][A
Epoch 1/5:   3%|▎         | 66/2208 [00:25<12:55,  2.76it/s][A
Epoch 1/5:   3%|▎         | 67/2208 [00

Batch 75: Training accuracy = 0.5156, F1 = 0.4471, Precision = 0.4327, Recall = 0.5156



Epoch 1/5:   3%|▎         | 77/2208 [00:29<13:05,  2.71it/s][A
Epoch 1/5:   4%|▎         | 78/2208 [00:29<13:09,  2.70it/s][A
Epoch 1/5:   4%|▎         | 79/2208 [00:29<13:03,  2.72it/s][A
Epoch 1/5:   4%|▎         | 80/2208 [00:30<12:42,  2.79it/s][A
Epoch 1/5:   4%|▎         | 81/2208 [00:30<12:42,  2.79it/s][A
Epoch 1/5:   4%|▎         | 82/2208 [00:30<12:54,  2.74it/s][A
Epoch 1/5:   4%|▍         | 83/2208 [00:31<12:38,  2.80it/s][A
Epoch 1/5:   4%|▍         | 84/2208 [00:31<12:45,  2.77it/s][A
Epoch 1/5:   4%|▍         | 85/2208 [00:32<12:29,  2.83it/s][A
Epoch 1/5:   4%|▍         | 86/2208 [00:32<12:31,  2.82it/s][A
Epoch 1/5:   4%|▍         | 87/2208 [00:32<12:29,  2.83it/s][A
Epoch 1/5:   4%|▍         | 88/2208 [00:33<12:40,  2.79it/s][A
Epoch 1/5:   4%|▍         | 89/2208 [00:33<12:26,  2.84it/s][A
Epoch 1/5:   4%|▍         | 90/2208 [00:33<12:27,  2.83it/s][A
Epoch 1/5:   4%|▍         | 91/2208 [00:34<12:38,  2.79it/s][A
Epoch 1/5:   4%|▍         | 92/2208 [00

Batch 100: Training accuracy = 0.4297, F1 = 0.3866, Precision = 0.3795, Recall = 0.4297



Epoch 1/5:   5%|▍         | 102/2208 [00:38<12:31,  2.80it/s][A
Epoch 1/5:   5%|▍         | 103/2208 [00:38<12:44,  2.75it/s][A
Epoch 1/5:   5%|▍         | 104/2208 [00:38<12:46,  2.74it/s][A
Epoch 1/5:   5%|▍         | 105/2208 [00:39<12:52,  2.72it/s][A
Epoch 1/5:   5%|▍         | 106/2208 [00:39<12:48,  2.73it/s][A
Epoch 1/5:   5%|▍         | 107/2208 [00:39<12:33,  2.79it/s][A
Epoch 1/5:   5%|▍         | 108/2208 [00:40<12:37,  2.77it/s][A
Epoch 1/5:   5%|▍         | 109/2208 [00:40<12:24,  2.82it/s][A
Epoch 1/5:   5%|▍         | 110/2208 [00:40<12:20,  2.83it/s][A
Epoch 1/5:   5%|▌         | 111/2208 [00:41<12:10,  2.87it/s][A
Epoch 1/5:   5%|▌         | 112/2208 [00:41<12:02,  2.90it/s][A
Epoch 1/5:   5%|▌         | 113/2208 [00:42<12:12,  2.86it/s][A
Epoch 1/5:   5%|▌         | 114/2208 [00:42<12:05,  2.89it/s][A
Epoch 1/5:   5%|▌         | 115/2208 [00:42<12:03,  2.89it/s][A
Epoch 1/5:   5%|▌         | 116/2208 [00:43<12:16,  2.84it/s][A
Epoch 1/5:   5%|▌       

Batch 125: Training accuracy = 0.5703, F1 = 0.5167, Precision = 0.5133, Recall = 0.5703



Epoch 1/5:   6%|▌         | 127/2208 [00:46<12:20,  2.81it/s][A
Epoch 1/5:   6%|▌         | 128/2208 [00:47<12:10,  2.85it/s][A
Epoch 1/5:   6%|▌         | 129/2208 [00:47<12:03,  2.88it/s][A
Epoch 1/5:   6%|▌         | 130/2208 [00:47<11:57,  2.90it/s][A
Epoch 1/5:   6%|▌         | 131/2208 [00:48<11:56,  2.90it/s][A
Epoch 1/5:   6%|▌         | 132/2208 [00:48<11:57,  2.89it/s][A
Epoch 1/5:   6%|▌         | 133/2208 [00:49<11:52,  2.91it/s][A
Epoch 1/5:   6%|▌         | 134/2208 [00:49<11:47,  2.93it/s][A
Epoch 1/5:   6%|▌         | 135/2208 [00:49<12:04,  2.86it/s][A
Epoch 1/5:   6%|▌         | 136/2208 [00:50<11:57,  2.89it/s][A
Epoch 1/5:   6%|▌         | 137/2208 [00:50<12:05,  2.86it/s][A
Epoch 1/5:   6%|▋         | 138/2208 [00:50<12:01,  2.87it/s][A
Epoch 1/5:   6%|▋         | 139/2208 [00:51<12:01,  2.87it/s][A
Epoch 1/5:   6%|▋         | 140/2208 [00:51<12:14,  2.81it/s][A
Epoch 1/5:   6%|▋         | 141/2208 [00:51<12:26,  2.77it/s][A
Epoch 1/5:   6%|▋       

Batch 150: Training accuracy = 0.5391, F1 = 0.4784, Precision = 0.4649, Recall = 0.5391



Epoch 1/5:   7%|▋         | 152/2208 [00:56<12:53,  2.66it/s][A
Epoch 1/5:   7%|▋         | 153/2208 [00:56<12:28,  2.75it/s][A
Epoch 1/5:   7%|▋         | 154/2208 [00:56<12:33,  2.73it/s][A
Epoch 1/5:   7%|▋         | 155/2208 [00:57<12:17,  2.79it/s][A
Epoch 1/5:   7%|▋         | 156/2208 [00:57<12:14,  2.79it/s][A
Epoch 1/5:   7%|▋         | 157/2208 [00:57<12:08,  2.81it/s][A
Epoch 1/5:   7%|▋         | 158/2208 [00:58<12:16,  2.78it/s][A
Epoch 1/5:   7%|▋         | 159/2208 [00:58<12:06,  2.82it/s][A
Epoch 1/5:   7%|▋         | 160/2208 [00:58<11:57,  2.85it/s][A
Epoch 1/5:   7%|▋         | 161/2208 [00:59<12:11,  2.80it/s][A
Epoch 1/5:   7%|▋         | 162/2208 [00:59<12:15,  2.78it/s][A
Epoch 1/5:   7%|▋         | 163/2208 [00:59<12:03,  2.83it/s][A
Epoch 1/5:   7%|▋         | 164/2208 [01:00<12:08,  2.81it/s][A
Epoch 1/5:   7%|▋         | 165/2208 [01:00<11:57,  2.85it/s][A
Epoch 1/5:   8%|▊         | 166/2208 [01:00<12:05,  2.81it/s][A
Epoch 1/5:   8%|▊       

Batch 175: Training accuracy = 0.5156, F1 = 0.4532, Precision = 0.4457, Recall = 0.5156



Epoch 1/5:   8%|▊         | 177/2208 [01:04<12:06,  2.80it/s][A
Epoch 1/5:   8%|▊         | 178/2208 [01:05<11:59,  2.82it/s][A
Epoch 1/5:   8%|▊         | 179/2208 [01:05<11:47,  2.87it/s][A
Epoch 1/5:   8%|▊         | 180/2208 [01:05<11:48,  2.86it/s][A
Epoch 1/5:   8%|▊         | 181/2208 [01:06<11:56,  2.83it/s][A
Epoch 1/5:   8%|▊         | 182/2208 [01:06<11:54,  2.83it/s][A
Epoch 1/5:   8%|▊         | 183/2208 [01:07<12:46,  2.64it/s][A
Epoch 1/5:   8%|▊         | 184/2208 [01:07<12:28,  2.71it/s][A
Epoch 1/5:   8%|▊         | 185/2208 [01:07<12:10,  2.77it/s][A
Epoch 1/5:   8%|▊         | 186/2208 [01:08<11:59,  2.81it/s][A
Epoch 1/5:   8%|▊         | 187/2208 [01:08<11:47,  2.86it/s][A
Epoch 1/5:   9%|▊         | 188/2208 [01:08<11:42,  2.87it/s][A
Epoch 1/5:   9%|▊         | 189/2208 [01:09<11:38,  2.89it/s][A
Epoch 1/5:   9%|▊         | 190/2208 [01:09<11:54,  2.82it/s][A
Epoch 1/5:   9%|▊         | 191/2208 [01:09<11:48,  2.85it/s][A
Epoch 1/5:   9%|▊       

Batch 200: Training accuracy = 0.6484, F1 = 0.5872, Precision = 0.5641, Recall = 0.6484



Epoch 1/5:   9%|▉         | 202/2208 [01:13<11:38,  2.87it/s][A
Epoch 1/5:   9%|▉         | 203/2208 [01:13<11:33,  2.89it/s][A
Epoch 1/5:   9%|▉         | 204/2208 [01:14<11:30,  2.90it/s][A
Epoch 1/5:   9%|▉         | 205/2208 [01:14<11:32,  2.89it/s][A
Epoch 1/5:   9%|▉         | 206/2208 [01:15<11:44,  2.84it/s][A
Epoch 1/5:   9%|▉         | 207/2208 [01:15<11:51,  2.81it/s][A
Epoch 1/5:   9%|▉         | 208/2208 [01:15<11:42,  2.85it/s][A
Epoch 1/5:   9%|▉         | 209/2208 [01:16<11:44,  2.84it/s][A
Epoch 1/5:  10%|▉         | 210/2208 [01:16<11:57,  2.78it/s][A
Epoch 1/5:  10%|▉         | 211/2208 [01:16<12:00,  2.77it/s][A
Epoch 1/5:  10%|▉         | 212/2208 [01:17<12:19,  2.70it/s][A
Epoch 1/5:  10%|▉         | 213/2208 [01:17<12:01,  2.77it/s][A
Epoch 1/5:  10%|▉         | 214/2208 [01:17<11:48,  2.81it/s][A
Epoch 1/5:  10%|▉         | 215/2208 [01:18<11:51,  2.80it/s][A
Epoch 1/5:  10%|▉         | 216/2208 [01:18<11:58,  2.77it/s][A
Epoch 1/5:  10%|▉       

Batch 225: Training accuracy = 0.6797, F1 = 0.6353, Precision = 0.6309, Recall = 0.6797



Epoch 1/5:  10%|█         | 227/2208 [01:22<11:55,  2.77it/s][A
Epoch 1/5:  10%|█         | 228/2208 [01:22<11:45,  2.80it/s][A
Epoch 1/5:  10%|█         | 229/2208 [01:23<11:55,  2.77it/s][A
Epoch 1/5:  10%|█         | 230/2208 [01:23<12:04,  2.73it/s][A
Epoch 1/5:  10%|█         | 231/2208 [01:24<11:50,  2.78it/s][A
Epoch 1/5:  11%|█         | 232/2208 [01:24<11:40,  2.82it/s][A
Epoch 1/5:  11%|█         | 233/2208 [01:24<11:33,  2.85it/s][A
Epoch 1/5:  11%|█         | 234/2208 [01:25<11:27,  2.87it/s][A
Epoch 1/5:  11%|█         | 235/2208 [01:25<11:24,  2.88it/s][A
Epoch 1/5:  11%|█         | 236/2208 [01:25<11:18,  2.91it/s][A
Epoch 1/5:  11%|█         | 237/2208 [01:26<11:14,  2.92it/s][A
Epoch 1/5:  11%|█         | 238/2208 [01:26<11:24,  2.88it/s][A
Epoch 1/5:  11%|█         | 239/2208 [01:26<11:38,  2.82it/s][A
Epoch 1/5:  11%|█         | 240/2208 [01:27<11:28,  2.86it/s][A
Epoch 1/5:  11%|█         | 241/2208 [01:27<11:31,  2.84it/s][A
Epoch 1/5:  11%|█       

Batch 250: Training accuracy = 0.5469, F1 = 0.4853, Precision = 0.4624, Recall = 0.5469



Epoch 1/5:  11%|█▏        | 252/2208 [01:31<11:16,  2.89it/s][A
Epoch 1/5:  11%|█▏        | 253/2208 [01:31<11:20,  2.87it/s][A
Epoch 1/5:  12%|█▏        | 254/2208 [01:32<11:16,  2.89it/s][A
Epoch 1/5:  12%|█▏        | 255/2208 [01:32<11:26,  2.84it/s][A
Epoch 1/5:  12%|█▏        | 256/2208 [01:32<11:17,  2.88it/s][A
Epoch 1/5:  12%|█▏        | 257/2208 [01:33<11:09,  2.91it/s][A
Epoch 1/5:  12%|█▏        | 258/2208 [01:33<11:05,  2.93it/s][A
Epoch 1/5:  12%|█▏        | 259/2208 [01:33<11:04,  2.93it/s][A
Epoch 1/5:  12%|█▏        | 260/2208 [01:34<11:23,  2.85it/s][A
Epoch 1/5:  12%|█▏        | 261/2208 [01:34<11:18,  2.87it/s][A
Epoch 1/5:  12%|█▏        | 262/2208 [01:34<11:16,  2.88it/s][A
Epoch 1/5:  12%|█▏        | 263/2208 [01:35<11:13,  2.89it/s][A
Epoch 1/5:  12%|█▏        | 264/2208 [01:35<11:22,  2.85it/s][A
Epoch 1/5:  12%|█▏        | 265/2208 [01:35<11:20,  2.86it/s][A
Epoch 1/5:  12%|█▏        | 266/2208 [01:36<11:13,  2.88it/s][A
Epoch 1/5:  12%|█▏      

Batch 275: Training accuracy = 0.6953, F1 = 0.6585, Precision = 0.6423, Recall = 0.6953



Epoch 1/5:  13%|█▎        | 277/2208 [01:40<11:51,  2.71it/s][A
Epoch 1/5:  13%|█▎        | 278/2208 [01:40<12:04,  2.66it/s][A
Epoch 1/5:  13%|█▎        | 279/2208 [01:41<12:15,  2.62it/s][A
Epoch 1/5:  13%|█▎        | 280/2208 [01:41<11:48,  2.72it/s][A
Epoch 1/5:  13%|█▎        | 281/2208 [01:41<11:41,  2.75it/s][A
Epoch 1/5:  13%|█▎        | 282/2208 [01:42<11:40,  2.75it/s][A
Epoch 1/5:  13%|█▎        | 283/2208 [01:42<11:27,  2.80it/s][A
Epoch 1/5:  13%|█▎        | 284/2208 [01:42<11:15,  2.85it/s][A
Epoch 1/5:  13%|█▎        | 285/2208 [01:43<11:33,  2.77it/s][A
Epoch 1/5:  13%|█▎        | 286/2208 [01:43<11:20,  2.82it/s][A
Epoch 1/5:  13%|█▎        | 287/2208 [01:43<11:11,  2.86it/s][A
Epoch 1/5:  13%|█▎        | 288/2208 [01:44<11:04,  2.89it/s][A
Epoch 1/5:  13%|█▎        | 289/2208 [01:44<11:01,  2.90it/s][A
Epoch 1/5:  13%|█▎        | 290/2208 [01:44<10:59,  2.91it/s][A
Epoch 1/5:  13%|█▎        | 291/2208 [01:45<11:06,  2.88it/s][A
Epoch 1/5:  13%|█▎      

Batch 300: Training accuracy = 0.6562, F1 = 0.6265, Precision = 0.6292, Recall = 0.6562



Epoch 1/5:  14%|█▎        | 302/2208 [01:49<11:17,  2.81it/s][A
Epoch 1/5:  14%|█▎        | 303/2208 [01:49<11:11,  2.84it/s][A
Epoch 1/5:  14%|█▍        | 304/2208 [01:49<11:20,  2.80it/s][A
Epoch 1/5:  14%|█▍        | 305/2208 [01:50<11:11,  2.83it/s][A
Epoch 1/5:  14%|█▍        | 306/2208 [01:50<11:11,  2.83it/s][A
Epoch 1/5:  14%|█▍        | 307/2208 [01:50<11:03,  2.87it/s][A
Epoch 1/5:  14%|█▍        | 308/2208 [01:51<11:12,  2.83it/s][A
Epoch 1/5:  14%|█▍        | 309/2208 [01:51<11:25,  2.77it/s][A
Epoch 1/5:  14%|█▍        | 310/2208 [01:52<11:35,  2.73it/s][A
Epoch 1/5:  14%|█▍        | 311/2208 [01:52<11:26,  2.77it/s][A
Epoch 1/5:  14%|█▍        | 312/2208 [01:52<11:16,  2.80it/s][A
Epoch 1/5:  14%|█▍        | 313/2208 [01:53<11:12,  2.82it/s][A
Epoch 1/5:  14%|█▍        | 314/2208 [01:53<11:14,  2.81it/s][A
Epoch 1/5:  14%|█▍        | 315/2208 [01:53<11:12,  2.81it/s][A
Epoch 1/5:  14%|█▍        | 316/2208 [01:54<11:19,  2.78it/s][A
Epoch 1/5:  14%|█▍      

Batch 325: Training accuracy = 0.6641, F1 = 0.6295, Precision = 0.6243, Recall = 0.6641



Epoch 1/5:  15%|█▍        | 327/2208 [01:58<11:25,  2.74it/s][A
Epoch 1/5:  15%|█▍        | 328/2208 [01:58<11:11,  2.80it/s][A
Epoch 1/5:  15%|█▍        | 329/2208 [01:58<11:02,  2.83it/s][A
Epoch 1/5:  15%|█▍        | 330/2208 [01:59<10:54,  2.87it/s][A
Epoch 1/5:  15%|█▍        | 331/2208 [01:59<10:47,  2.90it/s][A
Epoch 1/5:  15%|█▌        | 332/2208 [01:59<10:48,  2.89it/s][A
Epoch 1/5:  15%|█▌        | 333/2208 [02:00<10:43,  2.91it/s][A
Epoch 1/5:  15%|█▌        | 334/2208 [02:00<10:50,  2.88it/s][A
Epoch 1/5:  15%|█▌        | 335/2208 [02:00<11:02,  2.83it/s][A
Epoch 1/5:  15%|█▌        | 336/2208 [02:01<11:16,  2.77it/s][A
Epoch 1/5:  15%|█▌        | 337/2208 [02:01<11:07,  2.80it/s][A
Epoch 1/5:  15%|█▌        | 338/2208 [02:01<10:57,  2.84it/s][A
Epoch 1/5:  15%|█▌        | 339/2208 [02:02<10:49,  2.88it/s][A
Epoch 1/5:  15%|█▌        | 340/2208 [02:02<10:47,  2.89it/s][A
Epoch 1/5:  15%|█▌        | 341/2208 [02:02<10:42,  2.91it/s][A
Epoch 1/5:  15%|█▌      

Batch 350: Training accuracy = 0.6484, F1 = 0.6112, Precision = 0.6150, Recall = 0.6484



Epoch 1/5:  16%|█▌        | 352/2208 [02:06<10:48,  2.86it/s][A
Epoch 1/5:  16%|█▌        | 353/2208 [02:07<10:58,  2.82it/s][A
Epoch 1/5:  16%|█▌        | 354/2208 [02:07<11:04,  2.79it/s][A
Epoch 1/5:  16%|█▌        | 355/2208 [02:07<11:08,  2.77it/s][A
Epoch 1/5:  16%|█▌        | 356/2208 [02:08<10:58,  2.81it/s][A
Epoch 1/5:  16%|█▌        | 357/2208 [02:08<11:02,  2.80it/s][A
Epoch 1/5:  16%|█▌        | 358/2208 [02:08<10:55,  2.82it/s][A
Epoch 1/5:  16%|█▋        | 359/2208 [02:09<11:06,  2.77it/s][A
Epoch 1/5:  16%|█▋        | 360/2208 [02:09<11:12,  2.75it/s][A
Epoch 1/5:  16%|█▋        | 361/2208 [02:10<11:15,  2.74it/s][A
Epoch 1/5:  16%|█▋        | 362/2208 [02:10<11:16,  2.73it/s][A
Epoch 1/5:  16%|█▋        | 363/2208 [02:10<11:00,  2.79it/s][A
Epoch 1/5:  16%|█▋        | 364/2208 [02:11<10:48,  2.84it/s][A
Epoch 1/5:  17%|█▋        | 365/2208 [02:11<10:40,  2.88it/s][A
Epoch 1/5:  17%|█▋        | 366/2208 [02:11<10:36,  2.89it/s][A
Epoch 1/5:  17%|█▋      

Batch 375: Training accuracy = 0.6875, F1 = 0.6432, Precision = 0.6335, Recall = 0.6875



Epoch 1/5:  17%|█▋        | 377/2208 [02:15<11:00,  2.77it/s][A
Epoch 1/5:  17%|█▋        | 378/2208 [02:16<10:54,  2.80it/s][A
Epoch 1/5:  17%|█▋        | 379/2208 [02:16<11:10,  2.73it/s][A
Epoch 1/5:  17%|█▋        | 380/2208 [02:16<10:58,  2.78it/s][A
Epoch 1/5:  17%|█▋        | 381/2208 [02:17<10:50,  2.81it/s][A
Epoch 1/5:  17%|█▋        | 382/2208 [02:17<10:56,  2.78it/s][A
Epoch 1/5:  17%|█▋        | 383/2208 [02:17<10:45,  2.83it/s][A
Epoch 1/5:  17%|█▋        | 384/2208 [02:18<10:38,  2.86it/s][A
Epoch 1/5:  17%|█▋        | 385/2208 [02:18<10:32,  2.88it/s][A
Epoch 1/5:  17%|█▋        | 386/2208 [02:18<10:47,  2.81it/s][A
Epoch 1/5:  18%|█▊        | 387/2208 [02:19<10:41,  2.84it/s][A
Epoch 1/5:  18%|█▊        | 388/2208 [02:19<10:50,  2.80it/s][A
Epoch 1/5:  18%|█▊        | 389/2208 [02:19<11:00,  2.75it/s][A
Epoch 1/5:  18%|█▊        | 390/2208 [02:20<10:48,  2.81it/s][A
Epoch 1/5:  18%|█▊        | 391/2208 [02:20<10:43,  2.82it/s][A
Epoch 1/5:  18%|█▊      

Batch 400: Training accuracy = 0.7891, F1 = 0.7591, Precision = 0.7509, Recall = 0.7891



Epoch 1/5:  18%|█▊        | 402/2208 [02:24<10:46,  2.79it/s][A
Epoch 1/5:  18%|█▊        | 403/2208 [02:25<10:50,  2.78it/s][A
Epoch 1/5:  18%|█▊        | 404/2208 [02:25<10:37,  2.83it/s][A
Epoch 1/5:  18%|█▊        | 405/2208 [02:25<10:50,  2.77it/s][A
Epoch 1/5:  18%|█▊        | 406/2208 [02:26<10:55,  2.75it/s][A
Epoch 1/5:  18%|█▊        | 407/2208 [02:26<10:41,  2.81it/s][A
Epoch 1/5:  18%|█▊        | 408/2208 [02:26<10:41,  2.81it/s][A
Epoch 1/5:  19%|█▊        | 409/2208 [02:27<10:32,  2.85it/s][A
Epoch 1/5:  19%|█▊        | 410/2208 [02:27<10:23,  2.88it/s][A
Epoch 1/5:  19%|█▊        | 411/2208 [02:27<10:40,  2.81it/s][A
Epoch 1/5:  19%|█▊        | 412/2208 [02:28<10:43,  2.79it/s][A
Epoch 1/5:  19%|█▊        | 413/2208 [02:28<10:33,  2.83it/s][A
Epoch 1/5:  19%|█▉        | 414/2208 [02:28<10:40,  2.80it/s][A
Epoch 1/5:  19%|█▉        | 415/2208 [02:29<10:45,  2.78it/s][A
Epoch 1/5:  19%|█▉        | 416/2208 [02:29<10:34,  2.82it/s][A
Epoch 1/5:  19%|█▉      

Batch 425: Training accuracy = 0.7266, F1 = 0.7044, Precision = 0.7211, Recall = 0.7266



Epoch 1/5:  19%|█▉        | 427/2208 [02:33<10:35,  2.80it/s][A
Epoch 1/5:  19%|█▉        | 428/2208 [02:33<10:35,  2.80it/s][A
Epoch 1/5:  19%|█▉        | 429/2208 [02:34<10:37,  2.79it/s][A
Epoch 1/5:  19%|█▉        | 430/2208 [02:34<10:55,  2.71it/s][A
Epoch 1/5:  20%|█▉        | 431/2208 [02:35<11:11,  2.65it/s][A
Epoch 1/5:  20%|█▉        | 432/2208 [02:35<10:50,  2.73it/s][A
Epoch 1/5:  20%|█▉        | 433/2208 [02:35<10:37,  2.78it/s][A
Epoch 1/5:  20%|█▉        | 434/2208 [02:36<10:30,  2.81it/s][A
Epoch 1/5:  20%|█▉        | 435/2208 [02:36<10:46,  2.74it/s][A
Epoch 1/5:  20%|█▉        | 436/2208 [02:36<10:46,  2.74it/s][A
Epoch 1/5:  20%|█▉        | 437/2208 [02:37<10:38,  2.77it/s][A
Epoch 1/5:  20%|█▉        | 438/2208 [02:37<10:25,  2.83it/s][A
Epoch 1/5:  20%|█▉        | 439/2208 [02:37<10:20,  2.85it/s][A
Epoch 1/5:  20%|█▉        | 440/2208 [02:38<10:29,  2.81it/s][A
Epoch 1/5:  20%|█▉        | 441/2208 [02:38<10:22,  2.84it/s][A
Epoch 1/5:  20%|██      

Batch 450: Training accuracy = 0.7188, F1 = 0.6893, Precision = 0.6960, Recall = 0.7188



Epoch 1/5:  20%|██        | 452/2208 [02:42<10:01,  2.92it/s][A
Epoch 1/5:  21%|██        | 453/2208 [02:42<09:59,  2.93it/s][A
Epoch 1/5:  21%|██        | 454/2208 [02:43<09:57,  2.93it/s][A
Epoch 1/5:  21%|██        | 455/2208 [02:43<10:20,  2.82it/s][A
Epoch 1/5:  21%|██        | 456/2208 [02:43<10:17,  2.84it/s][A
Epoch 1/5:  21%|██        | 457/2208 [02:44<10:23,  2.81it/s][A
Epoch 1/5:  21%|██        | 458/2208 [02:44<10:42,  2.72it/s][A
Epoch 1/5:  21%|██        | 459/2208 [02:44<10:50,  2.69it/s][A
Epoch 1/5:  21%|██        | 460/2208 [02:45<10:32,  2.76it/s][A
Epoch 1/5:  21%|██        | 461/2208 [02:45<10:22,  2.81it/s][A
Epoch 1/5:  21%|██        | 462/2208 [02:45<10:12,  2.85it/s][A
Epoch 1/5:  21%|██        | 463/2208 [02:46<10:32,  2.76it/s][A
Epoch 1/5:  21%|██        | 464/2208 [02:46<10:27,  2.78it/s][A
Epoch 1/5:  21%|██        | 465/2208 [02:47<10:18,  2.82it/s][A
Epoch 1/5:  21%|██        | 466/2208 [02:47<10:36,  2.73it/s][A
Epoch 1/5:  21%|██      

Batch 475: Training accuracy = 0.7109, F1 = 0.6688, Precision = 0.6543, Recall = 0.7109



Epoch 1/5:  22%|██▏       | 477/2208 [02:51<10:41,  2.70it/s][A
Epoch 1/5:  22%|██▏       | 478/2208 [02:51<10:29,  2.75it/s][A
Epoch 1/5:  22%|██▏       | 479/2208 [02:52<10:34,  2.73it/s][A
Epoch 1/5:  22%|██▏       | 480/2208 [02:52<10:42,  2.69it/s][A
Epoch 1/5:  22%|██▏       | 481/2208 [02:52<10:46,  2.67it/s][A
Epoch 1/5:  22%|██▏       | 482/2208 [02:53<10:40,  2.70it/s][A
Epoch 1/5:  22%|██▏       | 483/2208 [02:53<10:39,  2.70it/s][A
Epoch 1/5:  22%|██▏       | 484/2208 [02:53<10:44,  2.67it/s][A
Epoch 1/5:  22%|██▏       | 485/2208 [02:54<10:25,  2.75it/s][A
Epoch 1/5:  22%|██▏       | 486/2208 [02:54<10:13,  2.81it/s][A
Epoch 1/5:  22%|██▏       | 487/2208 [02:54<10:02,  2.85it/s][A
Epoch 1/5:  22%|██▏       | 488/2208 [02:55<09:56,  2.89it/s][A
Epoch 1/5:  22%|██▏       | 489/2208 [02:55<09:53,  2.90it/s][A
Epoch 1/5:  22%|██▏       | 490/2208 [02:56<10:16,  2.79it/s][A
Epoch 1/5:  22%|██▏       | 491/2208 [02:56<10:05,  2.83it/s][A
Epoch 1/5:  22%|██▏     

Batch 500: Training accuracy = 0.5859, F1 = 0.5417, Precision = 0.5309, Recall = 0.5859



Epoch 1/5:  23%|██▎       | 502/2208 [03:00<10:01,  2.84it/s][A
Epoch 1/5:  23%|██▎       | 503/2208 [03:00<09:54,  2.87it/s][A
Epoch 1/5:  23%|██▎       | 504/2208 [03:00<09:50,  2.89it/s][A
Epoch 1/5:  23%|██▎       | 505/2208 [03:01<09:45,  2.91it/s][A
Epoch 1/5:  23%|██▎       | 506/2208 [03:01<10:01,  2.83it/s][A
Epoch 1/5:  23%|██▎       | 507/2208 [03:02<09:55,  2.86it/s][A
Epoch 1/5:  23%|██▎       | 508/2208 [03:02<10:01,  2.83it/s][A
Epoch 1/5:  23%|██▎       | 509/2208 [03:02<10:12,  2.78it/s][A
Epoch 1/5:  23%|██▎       | 510/2208 [03:03<10:11,  2.77it/s][A
Epoch 1/5:  23%|██▎       | 511/2208 [03:03<10:02,  2.82it/s][A
Epoch 1/5:  23%|██▎       | 512/2208 [03:03<10:09,  2.78it/s][A
Epoch 1/5:  23%|██▎       | 513/2208 [03:04<10:05,  2.80it/s][A
Epoch 1/5:  23%|██▎       | 514/2208 [03:04<10:00,  2.82it/s][A
Epoch 1/5:  23%|██▎       | 515/2208 [03:04<10:15,  2.75it/s][A
Epoch 1/5:  23%|██▎       | 516/2208 [03:05<10:03,  2.80it/s][A
Epoch 1/5:  23%|██▎     

Batch 525: Training accuracy = 0.7656, F1 = 0.7305, Precision = 0.7161, Recall = 0.7656



Epoch 1/5:  24%|██▍       | 527/2208 [03:09<09:45,  2.87it/s][A
Epoch 1/5:  24%|██▍       | 528/2208 [03:09<09:41,  2.89it/s][A
Epoch 1/5:  24%|██▍       | 529/2208 [03:09<09:51,  2.84it/s][A
Epoch 1/5:  24%|██▍       | 530/2208 [03:10<09:42,  2.88it/s][A
Epoch 1/5:  24%|██▍       | 531/2208 [03:10<09:39,  2.90it/s][A
Epoch 1/5:  24%|██▍       | 532/2208 [03:10<09:36,  2.91it/s][A
Epoch 1/5:  24%|██▍       | 533/2208 [03:11<09:32,  2.92it/s][A
Epoch 1/5:  24%|██▍       | 534/2208 [03:11<09:42,  2.87it/s][A
Epoch 1/5:  24%|██▍       | 535/2208 [03:11<09:39,  2.89it/s][A
Epoch 1/5:  24%|██▍       | 536/2208 [03:12<09:34,  2.91it/s][A
Epoch 1/5:  24%|██▍       | 537/2208 [03:12<09:33,  2.91it/s][A
Epoch 1/5:  24%|██▍       | 538/2208 [03:12<09:32,  2.92it/s][A
Epoch 1/5:  24%|██▍       | 539/2208 [03:13<09:29,  2.93it/s][A
Epoch 1/5:  24%|██▍       | 540/2208 [03:13<09:39,  2.88it/s][A
Epoch 1/5:  25%|██▍       | 541/2208 [03:13<09:40,  2.87it/s][A
Epoch 1/5:  25%|██▍     

Batch 550: Training accuracy = 0.7344, F1 = 0.7031, Precision = 0.6964, Recall = 0.7344



Epoch 1/5:  25%|██▌       | 552/2208 [03:17<09:51,  2.80it/s][A
Epoch 1/5:  25%|██▌       | 553/2208 [03:18<10:00,  2.76it/s][A
Epoch 1/5:  25%|██▌       | 554/2208 [03:18<09:50,  2.80it/s][A
Epoch 1/5:  25%|██▌       | 555/2208 [03:18<09:39,  2.85it/s][A
Epoch 1/5:  25%|██▌       | 556/2208 [03:19<09:35,  2.87it/s][A
Epoch 1/5:  25%|██▌       | 557/2208 [03:19<09:53,  2.78it/s][A
Epoch 1/5:  25%|██▌       | 558/2208 [03:19<09:46,  2.81it/s][A
Epoch 1/5:  25%|██▌       | 559/2208 [03:20<09:40,  2.84it/s][A
Epoch 1/5:  25%|██▌       | 560/2208 [03:20<09:55,  2.77it/s][A
Epoch 1/5:  25%|██▌       | 561/2208 [03:21<09:42,  2.83it/s][A
Epoch 1/5:  25%|██▌       | 562/2208 [03:21<09:41,  2.83it/s][A
Epoch 1/5:  25%|██▌       | 563/2208 [03:21<09:40,  2.83it/s][A
Epoch 1/5:  26%|██▌       | 564/2208 [03:22<09:36,  2.85it/s][A
Epoch 1/5:  26%|██▌       | 565/2208 [03:22<09:33,  2.86it/s][A
Epoch 1/5:  26%|██▌       | 566/2208 [03:22<09:30,  2.88it/s][A
Epoch 1/5:  26%|██▌     

Batch 575: Training accuracy = 0.6719, F1 = 0.6464, Precision = 0.6523, Recall = 0.6719



Epoch 1/5:  26%|██▌       | 577/2208 [03:26<09:42,  2.80it/s][A
Epoch 1/5:  26%|██▌       | 578/2208 [03:27<09:34,  2.84it/s][A
Epoch 1/5:  26%|██▌       | 579/2208 [03:27<09:26,  2.87it/s][A
Epoch 1/5:  26%|██▋       | 580/2208 [03:27<09:24,  2.88it/s][A
Epoch 1/5:  26%|██▋       | 581/2208 [03:28<09:39,  2.81it/s][A
Epoch 1/5:  26%|██▋       | 582/2208 [03:28<09:43,  2.78it/s][A
Epoch 1/5:  26%|██▋       | 583/2208 [03:28<09:42,  2.79it/s][A
Epoch 1/5:  26%|██▋       | 584/2208 [03:29<09:42,  2.79it/s][A
Epoch 1/5:  26%|██▋       | 585/2208 [03:29<09:31,  2.84it/s][A
Epoch 1/5:  27%|██▋       | 586/2208 [03:29<09:40,  2.79it/s][A
Epoch 1/5:  27%|██▋       | 587/2208 [03:30<09:31,  2.84it/s][A
Epoch 1/5:  27%|██▋       | 588/2208 [03:30<09:35,  2.82it/s][A
Epoch 1/5:  27%|██▋       | 589/2208 [03:30<09:27,  2.85it/s][A
Epoch 1/5:  27%|██▋       | 590/2208 [03:31<09:46,  2.76it/s][A
Epoch 1/5:  27%|██▋       | 591/2208 [03:31<09:34,  2.81it/s][A
Epoch 1/5:  27%|██▋     

Batch 600: Training accuracy = 0.6562, F1 = 0.6173, Precision = 0.6195, Recall = 0.6562



Epoch 1/5:  27%|██▋       | 602/2208 [03:35<09:45,  2.74it/s][A
Epoch 1/5:  27%|██▋       | 603/2208 [03:36<09:40,  2.77it/s][A
Epoch 1/5:  27%|██▋       | 604/2208 [03:36<09:34,  2.79it/s][A
Epoch 1/5:  27%|██▋       | 605/2208 [03:36<09:26,  2.83it/s][A
Epoch 1/5:  27%|██▋       | 606/2208 [03:37<09:29,  2.81it/s][A
Epoch 1/5:  27%|██▋       | 607/2208 [03:37<09:23,  2.84it/s][A
Epoch 1/5:  28%|██▊       | 608/2208 [03:37<09:25,  2.83it/s][A
Epoch 1/5:  28%|██▊       | 609/2208 [03:38<09:26,  2.82it/s][A
Epoch 1/5:  28%|██▊       | 610/2208 [03:38<09:33,  2.79it/s][A
Epoch 1/5:  28%|██▊       | 611/2208 [03:38<09:26,  2.82it/s][A
Epoch 1/5:  28%|██▊       | 612/2208 [03:39<09:22,  2.84it/s][A
Epoch 1/5:  28%|██▊       | 613/2208 [03:39<09:14,  2.88it/s][A
Epoch 1/5:  28%|██▊       | 614/2208 [03:39<09:20,  2.84it/s][A
Epoch 1/5:  28%|██▊       | 615/2208 [03:40<09:13,  2.88it/s][A
Epoch 1/5:  28%|██▊       | 616/2208 [03:40<09:10,  2.89it/s][A
Epoch 1/5:  28%|██▊     

Batch 625: Training accuracy = 0.7969, F1 = 0.7737, Precision = 0.7826, Recall = 0.7969



Epoch 1/5:  28%|██▊       | 627/2208 [03:44<09:24,  2.80it/s][A
Epoch 1/5:  28%|██▊       | 628/2208 [03:44<09:30,  2.77it/s][A
Epoch 1/5:  28%|██▊       | 629/2208 [03:45<09:34,  2.75it/s][A
Epoch 1/5:  29%|██▊       | 630/2208 [03:45<09:21,  2.81it/s][A
Epoch 1/5:  29%|██▊       | 631/2208 [03:45<09:11,  2.86it/s][A
Epoch 1/5:  29%|██▊       | 632/2208 [03:46<09:05,  2.89it/s][A
Epoch 1/5:  29%|██▊       | 633/2208 [03:46<09:02,  2.90it/s][A
Epoch 1/5:  29%|██▊       | 634/2208 [03:46<08:58,  2.92it/s][A
Epoch 1/5:  29%|██▉       | 635/2208 [03:47<08:55,  2.94it/s][A
Epoch 1/5:  29%|██▉       | 636/2208 [03:47<08:55,  2.94it/s][A
Epoch 1/5:  29%|██▉       | 637/2208 [03:47<09:09,  2.86it/s][A
Epoch 1/5:  29%|██▉       | 638/2208 [03:48<09:14,  2.83it/s][A
Epoch 1/5:  29%|██▉       | 639/2208 [03:48<09:07,  2.86it/s][A
Epoch 1/5:  29%|██▉       | 640/2208 [03:49<09:15,  2.82it/s][A
Epoch 1/5:  29%|██▉       | 641/2208 [03:49<09:07,  2.86it/s][A
Epoch 1/5:  29%|██▉     

Batch 650: Training accuracy = 0.7500, F1 = 0.7165, Precision = 0.7191, Recall = 0.7500



Epoch 1/5:  30%|██▉       | 652/2208 [03:53<09:08,  2.84it/s][A
Epoch 1/5:  30%|██▉       | 653/2208 [03:53<09:04,  2.86it/s][A
Epoch 1/5:  30%|██▉       | 654/2208 [03:53<08:58,  2.89it/s][A
Epoch 1/5:  30%|██▉       | 655/2208 [03:54<08:55,  2.90it/s][A
Epoch 1/5:  30%|██▉       | 656/2208 [03:54<08:53,  2.91it/s][A
Epoch 1/5:  30%|██▉       | 657/2208 [03:54<08:50,  2.92it/s][A
Epoch 1/5:  30%|██▉       | 658/2208 [03:55<08:47,  2.94it/s][A
Epoch 1/5:  30%|██▉       | 659/2208 [03:55<08:48,  2.93it/s][A
Epoch 1/5:  30%|██▉       | 660/2208 [03:55<08:47,  2.93it/s][A
Epoch 1/5:  30%|██▉       | 661/2208 [03:56<08:58,  2.88it/s][A
Epoch 1/5:  30%|██▉       | 662/2208 [03:56<08:57,  2.88it/s][A
Epoch 1/5:  30%|███       | 663/2208 [03:57<09:06,  2.83it/s][A
Epoch 1/5:  30%|███       | 664/2208 [03:57<09:09,  2.81it/s][A
Epoch 1/5:  30%|███       | 665/2208 [03:57<09:02,  2.85it/s][A
Epoch 1/5:  30%|███       | 666/2208 [03:58<09:11,  2.80it/s][A
Epoch 1/5:  30%|███     

Batch 675: Training accuracy = 0.7578, F1 = 0.7270, Precision = 0.7171, Recall = 0.7578



Epoch 1/5:  31%|███       | 677/2208 [04:02<09:14,  2.76it/s][A
Epoch 1/5:  31%|███       | 678/2208 [04:02<09:06,  2.80it/s][A
Epoch 1/5:  31%|███       | 679/2208 [04:02<09:10,  2.78it/s][A
Epoch 1/5:  31%|███       | 680/2208 [04:03<08:58,  2.83it/s][A
Epoch 1/5:  31%|███       | 681/2208 [04:03<08:51,  2.87it/s][A
Epoch 1/5:  31%|███       | 682/2208 [04:03<08:55,  2.85it/s][A
Epoch 1/5:  31%|███       | 683/2208 [04:04<09:22,  2.71it/s][A
Epoch 1/5:  31%|███       | 684/2208 [04:04<09:12,  2.76it/s][A
Epoch 1/5:  31%|███       | 685/2208 [04:04<09:07,  2.78it/s][A
Epoch 1/5:  31%|███       | 686/2208 [04:05<09:02,  2.81it/s][A
Epoch 1/5:  31%|███       | 687/2208 [04:05<09:05,  2.79it/s][A
Epoch 1/5:  31%|███       | 688/2208 [04:06<09:02,  2.80it/s][A
Epoch 1/5:  31%|███       | 689/2208 [04:06<09:06,  2.78it/s][A
Epoch 1/5:  31%|███▏      | 690/2208 [04:06<09:15,  2.73it/s][A
Epoch 1/5:  31%|███▏      | 691/2208 [04:07<09:03,  2.79it/s][A
Epoch 1/5:  31%|███▏    

Batch 700: Training accuracy = 0.7422, F1 = 0.7401, Precision = 0.7585, Recall = 0.7422



Epoch 1/5:  32%|███▏      | 702/2208 [04:11<09:07,  2.75it/s][A
Epoch 1/5:  32%|███▏      | 703/2208 [04:11<08:54,  2.82it/s][A
Epoch 1/5:  32%|███▏      | 704/2208 [04:11<09:01,  2.78it/s][A
Epoch 1/5:  32%|███▏      | 705/2208 [04:12<08:53,  2.82it/s][A
Epoch 1/5:  32%|███▏      | 706/2208 [04:12<08:46,  2.85it/s][A
Epoch 1/5:  32%|███▏      | 707/2208 [04:12<08:46,  2.85it/s][A
Epoch 1/5:  32%|███▏      | 708/2208 [04:13<08:57,  2.79it/s][A
Epoch 1/5:  32%|███▏      | 709/2208 [04:13<09:12,  2.71it/s][A
Epoch 1/5:  32%|███▏      | 710/2208 [04:13<08:59,  2.78it/s][A
Epoch 1/5:  32%|███▏      | 711/2208 [04:14<08:56,  2.79it/s][A
Epoch 1/5:  32%|███▏      | 712/2208 [04:14<08:57,  2.78it/s][A
Epoch 1/5:  32%|███▏      | 713/2208 [04:14<08:47,  2.83it/s][A
Epoch 1/5:  32%|███▏      | 714/2208 [04:15<08:58,  2.78it/s][A
Epoch 1/5:  32%|███▏      | 715/2208 [04:15<08:59,  2.77it/s][A
Epoch 1/5:  32%|███▏      | 716/2208 [04:16<09:02,  2.75it/s][A
Epoch 1/5:  32%|███▏    

Batch 725: Training accuracy = 0.7812, F1 = 0.7508, Precision = 0.7513, Recall = 0.7812



Epoch 1/5:  33%|███▎      | 727/2208 [04:20<09:22,  2.63it/s][A
Epoch 1/5:  33%|███▎      | 728/2208 [04:20<09:03,  2.72it/s][A
Epoch 1/5:  33%|███▎      | 729/2208 [04:20<08:52,  2.78it/s][A
Epoch 1/5:  33%|███▎      | 730/2208 [04:21<08:57,  2.75it/s][A
Epoch 1/5:  33%|███▎      | 731/2208 [04:21<09:00,  2.73it/s][A
Epoch 1/5:  33%|███▎      | 732/2208 [04:21<08:51,  2.78it/s][A
Epoch 1/5:  33%|███▎      | 733/2208 [04:22<08:43,  2.82it/s][A
Epoch 1/5:  33%|███▎      | 734/2208 [04:22<08:43,  2.82it/s][A
Epoch 1/5:  33%|███▎      | 735/2208 [04:22<08:45,  2.80it/s][A
Epoch 1/5:  33%|███▎      | 736/2208 [04:23<08:48,  2.78it/s][A
Epoch 1/5:  33%|███▎      | 737/2208 [04:23<08:38,  2.83it/s][A
Epoch 1/5:  33%|███▎      | 738/2208 [04:23<08:31,  2.87it/s][A
Epoch 1/5:  33%|███▎      | 739/2208 [04:24<08:26,  2.90it/s][A
Epoch 1/5:  34%|███▎      | 740/2208 [04:24<08:26,  2.90it/s][A
Epoch 1/5:  34%|███▎      | 741/2208 [04:24<08:22,  2.92it/s][A
Epoch 1/5:  34%|███▎    

Batch 750: Training accuracy = 0.7656, F1 = 0.7445, Precision = 0.7448, Recall = 0.7656



Epoch 1/5:  34%|███▍      | 752/2208 [04:28<08:44,  2.78it/s][A
Epoch 1/5:  34%|███▍      | 753/2208 [04:29<08:35,  2.82it/s][A
Epoch 1/5:  34%|███▍      | 754/2208 [04:29<08:27,  2.86it/s][A
Epoch 1/5:  34%|███▍      | 755/2208 [04:29<08:23,  2.89it/s][A
Epoch 1/5:  34%|███▍      | 756/2208 [04:30<08:20,  2.90it/s][A
Epoch 1/5:  34%|███▍      | 757/2208 [04:30<08:17,  2.92it/s][A
Epoch 1/5:  34%|███▍      | 758/2208 [04:30<08:15,  2.93it/s][A
Epoch 1/5:  34%|███▍      | 759/2208 [04:31<08:12,  2.94it/s][A
Epoch 1/5:  34%|███▍      | 760/2208 [04:31<08:10,  2.95it/s][A
Epoch 1/5:  34%|███▍      | 761/2208 [04:31<08:14,  2.92it/s][A
Epoch 1/5:  35%|███▍      | 762/2208 [04:32<08:13,  2.93it/s][A
Epoch 1/5:  35%|███▍      | 763/2208 [04:32<08:14,  2.92it/s][A
Epoch 1/5:  35%|███▍      | 764/2208 [04:33<08:29,  2.84it/s][A
Epoch 1/5:  35%|███▍      | 765/2208 [04:33<08:24,  2.86it/s][A
Epoch 1/5:  35%|███▍      | 766/2208 [04:33<08:20,  2.88it/s][A
Epoch 1/5:  35%|███▍    

Batch 775: Training accuracy = 0.7734, F1 = 0.7485, Precision = 0.7517, Recall = 0.7734



Epoch 1/5:  35%|███▌      | 777/2208 [04:37<08:52,  2.69it/s][A
Epoch 1/5:  35%|███▌      | 778/2208 [04:38<08:38,  2.76it/s][A
Epoch 1/5:  35%|███▌      | 779/2208 [04:38<08:28,  2.81it/s][A
Epoch 1/5:  35%|███▌      | 780/2208 [04:38<08:26,  2.82it/s][A
Epoch 1/5:  35%|███▌      | 781/2208 [04:39<08:35,  2.77it/s][A
Epoch 1/5:  35%|███▌      | 782/2208 [04:39<08:26,  2.82it/s][A
Epoch 1/5:  35%|███▌      | 783/2208 [04:39<08:19,  2.85it/s][A
Epoch 1/5:  36%|███▌      | 784/2208 [04:40<08:13,  2.88it/s][A
Epoch 1/5:  36%|███▌      | 785/2208 [04:40<08:11,  2.90it/s][A
Epoch 1/5:  36%|███▌      | 786/2208 [04:40<08:18,  2.85it/s][A
Epoch 1/5:  36%|███▌      | 787/2208 [04:41<08:11,  2.89it/s][A
Epoch 1/5:  36%|███▌      | 788/2208 [04:41<08:08,  2.91it/s][A
Epoch 1/5:  36%|███▌      | 789/2208 [04:41<08:07,  2.91it/s][A
Epoch 1/5:  36%|███▌      | 790/2208 [04:42<08:03,  2.93it/s][A
Epoch 1/5:  36%|███▌      | 791/2208 [04:42<08:01,  2.94it/s][A
Epoch 1/5:  36%|███▌    

Batch 800: Training accuracy = 0.7891, F1 = 0.7510, Precision = 0.7333, Recall = 0.7891



Epoch 1/5:  36%|███▋      | 802/2208 [04:46<08:08,  2.88it/s][A
Epoch 1/5:  36%|███▋      | 803/2208 [04:46<08:16,  2.83it/s][A
Epoch 1/5:  36%|███▋      | 804/2208 [04:47<08:27,  2.77it/s][A
Epoch 1/5:  36%|███▋      | 805/2208 [04:47<08:24,  2.78it/s][A
Epoch 1/5:  37%|███▋      | 806/2208 [04:48<08:30,  2.74it/s][A
Epoch 1/5:  37%|███▋      | 807/2208 [04:48<08:22,  2.79it/s][A
Epoch 1/5:  37%|███▋      | 808/2208 [04:48<08:31,  2.74it/s][A
Epoch 1/5:  37%|███▋      | 809/2208 [04:49<08:48,  2.65it/s][A
Epoch 1/5:  37%|███▋      | 810/2208 [04:49<08:32,  2.73it/s][A
Epoch 1/5:  37%|███▋      | 811/2208 [04:49<08:39,  2.69it/s][A
Epoch 1/5:  37%|███▋      | 812/2208 [04:50<08:34,  2.72it/s][A
Epoch 1/5:  37%|███▋      | 813/2208 [04:50<08:23,  2.77it/s][A
Epoch 1/5:  37%|███▋      | 814/2208 [04:50<08:18,  2.80it/s][A
Epoch 1/5:  37%|███▋      | 815/2208 [04:51<08:15,  2.81it/s][A
Epoch 1/5:  37%|███▋      | 816/2208 [04:51<08:09,  2.84it/s][A
Epoch 1/5:  37%|███▋    

Batch 825: Training accuracy = 0.7891, F1 = 0.7501, Precision = 0.7393, Recall = 0.7891



Epoch 1/5:  37%|███▋      | 827/2208 [04:55<08:02,  2.86it/s][A
Epoch 1/5:  38%|███▊      | 828/2208 [04:55<08:19,  2.76it/s][A
Epoch 1/5:  38%|███▊      | 829/2208 [04:56<08:09,  2.82it/s][A
Epoch 1/5:  38%|███▊      | 830/2208 [04:56<08:16,  2.77it/s][A
Epoch 1/5:  38%|███▊      | 831/2208 [04:56<08:06,  2.83it/s][A
Epoch 1/5:  38%|███▊      | 832/2208 [04:57<08:10,  2.80it/s][A
Epoch 1/5:  38%|███▊      | 833/2208 [04:57<08:03,  2.85it/s][A
Epoch 1/5:  38%|███▊      | 834/2208 [04:57<08:13,  2.79it/s][A
Epoch 1/5:  38%|███▊      | 835/2208 [04:58<08:16,  2.76it/s][A
Epoch 1/5:  38%|███▊      | 836/2208 [04:58<08:09,  2.80it/s][A
Epoch 1/5:  38%|███▊      | 837/2208 [04:59<08:02,  2.84it/s][A
Epoch 1/5:  38%|███▊      | 838/2208 [04:59<07:56,  2.87it/s][A
Epoch 1/5:  38%|███▊      | 839/2208 [04:59<08:04,  2.83it/s][A
Epoch 1/5:  38%|███▊      | 840/2208 [05:00<07:57,  2.86it/s][A
Epoch 1/5:  38%|███▊      | 841/2208 [05:00<07:52,  2.89it/s][A
Epoch 1/5:  38%|███▊    

Batch 850: Training accuracy = 0.7422, F1 = 0.7201, Precision = 0.7253, Recall = 0.7422



Epoch 1/5:  39%|███▊      | 852/2208 [05:04<08:17,  2.73it/s][A
Epoch 1/5:  39%|███▊      | 853/2208 [05:04<08:21,  2.70it/s][A
Epoch 1/5:  39%|███▊      | 854/2208 [05:05<08:12,  2.75it/s][A
Epoch 1/5:  39%|███▊      | 855/2208 [05:05<08:00,  2.81it/s][A
Epoch 1/5:  39%|███▉      | 856/2208 [05:05<07:54,  2.85it/s][A
Epoch 1/5:  39%|███▉      | 857/2208 [05:06<08:04,  2.79it/s][A
Epoch 1/5:  39%|███▉      | 858/2208 [05:06<07:56,  2.83it/s][A
Epoch 1/5:  39%|███▉      | 859/2208 [05:06<07:50,  2.87it/s][A
Epoch 1/5:  39%|███▉      | 860/2208 [05:07<07:45,  2.89it/s][A
Epoch 1/5:  39%|███▉      | 861/2208 [05:07<07:47,  2.88it/s][A
Epoch 1/5:  39%|███▉      | 862/2208 [05:07<07:52,  2.85it/s][A
Epoch 1/5:  39%|███▉      | 863/2208 [05:08<07:59,  2.80it/s][A
Epoch 1/5:  39%|███▉      | 864/2208 [05:08<07:53,  2.84it/s][A
Epoch 1/5:  39%|███▉      | 865/2208 [05:08<07:48,  2.87it/s][A
Epoch 1/5:  39%|███▉      | 866/2208 [05:09<07:49,  2.86it/s][A
Epoch 1/5:  39%|███▉    

Batch 875: Training accuracy = 0.8047, F1 = 0.7753, Precision = 0.7728, Recall = 0.8047



Epoch 1/5:  40%|███▉      | 877/2208 [05:13<08:00,  2.77it/s][A
Epoch 1/5:  40%|███▉      | 878/2208 [05:13<07:50,  2.83it/s][A
Epoch 1/5:  40%|███▉      | 879/2208 [05:13<07:53,  2.81it/s][A
Epoch 1/5:  40%|███▉      | 880/2208 [05:14<07:48,  2.83it/s][A
Epoch 1/5:  40%|███▉      | 881/2208 [05:14<07:56,  2.78it/s][A
Epoch 1/5:  40%|███▉      | 882/2208 [05:14<07:50,  2.82it/s][A
Epoch 1/5:  40%|███▉      | 883/2208 [05:15<07:51,  2.81it/s][A
Epoch 1/5:  40%|████      | 884/2208 [05:15<07:46,  2.84it/s][A
Epoch 1/5:  40%|████      | 885/2208 [05:15<07:41,  2.86it/s][A
Epoch 1/5:  40%|████      | 886/2208 [05:16<07:45,  2.84it/s][A
Epoch 1/5:  40%|████      | 887/2208 [05:16<07:40,  2.87it/s][A
Epoch 1/5:  40%|████      | 888/2208 [05:17<07:36,  2.89it/s][A
Epoch 1/5:  40%|████      | 889/2208 [05:17<07:32,  2.92it/s][A
Epoch 1/5:  40%|████      | 890/2208 [05:17<07:31,  2.92it/s][A
Epoch 1/5:  40%|████      | 891/2208 [05:18<07:35,  2.89it/s][A
Epoch 1/5:  40%|████    

Batch 900: Training accuracy = 0.8203, F1 = 0.8125, Precision = 0.8242, Recall = 0.8203



Epoch 1/5:  41%|████      | 902/2208 [05:22<08:09,  2.67it/s][A
Epoch 1/5:  41%|████      | 903/2208 [05:22<08:18,  2.62it/s][A
Epoch 1/5:  41%|████      | 904/2208 [05:22<08:03,  2.70it/s][A
Epoch 1/5:  41%|████      | 905/2208 [05:23<07:52,  2.76it/s][A
Epoch 1/5:  41%|████      | 906/2208 [05:23<07:53,  2.75it/s][A
Epoch 1/5:  41%|████      | 907/2208 [05:23<07:51,  2.76it/s][A
Epoch 1/5:  41%|████      | 908/2208 [05:24<07:41,  2.81it/s][A
Epoch 1/5:  41%|████      | 909/2208 [05:24<07:54,  2.74it/s][A
Epoch 1/5:  41%|████      | 910/2208 [05:24<07:58,  2.71it/s][A
Epoch 1/5:  41%|████▏     | 911/2208 [05:25<07:48,  2.77it/s][A
Epoch 1/5:  41%|████▏     | 912/2208 [05:25<07:54,  2.73it/s][A
Epoch 1/5:  41%|████▏     | 913/2208 [05:26<07:43,  2.79it/s][A
Epoch 1/5:  41%|████▏     | 914/2208 [05:26<07:48,  2.76it/s][A
Epoch 1/5:  41%|████▏     | 915/2208 [05:26<07:45,  2.78it/s][A
Epoch 1/5:  41%|████▏     | 916/2208 [05:27<07:48,  2.76it/s][A
Epoch 1/5:  42%|████▏   

Batch 925: Training accuracy = 0.8516, F1 = 0.8281, Precision = 0.8229, Recall = 0.8516



Epoch 1/5:  42%|████▏     | 927/2208 [05:30<07:31,  2.84it/s][A
Epoch 1/5:  42%|████▏     | 928/2208 [05:31<07:25,  2.88it/s][A
Epoch 1/5:  42%|████▏     | 929/2208 [05:31<07:20,  2.91it/s][A
Epoch 1/5:  42%|████▏     | 930/2208 [05:31<07:19,  2.91it/s][A
Epoch 1/5:  42%|████▏     | 931/2208 [05:32<07:25,  2.87it/s][A
Epoch 1/5:  42%|████▏     | 932/2208 [05:32<07:24,  2.87it/s][A
Epoch 1/5:  42%|████▏     | 933/2208 [05:33<07:32,  2.82it/s][A
Epoch 1/5:  42%|████▏     | 934/2208 [05:33<07:25,  2.86it/s][A
Epoch 1/5:  42%|████▏     | 935/2208 [05:33<07:25,  2.86it/s][A
Epoch 1/5:  42%|████▏     | 936/2208 [05:34<07:34,  2.80it/s][A
Epoch 1/5:  42%|████▏     | 937/2208 [05:34<07:31,  2.82it/s][A
Epoch 1/5:  42%|████▏     | 938/2208 [05:34<07:29,  2.83it/s][A
Epoch 1/5:  43%|████▎     | 939/2208 [05:35<07:35,  2.79it/s][A
Epoch 1/5:  43%|████▎     | 940/2208 [05:35<07:26,  2.84it/s][A
Epoch 1/5:  43%|████▎     | 941/2208 [05:35<07:45,  2.72it/s][A
Epoch 1/5:  43%|████▎   

Batch 950: Training accuracy = 0.7500, F1 = 0.7357, Precision = 0.7451, Recall = 0.7500



Epoch 1/5:  43%|████▎     | 952/2208 [05:39<07:20,  2.85it/s][A
Epoch 1/5:  43%|████▎     | 953/2208 [05:40<07:37,  2.74it/s][A
Epoch 1/5:  43%|████▎     | 954/2208 [05:40<07:30,  2.78it/s][A
Epoch 1/5:  43%|████▎     | 955/2208 [05:40<07:34,  2.76it/s][A
Epoch 1/5:  43%|████▎     | 956/2208 [05:41<07:38,  2.73it/s][A
Epoch 1/5:  43%|████▎     | 957/2208 [05:41<07:29,  2.78it/s][A
Epoch 1/5:  43%|████▎     | 958/2208 [05:41<07:21,  2.83it/s][A
Epoch 1/5:  43%|████▎     | 959/2208 [05:42<07:23,  2.82it/s][A
Epoch 1/5:  43%|████▎     | 960/2208 [05:42<07:19,  2.84it/s][A
Epoch 1/5:  44%|████▎     | 961/2208 [05:43<07:23,  2.81it/s][A
Epoch 1/5:  44%|████▎     | 962/2208 [05:43<07:16,  2.86it/s][A
Epoch 1/5:  44%|████▎     | 963/2208 [05:43<07:22,  2.81it/s][A
Epoch 1/5:  44%|████▎     | 964/2208 [05:44<07:18,  2.84it/s][A
Epoch 1/5:  44%|████▎     | 965/2208 [05:44<07:14,  2.86it/s][A
Epoch 1/5:  44%|████▍     | 966/2208 [05:44<07:12,  2.87it/s][A
Epoch 1/5:  44%|████▍   

Batch 975: Training accuracy = 0.7500, F1 = 0.7219, Precision = 0.7240, Recall = 0.7500



Epoch 1/5:  44%|████▍     | 977/2208 [05:48<07:26,  2.76it/s][A
Epoch 1/5:  44%|████▍     | 978/2208 [05:49<07:26,  2.75it/s][A
Epoch 1/5:  44%|████▍     | 979/2208 [05:49<07:19,  2.80it/s][A
Epoch 1/5:  44%|████▍     | 980/2208 [05:49<07:15,  2.82it/s][A
Epoch 1/5:  44%|████▍     | 981/2208 [05:50<07:12,  2.84it/s][A
Epoch 1/5:  44%|████▍     | 982/2208 [05:50<07:09,  2.85it/s][A
Epoch 1/5:  45%|████▍     | 983/2208 [05:50<07:21,  2.77it/s][A
Epoch 1/5:  45%|████▍     | 984/2208 [05:51<07:21,  2.77it/s][A
Epoch 1/5:  45%|████▍     | 985/2208 [05:51<07:23,  2.76it/s][A
Epoch 1/5:  45%|████▍     | 986/2208 [05:51<07:19,  2.78it/s][A
Epoch 1/5:  45%|████▍     | 987/2208 [05:52<07:20,  2.77it/s][A
Epoch 1/5:  45%|████▍     | 988/2208 [05:52<07:11,  2.83it/s][A
Epoch 1/5:  45%|████▍     | 989/2208 [05:52<07:05,  2.86it/s][A
Epoch 1/5:  45%|████▍     | 990/2208 [05:53<07:11,  2.82it/s][A
Epoch 1/5:  45%|████▍     | 991/2208 [05:53<07:19,  2.77it/s][A
Epoch 1/5:  45%|████▍   

Batch 1000: Training accuracy = 0.7812, F1 = 0.7603, Precision = 0.7814, Recall = 0.7812



Epoch 1/5:  45%|████▌     | 1002/2208 [05:57<06:55,  2.90it/s][A
Epoch 1/5:  45%|████▌     | 1003/2208 [05:57<07:00,  2.87it/s][A
Epoch 1/5:  45%|████▌     | 1004/2208 [05:58<06:55,  2.90it/s][A
Epoch 1/5:  46%|████▌     | 1005/2208 [05:58<06:52,  2.92it/s][A
Epoch 1/5:  46%|████▌     | 1006/2208 [05:58<06:50,  2.93it/s][A
Epoch 1/5:  46%|████▌     | 1007/2208 [05:59<06:48,  2.94it/s][A
Epoch 1/5:  46%|████▌     | 1008/2208 [05:59<06:54,  2.89it/s][A
Epoch 1/5:  46%|████▌     | 1009/2208 [05:59<06:51,  2.91it/s][A
Epoch 1/5:  46%|████▌     | 1010/2208 [06:00<06:49,  2.93it/s][A
Epoch 1/5:  46%|████▌     | 1011/2208 [06:00<06:47,  2.94it/s][A
Epoch 1/5:  46%|████▌     | 1012/2208 [06:00<06:46,  2.94it/s][A
Epoch 1/5:  46%|████▌     | 1013/2208 [06:01<06:44,  2.95it/s][A
Epoch 1/5:  46%|████▌     | 1014/2208 [06:01<06:47,  2.93it/s][A
Epoch 1/5:  46%|████▌     | 1015/2208 [06:02<06:58,  2.85it/s][A
Epoch 1/5:  46%|████▌     | 1016/2208 [06:02<06:58,  2.85it/s][A
Epoch 1/5

Batch 1025: Training accuracy = 0.7578, F1 = 0.7294, Precision = 0.7201, Recall = 0.7578



Epoch 1/5:  47%|████▋     | 1027/2208 [06:06<06:56,  2.83it/s][A
Epoch 1/5:  47%|████▋     | 1028/2208 [06:06<06:52,  2.86it/s][A
Epoch 1/5:  47%|████▋     | 1029/2208 [06:07<06:49,  2.88it/s][A
Epoch 1/5:  47%|████▋     | 1030/2208 [06:07<06:45,  2.90it/s][A
Epoch 1/5:  47%|████▋     | 1031/2208 [06:07<06:53,  2.85it/s][A
Epoch 1/5:  47%|████▋     | 1032/2208 [06:08<06:48,  2.88it/s][A
Epoch 1/5:  47%|████▋     | 1033/2208 [06:08<06:53,  2.84it/s][A
Epoch 1/5:  47%|████▋     | 1034/2208 [06:08<06:50,  2.86it/s][A
Epoch 1/5:  47%|████▋     | 1035/2208 [06:09<06:53,  2.84it/s][A
Epoch 1/5:  47%|████▋     | 1036/2208 [06:09<06:47,  2.88it/s][A
Epoch 1/5:  47%|████▋     | 1037/2208 [06:09<06:44,  2.90it/s][A
Epoch 1/5:  47%|████▋     | 1038/2208 [06:10<06:42,  2.90it/s][A
Epoch 1/5:  47%|████▋     | 1039/2208 [06:10<06:39,  2.92it/s][A
Epoch 1/5:  47%|████▋     | 1040/2208 [06:10<06:37,  2.94it/s][A
Epoch 1/5:  47%|████▋     | 1041/2208 [06:11<06:46,  2.87it/s][A
Epoch 1/5

Batch 1050: Training accuracy = 0.7969, F1 = 0.7721, Precision = 0.7783, Recall = 0.7969



Epoch 1/5:  48%|████▊     | 1052/2208 [06:15<06:57,  2.77it/s][A
Epoch 1/5:  48%|████▊     | 1053/2208 [06:15<06:58,  2.76it/s][A
Epoch 1/5:  48%|████▊     | 1054/2208 [06:16<07:01,  2.74it/s][A
Epoch 1/5:  48%|████▊     | 1055/2208 [06:16<06:52,  2.80it/s][A
Epoch 1/5:  48%|████▊     | 1056/2208 [06:16<06:45,  2.84it/s][A
Epoch 1/5:  48%|████▊     | 1057/2208 [06:17<06:42,  2.86it/s][A
Epoch 1/5:  48%|████▊     | 1058/2208 [06:17<06:39,  2.88it/s][A
Epoch 1/5:  48%|████▊     | 1059/2208 [06:17<06:35,  2.90it/s][A
Epoch 1/5:  48%|████▊     | 1060/2208 [06:18<06:42,  2.85it/s][A
Epoch 1/5:  48%|████▊     | 1061/2208 [06:18<06:37,  2.89it/s][A
Epoch 1/5:  48%|████▊     | 1062/2208 [06:18<06:44,  2.84it/s][A
Epoch 1/5:  48%|████▊     | 1063/2208 [06:19<06:42,  2.84it/s][A
Epoch 1/5:  48%|████▊     | 1064/2208 [06:19<06:52,  2.77it/s][A
Epoch 1/5:  48%|████▊     | 1065/2208 [06:19<06:59,  2.72it/s][A
Epoch 1/5:  48%|████▊     | 1066/2208 [06:20<07:02,  2.70it/s][A
Epoch 1/5

Batch 1075: Training accuracy = 0.8281, F1 = 0.8055, Precision = 0.8060, Recall = 0.8281



Epoch 1/5:  49%|████▉     | 1077/2208 [06:24<06:52,  2.74it/s][A
Epoch 1/5:  49%|████▉     | 1078/2208 [06:24<06:50,  2.75it/s][A
Epoch 1/5:  49%|████▉     | 1079/2208 [06:24<06:44,  2.79it/s][A
Epoch 1/5:  49%|████▉     | 1080/2208 [06:25<06:44,  2.79it/s][A
Epoch 1/5:  49%|████▉     | 1081/2208 [06:25<06:55,  2.71it/s][A
Epoch 1/5:  49%|████▉     | 1082/2208 [06:26<06:54,  2.72it/s][A
Epoch 1/5:  49%|████▉     | 1083/2208 [06:26<06:43,  2.79it/s][A
Epoch 1/5:  49%|████▉     | 1084/2208 [06:26<06:45,  2.77it/s][A
Epoch 1/5:  49%|████▉     | 1085/2208 [06:27<06:48,  2.75it/s][A
Epoch 1/5:  49%|████▉     | 1086/2208 [06:27<06:44,  2.77it/s][A
Epoch 1/5:  49%|████▉     | 1087/2208 [06:27<06:37,  2.82it/s][A
Epoch 1/5:  49%|████▉     | 1088/2208 [06:28<06:34,  2.84it/s][A
Epoch 1/5:  49%|████▉     | 1089/2208 [06:28<06:30,  2.87it/s][A
Epoch 1/5:  49%|████▉     | 1090/2208 [06:28<06:27,  2.89it/s][A
Epoch 1/5:  49%|████▉     | 1091/2208 [06:29<06:24,  2.90it/s][A
Epoch 1/5

Batch 1100: Training accuracy = 0.8125, F1 = 0.8013, Precision = 0.8275, Recall = 0.8125



Epoch 1/5:  50%|████▉     | 1102/2208 [06:33<06:42,  2.74it/s][A
Epoch 1/5:  50%|████▉     | 1103/2208 [06:33<06:34,  2.80it/s][A
Epoch 1/5:  50%|█████     | 1104/2208 [06:33<06:34,  2.79it/s][A
Epoch 1/5:  50%|█████     | 1105/2208 [06:34<06:40,  2.76it/s][A
Epoch 1/5:  50%|█████     | 1106/2208 [06:34<06:36,  2.78it/s][A
Epoch 1/5:  50%|█████     | 1107/2208 [06:34<06:32,  2.81it/s][A
Epoch 1/5:  50%|█████     | 1108/2208 [06:35<06:25,  2.86it/s][A
Epoch 1/5:  50%|█████     | 1109/2208 [06:35<06:33,  2.80it/s][A
Epoch 1/5:  50%|█████     | 1110/2208 [06:35<06:30,  2.81it/s][A
Epoch 1/5:  50%|█████     | 1111/2208 [06:36<06:33,  2.79it/s][A
Epoch 1/5:  50%|█████     | 1112/2208 [06:36<06:41,  2.73it/s][A
Epoch 1/5:  50%|█████     | 1113/2208 [06:37<06:31,  2.80it/s][A
Epoch 1/5:  50%|█████     | 1114/2208 [06:37<06:23,  2.85it/s][A
Epoch 1/5:  50%|█████     | 1115/2208 [06:37<06:20,  2.87it/s][A
Epoch 1/5:  51%|█████     | 1116/2208 [06:38<06:35,  2.76it/s][A
Epoch 1/5

Batch 1125: Training accuracy = 0.7969, F1 = 0.7774, Precision = 0.7793, Recall = 0.7969



Epoch 1/5:  51%|█████     | 1127/2208 [06:41<06:09,  2.92it/s][A
Epoch 1/5:  51%|█████     | 1128/2208 [06:42<06:22,  2.82it/s][A
Epoch 1/5:  51%|█████     | 1129/2208 [06:42<06:17,  2.86it/s][A
Epoch 1/5:  51%|█████     | 1130/2208 [06:42<06:15,  2.87it/s][A
Epoch 1/5:  51%|█████     | 1131/2208 [06:43<06:20,  2.83it/s][A
Epoch 1/5:  51%|█████▏    | 1132/2208 [06:43<06:17,  2.85it/s][A
Epoch 1/5:  51%|█████▏    | 1133/2208 [06:44<06:19,  2.83it/s][A
Epoch 1/5:  51%|█████▏    | 1134/2208 [06:44<06:16,  2.85it/s][A
Epoch 1/5:  51%|█████▏    | 1135/2208 [06:44<06:13,  2.87it/s][A
Epoch 1/5:  51%|█████▏    | 1136/2208 [06:45<06:21,  2.81it/s][A
Epoch 1/5:  51%|█████▏    | 1137/2208 [06:45<06:15,  2.85it/s][A
Epoch 1/5:  52%|█████▏    | 1138/2208 [06:45<06:12,  2.87it/s][A
Epoch 1/5:  52%|█████▏    | 1139/2208 [06:46<06:12,  2.87it/s][A
Epoch 1/5:  52%|█████▏    | 1140/2208 [06:46<06:09,  2.89it/s][A
Epoch 1/5:  52%|█████▏    | 1141/2208 [06:46<06:18,  2.82it/s][A
Epoch 1/5

Batch 1150: Training accuracy = 0.8125, F1 = 0.7880, Precision = 0.7865, Recall = 0.8125



Epoch 1/5:  52%|█████▏    | 1152/2208 [06:50<06:05,  2.89it/s][A
Epoch 1/5:  52%|█████▏    | 1153/2208 [06:51<06:03,  2.90it/s][A
Epoch 1/5:  52%|█████▏    | 1154/2208 [06:51<06:04,  2.89it/s][A
Epoch 1/5:  52%|█████▏    | 1155/2208 [06:51<06:01,  2.91it/s][A
Epoch 1/5:  52%|█████▏    | 1156/2208 [06:52<05:59,  2.93it/s][A
Epoch 1/5:  52%|█████▏    | 1157/2208 [06:52<05:57,  2.94it/s][A
Epoch 1/5:  52%|█████▏    | 1158/2208 [06:52<06:10,  2.83it/s][A
Epoch 1/5:  52%|█████▏    | 1159/2208 [06:53<06:05,  2.87it/s][A
Epoch 1/5:  53%|█████▎    | 1160/2208 [06:53<06:01,  2.90it/s][A
Epoch 1/5:  53%|█████▎    | 1161/2208 [06:53<05:59,  2.91it/s][A
Epoch 1/5:  53%|█████▎    | 1162/2208 [06:54<05:57,  2.93it/s][A
Epoch 1/5:  53%|█████▎    | 1163/2208 [06:54<05:54,  2.94it/s][A
Epoch 1/5:  53%|█████▎    | 1164/2208 [06:54<05:55,  2.94it/s][A
Epoch 1/5:  53%|█████▎    | 1165/2208 [06:55<05:55,  2.93it/s][A
Epoch 1/5:  53%|█████▎    | 1166/2208 [06:55<05:58,  2.91it/s][A
Epoch 1/5

Batch 1175: Training accuracy = 0.8203, F1 = 0.8060, Precision = 0.8069, Recall = 0.8203



Epoch 1/5:  53%|█████▎    | 1177/2208 [06:59<05:59,  2.87it/s][A
Epoch 1/5:  53%|█████▎    | 1178/2208 [06:59<06:00,  2.85it/s][A
Epoch 1/5:  53%|█████▎    | 1179/2208 [07:00<06:07,  2.80it/s][A
Epoch 1/5:  53%|█████▎    | 1180/2208 [07:00<06:08,  2.79it/s][A
Epoch 1/5:  53%|█████▎    | 1181/2208 [07:00<06:03,  2.83it/s][A
Epoch 1/5:  54%|█████▎    | 1182/2208 [07:01<05:58,  2.86it/s][A
Epoch 1/5:  54%|█████▎    | 1183/2208 [07:01<05:56,  2.88it/s][A
Epoch 1/5:  54%|█████▎    | 1184/2208 [07:01<05:54,  2.89it/s][A
Epoch 1/5:  54%|█████▎    | 1185/2208 [07:02<06:03,  2.82it/s][A
Epoch 1/5:  54%|█████▎    | 1186/2208 [07:02<05:59,  2.84it/s][A
Epoch 1/5:  54%|█████▍    | 1187/2208 [07:02<05:57,  2.86it/s][A
Epoch 1/5:  54%|█████▍    | 1188/2208 [07:03<06:01,  2.82it/s][A
Epoch 1/5:  54%|█████▍    | 1189/2208 [07:03<06:01,  2.82it/s][A
Epoch 1/5:  54%|█████▍    | 1190/2208 [07:03<06:09,  2.76it/s][A
Epoch 1/5:  54%|█████▍    | 1191/2208 [07:04<06:03,  2.80it/s][A
Epoch 1/5

Batch 1200: Training accuracy = 0.7656, F1 = 0.7493, Precision = 0.7576, Recall = 0.7656



Epoch 1/5:  54%|█████▍    | 1202/2208 [07:08<05:52,  2.85it/s][A
Epoch 1/5:  54%|█████▍    | 1203/2208 [07:08<05:48,  2.89it/s][A
Epoch 1/5:  55%|█████▍    | 1204/2208 [07:08<05:53,  2.84it/s][A
Epoch 1/5:  55%|█████▍    | 1205/2208 [07:09<05:51,  2.85it/s][A
Epoch 1/5:  55%|█████▍    | 1206/2208 [07:09<05:56,  2.81it/s][A
Epoch 1/5:  55%|█████▍    | 1207/2208 [07:09<06:00,  2.78it/s][A
Epoch 1/5:  55%|█████▍    | 1208/2208 [07:10<06:02,  2.76it/s][A
Epoch 1/5:  55%|█████▍    | 1209/2208 [07:10<05:55,  2.81it/s][A
Epoch 1/5:  55%|█████▍    | 1210/2208 [07:10<05:51,  2.84it/s][A
Epoch 1/5:  55%|█████▍    | 1211/2208 [07:11<05:46,  2.87it/s][A
Epoch 1/5:  55%|█████▍    | 1212/2208 [07:11<06:03,  2.74it/s][A
Epoch 1/5:  55%|█████▍    | 1213/2208 [07:12<05:55,  2.80it/s][A
Epoch 1/5:  55%|█████▍    | 1214/2208 [07:12<05:48,  2.85it/s][A
Epoch 1/5:  55%|█████▌    | 1215/2208 [07:12<05:44,  2.88it/s][A
Epoch 1/5:  55%|█████▌    | 1216/2208 [07:13<05:48,  2.84it/s][A
Epoch 1/5

Batch 1225: Training accuracy = 0.8594, F1 = 0.8497, Precision = 0.8529, Recall = 0.8594



Epoch 1/5:  56%|█████▌    | 1227/2208 [07:17<06:03,  2.70it/s][A
Epoch 1/5:  56%|█████▌    | 1228/2208 [07:17<06:00,  2.72it/s][A
Epoch 1/5:  56%|█████▌    | 1229/2208 [07:17<06:00,  2.71it/s][A
Epoch 1/5:  56%|█████▌    | 1230/2208 [07:18<06:01,  2.70it/s][A
Epoch 1/5:  56%|█████▌    | 1231/2208 [07:18<05:54,  2.75it/s][A
Epoch 1/5:  56%|█████▌    | 1232/2208 [07:18<05:54,  2.75it/s][A
Epoch 1/5:  56%|█████▌    | 1233/2208 [07:19<05:48,  2.80it/s][A
Epoch 1/5:  56%|█████▌    | 1234/2208 [07:19<05:43,  2.83it/s][A
Epoch 1/5:  56%|█████▌    | 1235/2208 [07:19<05:52,  2.76it/s][A
Epoch 1/5:  56%|█████▌    | 1236/2208 [07:20<05:49,  2.78it/s][A
Epoch 1/5:  56%|█████▌    | 1237/2208 [07:20<05:45,  2.81it/s][A
Epoch 1/5:  56%|█████▌    | 1238/2208 [07:20<05:42,  2.83it/s][A
Epoch 1/5:  56%|█████▌    | 1239/2208 [07:21<05:48,  2.78it/s][A
Epoch 1/5:  56%|█████▌    | 1240/2208 [07:21<05:42,  2.83it/s][A
Epoch 1/5:  56%|█████▌    | 1241/2208 [07:22<05:39,  2.85it/s][A
Epoch 1/5

Batch 1250: Training accuracy = 0.8359, F1 = 0.8237, Precision = 0.8294, Recall = 0.8359



Epoch 1/5:  57%|█████▋    | 1252/2208 [07:25<05:36,  2.84it/s][A
Epoch 1/5:  57%|█████▋    | 1253/2208 [07:26<05:32,  2.87it/s][A
Epoch 1/5:  57%|█████▋    | 1254/2208 [07:26<05:37,  2.83it/s][A
Epoch 1/5:  57%|█████▋    | 1255/2208 [07:26<05:41,  2.79it/s][A
Epoch 1/5:  57%|█████▋    | 1256/2208 [07:27<05:35,  2.84it/s][A
Epoch 1/5:  57%|█████▋    | 1257/2208 [07:27<05:30,  2.88it/s][A
Epoch 1/5:  57%|█████▋    | 1258/2208 [07:28<05:41,  2.78it/s][A
Epoch 1/5:  57%|█████▋    | 1259/2208 [07:28<05:34,  2.84it/s][A
Epoch 1/5:  57%|█████▋    | 1260/2208 [07:28<05:33,  2.84it/s][A
Epoch 1/5:  57%|█████▋    | 1261/2208 [07:29<05:47,  2.73it/s][A
Epoch 1/5:  57%|█████▋    | 1262/2208 [07:29<05:45,  2.74it/s][A
Epoch 1/5:  57%|█████▋    | 1263/2208 [07:29<05:37,  2.80it/s][A
Epoch 1/5:  57%|█████▋    | 1264/2208 [07:30<05:39,  2.78it/s][A
Epoch 1/5:  57%|█████▋    | 1265/2208 [07:30<05:32,  2.84it/s][A
Epoch 1/5:  57%|█████▋    | 1266/2208 [07:30<05:28,  2.86it/s][A
Epoch 1/5

Batch 1275: Training accuracy = 0.8047, F1 = 0.7875, Precision = 0.7917, Recall = 0.8047



Epoch 1/5:  58%|█████▊    | 1277/2208 [07:34<05:38,  2.75it/s][A
Epoch 1/5:  58%|█████▊    | 1278/2208 [07:35<05:37,  2.76it/s][A
Epoch 1/5:  58%|█████▊    | 1279/2208 [07:35<05:36,  2.76it/s][A
Epoch 1/5:  58%|█████▊    | 1280/2208 [07:35<05:29,  2.82it/s][A
Epoch 1/5:  58%|█████▊    | 1281/2208 [07:36<05:32,  2.78it/s][A
Epoch 1/5:  58%|█████▊    | 1282/2208 [07:36<05:28,  2.82it/s][A
Epoch 1/5:  58%|█████▊    | 1283/2208 [07:36<05:25,  2.84it/s][A
Epoch 1/5:  58%|█████▊    | 1284/2208 [07:37<05:21,  2.87it/s][A
Epoch 1/5:  58%|█████▊    | 1285/2208 [07:37<05:21,  2.87it/s][A
Epoch 1/5:  58%|█████▊    | 1286/2208 [07:38<05:18,  2.90it/s][A
Epoch 1/5:  58%|█████▊    | 1287/2208 [07:38<05:16,  2.91it/s][A
Epoch 1/5:  58%|█████▊    | 1288/2208 [07:38<05:16,  2.90it/s][A
Epoch 1/5:  58%|█████▊    | 1289/2208 [07:39<05:24,  2.83it/s][A
Epoch 1/5:  58%|█████▊    | 1290/2208 [07:39<05:26,  2.81it/s][A
Epoch 1/5:  58%|█████▊    | 1291/2208 [07:39<05:23,  2.83it/s][A
Epoch 1/5

Batch 1300: Training accuracy = 0.7500, F1 = 0.7320, Precision = 0.7402, Recall = 0.7500



Epoch 1/5:  59%|█████▉    | 1302/2208 [07:43<05:09,  2.92it/s][A
Epoch 1/5:  59%|█████▉    | 1303/2208 [07:43<05:09,  2.92it/s][A
Epoch 1/5:  59%|█████▉    | 1304/2208 [07:44<05:13,  2.89it/s][A
Epoch 1/5:  59%|█████▉    | 1305/2208 [07:44<05:10,  2.91it/s][A
Epoch 1/5:  59%|█████▉    | 1306/2208 [07:44<05:08,  2.92it/s][A
Epoch 1/5:  59%|█████▉    | 1307/2208 [07:45<05:09,  2.91it/s][A
Epoch 1/5:  59%|█████▉    | 1308/2208 [07:45<05:08,  2.92it/s][A
Epoch 1/5:  59%|█████▉    | 1309/2208 [07:45<05:08,  2.92it/s][A
Epoch 1/5:  59%|█████▉    | 1310/2208 [07:46<05:11,  2.88it/s][A
Epoch 1/5:  59%|█████▉    | 1311/2208 [07:46<05:09,  2.90it/s][A
Epoch 1/5:  59%|█████▉    | 1312/2208 [07:46<05:10,  2.89it/s][A
Epoch 1/5:  59%|█████▉    | 1313/2208 [07:47<05:17,  2.82it/s][A
Epoch 1/5:  60%|█████▉    | 1314/2208 [07:47<05:21,  2.78it/s][A
Epoch 1/5:  60%|█████▉    | 1315/2208 [07:48<05:26,  2.73it/s][A
Epoch 1/5:  60%|█████▉    | 1316/2208 [07:48<05:28,  2.72it/s][A
Epoch 1/5

Batch 1325: Training accuracy = 0.8516, F1 = 0.8339, Precision = 0.8451, Recall = 0.8516



Epoch 1/5:  60%|██████    | 1327/2208 [07:52<05:12,  2.82it/s][A
Epoch 1/5:  60%|██████    | 1328/2208 [07:52<05:14,  2.80it/s][A
Epoch 1/5:  60%|██████    | 1329/2208 [07:53<05:23,  2.72it/s][A
Epoch 1/5:  60%|██████    | 1330/2208 [07:53<05:25,  2.70it/s][A
Epoch 1/5:  60%|██████    | 1331/2208 [07:53<05:22,  2.72it/s][A
Epoch 1/5:  60%|██████    | 1332/2208 [07:54<05:21,  2.73it/s][A
Epoch 1/5:  60%|██████    | 1333/2208 [07:54<05:23,  2.71it/s][A
Epoch 1/5:  60%|██████    | 1334/2208 [07:54<05:16,  2.76it/s][A
Epoch 1/5:  60%|██████    | 1335/2208 [07:55<05:17,  2.75it/s][A
Epoch 1/5:  61%|██████    | 1336/2208 [07:55<05:15,  2.77it/s][A
Epoch 1/5:  61%|██████    | 1337/2208 [07:56<05:16,  2.75it/s][A
Epoch 1/5:  61%|██████    | 1338/2208 [07:56<05:08,  2.82it/s][A
Epoch 1/5:  61%|██████    | 1339/2208 [07:56<05:05,  2.85it/s][A
Epoch 1/5:  61%|██████    | 1340/2208 [07:57<05:02,  2.87it/s][A
Epoch 1/5:  61%|██████    | 1341/2208 [07:57<05:03,  2.85it/s][A
Epoch 1/5

Batch 1350: Training accuracy = 0.7812, F1 = 0.7625, Precision = 0.7578, Recall = 0.7812



Epoch 1/5:  61%|██████    | 1352/2208 [08:01<05:04,  2.81it/s][A
Epoch 1/5:  61%|██████▏   | 1353/2208 [08:01<05:09,  2.76it/s][A
Epoch 1/5:  61%|██████▏   | 1354/2208 [08:02<05:10,  2.75it/s][A
Epoch 1/5:  61%|██████▏   | 1355/2208 [08:02<05:05,  2.79it/s][A
Epoch 1/5:  61%|██████▏   | 1356/2208 [08:02<05:06,  2.78it/s][A
Epoch 1/5:  61%|██████▏   | 1357/2208 [08:03<05:10,  2.74it/s][A
Epoch 1/5:  62%|██████▏   | 1358/2208 [08:03<05:13,  2.71it/s][A
Epoch 1/5:  62%|██████▏   | 1359/2208 [08:03<05:09,  2.74it/s][A
Epoch 1/5:  62%|██████▏   | 1360/2208 [08:04<05:15,  2.69it/s][A
Epoch 1/5:  62%|██████▏   | 1361/2208 [08:04<05:18,  2.66it/s][A
Epoch 1/5:  62%|██████▏   | 1362/2208 [08:05<05:20,  2.64it/s][A
Epoch 1/5:  62%|██████▏   | 1363/2208 [08:05<05:10,  2.72it/s][A
Epoch 1/5:  62%|██████▏   | 1364/2208 [08:05<05:13,  2.69it/s][A
Epoch 1/5:  62%|██████▏   | 1365/2208 [08:06<05:04,  2.77it/s][A
Epoch 1/5:  62%|██████▏   | 1366/2208 [08:06<04:57,  2.83it/s][A
Epoch 1/5

Batch 1375: Training accuracy = 0.7969, F1 = 0.7735, Precision = 0.7773, Recall = 0.7969



Epoch 1/5:  62%|██████▏   | 1377/2208 [08:10<04:54,  2.82it/s][A
Epoch 1/5:  62%|██████▏   | 1378/2208 [08:10<04:51,  2.84it/s][A
Epoch 1/5:  62%|██████▏   | 1379/2208 [08:10<04:47,  2.88it/s][A
Epoch 1/5:  62%|██████▎   | 1380/2208 [08:11<04:44,  2.91it/s][A
Epoch 1/5:  63%|██████▎   | 1381/2208 [08:11<04:52,  2.83it/s][A
Epoch 1/5:  63%|██████▎   | 1382/2208 [08:12<04:50,  2.85it/s][A
Epoch 1/5:  63%|██████▎   | 1383/2208 [08:12<04:51,  2.83it/s][A
Epoch 1/5:  63%|██████▎   | 1384/2208 [08:12<04:52,  2.82it/s][A
Epoch 1/5:  63%|██████▎   | 1385/2208 [08:13<05:03,  2.71it/s][A
Epoch 1/5:  63%|██████▎   | 1386/2208 [08:13<04:56,  2.77it/s][A
Epoch 1/5:  63%|██████▎   | 1387/2208 [08:13<04:52,  2.80it/s][A
Epoch 1/5:  63%|██████▎   | 1388/2208 [08:14<04:48,  2.84it/s][A
Epoch 1/5:  63%|██████▎   | 1389/2208 [08:14<04:45,  2.87it/s][A
Epoch 1/5:  63%|██████▎   | 1390/2208 [08:14<04:42,  2.89it/s][A
Epoch 1/5:  63%|██████▎   | 1391/2208 [08:15<04:40,  2.91it/s][A
Epoch 1/5

Batch 1400: Training accuracy = 0.8516, F1 = 0.8422, Precision = 0.8398, Recall = 0.8516



Epoch 1/5:  63%|██████▎   | 1402/2208 [08:19<04:47,  2.81it/s][A
Epoch 1/5:  64%|██████▎   | 1403/2208 [08:19<04:52,  2.75it/s][A
Epoch 1/5:  64%|██████▎   | 1404/2208 [08:19<04:53,  2.74it/s][A
Epoch 1/5:  64%|██████▎   | 1405/2208 [08:20<04:46,  2.80it/s][A
Epoch 1/5:  64%|██████▎   | 1406/2208 [08:20<04:42,  2.83it/s][A
Epoch 1/5:  64%|██████▎   | 1407/2208 [08:20<04:39,  2.87it/s][A
Epoch 1/5:  64%|██████▍   | 1408/2208 [08:21<04:37,  2.89it/s][A
Epoch 1/5:  64%|██████▍   | 1409/2208 [08:21<04:37,  2.87it/s][A
Epoch 1/5:  64%|██████▍   | 1410/2208 [08:22<04:36,  2.89it/s][A
Epoch 1/5:  64%|██████▍   | 1411/2208 [08:22<04:34,  2.90it/s][A
Epoch 1/5:  64%|██████▍   | 1412/2208 [08:22<04:33,  2.91it/s][A
Epoch 1/5:  64%|██████▍   | 1413/2208 [08:23<04:32,  2.92it/s][A
Epoch 1/5:  64%|██████▍   | 1414/2208 [08:23<04:30,  2.93it/s][A
Epoch 1/5:  64%|██████▍   | 1415/2208 [08:23<04:41,  2.82it/s][A
Epoch 1/5:  64%|██████▍   | 1416/2208 [08:24<04:42,  2.80it/s][A
Epoch 1/5

Batch 1425: Training accuracy = 0.7578, F1 = 0.7449, Precision = 0.7585, Recall = 0.7578



Epoch 1/5:  65%|██████▍   | 1427/2208 [08:27<04:35,  2.83it/s][A
Epoch 1/5:  65%|██████▍   | 1428/2208 [08:28<04:32,  2.87it/s][A
Epoch 1/5:  65%|██████▍   | 1429/2208 [08:28<04:29,  2.89it/s][A
Epoch 1/5:  65%|██████▍   | 1430/2208 [08:29<04:35,  2.83it/s][A
Epoch 1/5:  65%|██████▍   | 1431/2208 [08:29<04:31,  2.86it/s][A
Epoch 1/5:  65%|██████▍   | 1432/2208 [08:29<04:28,  2.89it/s][A
Epoch 1/5:  65%|██████▍   | 1433/2208 [08:30<04:27,  2.90it/s][A
Epoch 1/5:  65%|██████▍   | 1434/2208 [08:30<04:37,  2.79it/s][A
Epoch 1/5:  65%|██████▍   | 1435/2208 [08:30<04:35,  2.81it/s][A
Epoch 1/5:  65%|██████▌   | 1436/2208 [08:31<04:31,  2.84it/s][A
Epoch 1/5:  65%|██████▌   | 1437/2208 [08:31<04:29,  2.86it/s][A
Epoch 1/5:  65%|██████▌   | 1438/2208 [08:31<04:29,  2.86it/s][A
Epoch 1/5:  65%|██████▌   | 1439/2208 [08:32<04:35,  2.79it/s][A
Epoch 1/5:  65%|██████▌   | 1440/2208 [08:32<04:32,  2.82it/s][A
Epoch 1/5:  65%|██████▌   | 1441/2208 [08:32<04:36,  2.78it/s][A
Epoch 1/5

Batch 1450: Training accuracy = 0.7812, F1 = 0.7654, Precision = 0.7682, Recall = 0.7812



Epoch 1/5:  66%|██████▌   | 1452/2208 [08:36<04:21,  2.89it/s][A
Epoch 1/5:  66%|██████▌   | 1453/2208 [08:37<04:26,  2.83it/s][A
Epoch 1/5:  66%|██████▌   | 1454/2208 [08:37<04:23,  2.86it/s][A
Epoch 1/5:  66%|██████▌   | 1455/2208 [08:37<04:32,  2.77it/s][A
Epoch 1/5:  66%|██████▌   | 1456/2208 [08:38<04:27,  2.81it/s][A
Epoch 1/5:  66%|██████▌   | 1457/2208 [08:38<04:26,  2.82it/s][A
Epoch 1/5:  66%|██████▌   | 1458/2208 [08:38<04:21,  2.86it/s][A
Epoch 1/5:  66%|██████▌   | 1459/2208 [08:39<04:26,  2.81it/s][A
Epoch 1/5:  66%|██████▌   | 1460/2208 [08:39<04:34,  2.72it/s][A
Epoch 1/5:  66%|██████▌   | 1461/2208 [08:40<04:34,  2.72it/s][A
Epoch 1/5:  66%|██████▌   | 1462/2208 [08:40<04:27,  2.79it/s][A
Epoch 1/5:  66%|██████▋   | 1463/2208 [08:40<04:27,  2.79it/s][A
Epoch 1/5:  66%|██████▋   | 1464/2208 [08:41<04:30,  2.75it/s][A
Epoch 1/5:  66%|██████▋   | 1465/2208 [08:41<04:31,  2.74it/s][A
Epoch 1/5:  66%|██████▋   | 1466/2208 [08:41<04:27,  2.77it/s][A
Epoch 1/5

Batch 1475: Training accuracy = 0.7188, F1 = 0.6992, Precision = 0.7057, Recall = 0.7188



Epoch 1/5:  67%|██████▋   | 1477/2208 [08:45<04:20,  2.81it/s][A
Epoch 1/5:  67%|██████▋   | 1478/2208 [08:46<04:19,  2.81it/s][A
Epoch 1/5:  67%|██████▋   | 1479/2208 [08:46<04:14,  2.86it/s][A
Epoch 1/5:  67%|██████▋   | 1480/2208 [08:46<04:19,  2.80it/s][A
Epoch 1/5:  67%|██████▋   | 1481/2208 [08:47<04:17,  2.82it/s][A
Epoch 1/5:  67%|██████▋   | 1482/2208 [08:47<04:14,  2.86it/s][A
Epoch 1/5:  67%|██████▋   | 1483/2208 [08:47<04:15,  2.84it/s][A
Epoch 1/5:  67%|██████▋   | 1484/2208 [08:48<04:12,  2.86it/s][A
Epoch 1/5:  67%|██████▋   | 1485/2208 [08:48<04:14,  2.85it/s][A
Epoch 1/5:  67%|██████▋   | 1486/2208 [08:48<04:14,  2.83it/s][A
Epoch 1/5:  67%|██████▋   | 1487/2208 [08:49<04:11,  2.87it/s][A
Epoch 1/5:  67%|██████▋   | 1488/2208 [08:49<04:12,  2.85it/s][A
Epoch 1/5:  67%|██████▋   | 1489/2208 [08:49<04:11,  2.86it/s][A
Epoch 1/5:  67%|██████▋   | 1490/2208 [08:50<04:16,  2.79it/s][A
Epoch 1/5:  68%|██████▊   | 1491/2208 [08:50<04:12,  2.84it/s][A
Epoch 1/5

Batch 1500: Training accuracy = 0.8281, F1 = 0.8138, Precision = 0.8177, Recall = 0.8281



Epoch 1/5:  68%|██████▊   | 1502/2208 [08:54<04:06,  2.86it/s][A
Epoch 1/5:  68%|██████▊   | 1503/2208 [08:54<04:03,  2.89it/s][A
Epoch 1/5:  68%|██████▊   | 1504/2208 [08:55<04:07,  2.85it/s][A
Epoch 1/5:  68%|██████▊   | 1505/2208 [08:55<04:03,  2.88it/s][A
Epoch 1/5:  68%|██████▊   | 1506/2208 [08:55<04:02,  2.89it/s][A
Epoch 1/5:  68%|██████▊   | 1507/2208 [08:56<04:07,  2.83it/s][A
Epoch 1/5:  68%|██████▊   | 1508/2208 [08:56<04:04,  2.87it/s][A
Epoch 1/5:  68%|██████▊   | 1509/2208 [08:56<04:01,  2.89it/s][A
Epoch 1/5:  68%|██████▊   | 1510/2208 [08:57<04:07,  2.82it/s][A
Epoch 1/5:  68%|██████▊   | 1511/2208 [08:57<04:04,  2.85it/s][A
Epoch 1/5:  68%|██████▊   | 1512/2208 [08:57<04:02,  2.87it/s][A
Epoch 1/5:  69%|██████▊   | 1513/2208 [08:58<04:00,  2.89it/s][A
Epoch 1/5:  69%|██████▊   | 1514/2208 [08:58<03:59,  2.90it/s][A
Epoch 1/5:  69%|██████▊   | 1515/2208 [08:59<03:59,  2.89it/s][A
Epoch 1/5:  69%|██████▊   | 1516/2208 [08:59<03:57,  2.91it/s][A
Epoch 1/5

Batch 1525: Training accuracy = 0.8359, F1 = 0.8224, Precision = 0.8229, Recall = 0.8359



Epoch 1/5:  69%|██████▉   | 1527/2208 [09:03<04:10,  2.72it/s][A
Epoch 1/5:  69%|██████▉   | 1528/2208 [09:03<04:10,  2.71it/s][A
Epoch 1/5:  69%|██████▉   | 1529/2208 [09:04<04:05,  2.77it/s][A
Epoch 1/5:  69%|██████▉   | 1530/2208 [09:04<04:01,  2.81it/s][A
Epoch 1/5:  69%|██████▉   | 1531/2208 [09:04<03:58,  2.84it/s][A
Epoch 1/5:  69%|██████▉   | 1532/2208 [09:05<03:57,  2.85it/s][A
Epoch 1/5:  69%|██████▉   | 1533/2208 [09:05<04:01,  2.80it/s][A
Epoch 1/5:  69%|██████▉   | 1534/2208 [09:05<03:57,  2.83it/s][A
Epoch 1/5:  70%|██████▉   | 1535/2208 [09:06<03:59,  2.82it/s][A
Epoch 1/5:  70%|██████▉   | 1536/2208 [09:06<04:01,  2.78it/s][A
Epoch 1/5:  70%|██████▉   | 1537/2208 [09:06<03:56,  2.83it/s][A
Epoch 1/5:  70%|██████▉   | 1538/2208 [09:07<03:53,  2.86it/s][A
Epoch 1/5:  70%|██████▉   | 1539/2208 [09:07<03:51,  2.89it/s][A
Epoch 1/5:  70%|██████▉   | 1540/2208 [09:07<03:56,  2.82it/s][A
Epoch 1/5:  70%|██████▉   | 1541/2208 [09:08<03:53,  2.86it/s][A
Epoch 1/5

Batch 1550: Training accuracy = 0.7734, F1 = 0.7468, Precision = 0.7372, Recall = 0.7734



Epoch 1/5:  70%|███████   | 1552/2208 [09:12<03:59,  2.74it/s][A
Epoch 1/5:  70%|███████   | 1553/2208 [09:12<03:54,  2.79it/s][A
Epoch 1/5:  70%|███████   | 1554/2208 [09:12<03:51,  2.82it/s][A
Epoch 1/5:  70%|███████   | 1555/2208 [09:13<03:48,  2.86it/s][A
Epoch 1/5:  70%|███████   | 1556/2208 [09:13<03:46,  2.88it/s][A
Epoch 1/5:  71%|███████   | 1557/2208 [09:13<03:44,  2.89it/s][A
Epoch 1/5:  71%|███████   | 1558/2208 [09:14<03:42,  2.92it/s][A
Epoch 1/5:  71%|███████   | 1559/2208 [09:14<03:41,  2.93it/s][A
Epoch 1/5:  71%|███████   | 1560/2208 [09:15<03:42,  2.92it/s][A
Epoch 1/5:  71%|███████   | 1561/2208 [09:15<03:52,  2.79it/s][A
Epoch 1/5:  71%|███████   | 1562/2208 [09:15<03:51,  2.79it/s][A
Epoch 1/5:  71%|███████   | 1563/2208 [09:16<03:52,  2.77it/s][A
Epoch 1/5:  71%|███████   | 1564/2208 [09:16<03:48,  2.82it/s][A
Epoch 1/5:  71%|███████   | 1565/2208 [09:16<03:46,  2.83it/s][A
Epoch 1/5:  71%|███████   | 1566/2208 [09:17<03:44,  2.85it/s][A
Epoch 1/5

Batch 1575: Training accuracy = 0.8438, F1 = 0.8352, Precision = 0.8464, Recall = 0.8438



Epoch 1/5:  71%|███████▏  | 1577/2208 [09:21<03:46,  2.78it/s][A
Epoch 1/5:  71%|███████▏  | 1578/2208 [09:21<03:42,  2.84it/s][A
Epoch 1/5:  72%|███████▏  | 1579/2208 [09:21<03:39,  2.87it/s][A
Epoch 1/5:  72%|███████▏  | 1580/2208 [09:22<03:37,  2.89it/s][A
Epoch 1/5:  72%|███████▏  | 1581/2208 [09:22<03:36,  2.89it/s][A
Epoch 1/5:  72%|███████▏  | 1582/2208 [09:22<03:38,  2.86it/s][A
Epoch 1/5:  72%|███████▏  | 1583/2208 [09:23<03:45,  2.77it/s][A
Epoch 1/5:  72%|███████▏  | 1584/2208 [09:23<03:41,  2.82it/s][A
Epoch 1/5:  72%|███████▏  | 1585/2208 [09:23<03:38,  2.85it/s][A
Epoch 1/5:  72%|███████▏  | 1586/2208 [09:24<03:36,  2.87it/s][A
Epoch 1/5:  72%|███████▏  | 1587/2208 [09:24<03:43,  2.78it/s][A
Epoch 1/5:  72%|███████▏  | 1588/2208 [09:24<03:40,  2.81it/s][A
Epoch 1/5:  72%|███████▏  | 1589/2208 [09:25<03:39,  2.82it/s][A
Epoch 1/5:  72%|███████▏  | 1590/2208 [09:25<03:37,  2.85it/s][A
Epoch 1/5:  72%|███████▏  | 1591/2208 [09:26<03:38,  2.82it/s][A
Epoch 1/5

Batch 1600: Training accuracy = 0.7422, F1 = 0.7370, Precision = 0.7539, Recall = 0.7422



Epoch 1/5:  73%|███████▎  | 1602/2208 [09:29<03:35,  2.81it/s][A
Epoch 1/5:  73%|███████▎  | 1603/2208 [09:30<03:34,  2.83it/s][A
Epoch 1/5:  73%|███████▎  | 1604/2208 [09:30<03:39,  2.76it/s][A
Epoch 1/5:  73%|███████▎  | 1605/2208 [09:31<03:42,  2.72it/s][A
Epoch 1/5:  73%|███████▎  | 1606/2208 [09:31<03:40,  2.73it/s][A
Epoch 1/5:  73%|███████▎  | 1607/2208 [09:31<03:39,  2.74it/s][A
Epoch 1/5:  73%|███████▎  | 1608/2208 [09:32<03:35,  2.79it/s][A
Epoch 1/5:  73%|███████▎  | 1609/2208 [09:32<03:35,  2.78it/s][A
Epoch 1/5:  73%|███████▎  | 1610/2208 [09:32<03:41,  2.70it/s][A
Epoch 1/5:  73%|███████▎  | 1611/2208 [09:33<03:39,  2.72it/s][A
Epoch 1/5:  73%|███████▎  | 1612/2208 [09:33<03:44,  2.66it/s][A
Epoch 1/5:  73%|███████▎  | 1613/2208 [09:33<03:43,  2.66it/s][A
Epoch 1/5:  73%|███████▎  | 1614/2208 [09:34<03:39,  2.70it/s][A
Epoch 1/5:  73%|███████▎  | 1615/2208 [09:34<03:33,  2.78it/s][A
Epoch 1/5:  73%|███████▎  | 1616/2208 [09:35<03:29,  2.82it/s][A
Epoch 1/5

Batch 1625: Training accuracy = 0.8125, F1 = 0.7826, Precision = 0.7760, Recall = 0.8125



Epoch 1/5:  74%|███████▎  | 1627/2208 [09:38<03:24,  2.84it/s][A
Epoch 1/5:  74%|███████▎  | 1628/2208 [09:39<03:21,  2.88it/s][A
Epoch 1/5:  74%|███████▍  | 1629/2208 [09:39<03:20,  2.89it/s][A
Epoch 1/5:  74%|███████▍  | 1630/2208 [09:39<03:21,  2.87it/s][A
Epoch 1/5:  74%|███████▍  | 1631/2208 [09:40<03:19,  2.89it/s][A
Epoch 1/5:  74%|███████▍  | 1632/2208 [09:40<03:21,  2.85it/s][A
Epoch 1/5:  74%|███████▍  | 1633/2208 [09:41<03:20,  2.86it/s][A
Epoch 1/5:  74%|███████▍  | 1634/2208 [09:41<03:25,  2.79it/s][A
Epoch 1/5:  74%|███████▍  | 1635/2208 [09:41<03:26,  2.77it/s][A
Epoch 1/5:  74%|███████▍  | 1636/2208 [09:42<03:26,  2.76it/s][A
Epoch 1/5:  74%|███████▍  | 1637/2208 [09:42<03:28,  2.74it/s][A
Epoch 1/5:  74%|███████▍  | 1638/2208 [09:42<03:25,  2.77it/s][A
Epoch 1/5:  74%|███████▍  | 1639/2208 [09:43<03:27,  2.75it/s][A
Epoch 1/5:  74%|███████▍  | 1640/2208 [09:43<03:30,  2.69it/s][A
Epoch 1/5:  74%|███████▍  | 1641/2208 [09:43<03:30,  2.70it/s][A
Epoch 1/5

Batch 1650: Training accuracy = 0.7812, F1 = 0.7625, Precision = 0.7695, Recall = 0.7812



Epoch 1/5:  75%|███████▍  | 1652/2208 [09:47<03:22,  2.75it/s][A
Epoch 1/5:  75%|███████▍  | 1653/2208 [09:48<03:18,  2.80it/s][A
Epoch 1/5:  75%|███████▍  | 1654/2208 [09:48<03:18,  2.79it/s][A
Epoch 1/5:  75%|███████▍  | 1655/2208 [09:48<03:17,  2.80it/s][A
Epoch 1/5:  75%|███████▌  | 1656/2208 [09:49<03:14,  2.84it/s][A
Epoch 1/5:  75%|███████▌  | 1657/2208 [09:49<03:12,  2.86it/s][A
Epoch 1/5:  75%|███████▌  | 1658/2208 [09:50<03:10,  2.88it/s][A
Epoch 1/5:  75%|███████▌  | 1659/2208 [09:50<03:12,  2.86it/s][A
Epoch 1/5:  75%|███████▌  | 1660/2208 [09:50<03:12,  2.84it/s][A
Epoch 1/5:  75%|███████▌  | 1661/2208 [09:51<03:11,  2.86it/s][A
Epoch 1/5:  75%|███████▌  | 1662/2208 [09:51<03:11,  2.85it/s][A
Epoch 1/5:  75%|███████▌  | 1663/2208 [09:51<03:16,  2.77it/s][A
Epoch 1/5:  75%|███████▌  | 1664/2208 [09:52<03:18,  2.74it/s][A
Epoch 1/5:  75%|███████▌  | 1665/2208 [09:52<03:15,  2.78it/s][A
Epoch 1/5:  75%|███████▌  | 1666/2208 [09:52<03:17,  2.75it/s][A
Epoch 1/5

Batch 1675: Training accuracy = 0.8672, F1 = 0.8594, Precision = 0.8581, Recall = 0.8672



Epoch 1/5:  76%|███████▌  | 1677/2208 [09:56<03:16,  2.70it/s][A
Epoch 1/5:  76%|███████▌  | 1678/2208 [09:57<03:11,  2.77it/s][A
Epoch 1/5:  76%|███████▌  | 1679/2208 [09:57<03:07,  2.83it/s][A
Epoch 1/5:  76%|███████▌  | 1680/2208 [09:57<03:05,  2.85it/s][A
Epoch 1/5:  76%|███████▌  | 1681/2208 [09:58<03:04,  2.86it/s][A
Epoch 1/5:  76%|███████▌  | 1682/2208 [09:58<03:02,  2.88it/s][A
Epoch 1/5:  76%|███████▌  | 1683/2208 [09:58<03:01,  2.88it/s][A
Epoch 1/5:  76%|███████▋  | 1684/2208 [09:59<03:04,  2.85it/s][A
Epoch 1/5:  76%|███████▋  | 1685/2208 [09:59<03:09,  2.76it/s][A
Epoch 1/5:  76%|███████▋  | 1686/2208 [09:59<03:05,  2.81it/s][A
Epoch 1/5:  76%|███████▋  | 1687/2208 [10:00<03:06,  2.80it/s][A
Epoch 1/5:  76%|███████▋  | 1688/2208 [10:00<03:06,  2.78it/s][A
Epoch 1/5:  76%|███████▋  | 1689/2208 [10:01<03:08,  2.76it/s][A
Epoch 1/5:  77%|███████▋  | 1690/2208 [10:01<03:08,  2.75it/s][A
Epoch 1/5:  77%|███████▋  | 1691/2208 [10:01<03:06,  2.77it/s][A
Epoch 1/5

Batch 1700: Training accuracy = 0.8594, F1 = 0.8539, Precision = 0.8607, Recall = 0.8594



Epoch 1/5:  77%|███████▋  | 1702/2208 [10:05<02:58,  2.83it/s][A
Epoch 1/5:  77%|███████▋  | 1703/2208 [10:06<02:56,  2.87it/s][A
Epoch 1/5:  77%|███████▋  | 1704/2208 [10:06<02:57,  2.84it/s][A
Epoch 1/5:  77%|███████▋  | 1705/2208 [10:06<02:55,  2.87it/s][A
Epoch 1/5:  77%|███████▋  | 1706/2208 [10:07<02:59,  2.80it/s][A
Epoch 1/5:  77%|███████▋  | 1707/2208 [10:07<02:56,  2.83it/s][A
Epoch 1/5:  77%|███████▋  | 1708/2208 [10:07<02:54,  2.86it/s][A
Epoch 1/5:  77%|███████▋  | 1709/2208 [10:08<02:53,  2.87it/s][A
Epoch 1/5:  77%|███████▋  | 1710/2208 [10:08<02:56,  2.82it/s][A
Epoch 1/5:  77%|███████▋  | 1711/2208 [10:08<02:54,  2.85it/s][A
Epoch 1/5:  78%|███████▊  | 1712/2208 [10:09<02:52,  2.88it/s][A
Epoch 1/5:  78%|███████▊  | 1713/2208 [10:09<02:52,  2.88it/s][A
Epoch 1/5:  78%|███████▊  | 1714/2208 [10:09<02:55,  2.81it/s][A
Epoch 1/5:  78%|███████▊  | 1715/2208 [10:10<02:53,  2.84it/s][A
Epoch 1/5:  78%|███████▊  | 1716/2208 [10:10<02:56,  2.79it/s][A
Epoch 1/5

Batch 1725: Training accuracy = 0.8516, F1 = 0.8307, Precision = 0.8288, Recall = 0.8516



Epoch 1/5:  78%|███████▊  | 1727/2208 [10:14<02:50,  2.83it/s][A
Epoch 1/5:  78%|███████▊  | 1728/2208 [10:14<02:51,  2.79it/s][A
Epoch 1/5:  78%|███████▊  | 1729/2208 [10:15<02:50,  2.82it/s][A
Epoch 1/5:  78%|███████▊  | 1730/2208 [10:15<02:47,  2.85it/s][A
Epoch 1/5:  78%|███████▊  | 1731/2208 [10:16<02:48,  2.84it/s][A
Epoch 1/5:  78%|███████▊  | 1732/2208 [10:16<02:46,  2.86it/s][A
Epoch 1/5:  78%|███████▊  | 1733/2208 [10:16<02:47,  2.83it/s][A
Epoch 1/5:  79%|███████▊  | 1734/2208 [10:17<02:52,  2.75it/s][A
Epoch 1/5:  79%|███████▊  | 1735/2208 [10:17<02:54,  2.71it/s][A
Epoch 1/5:  79%|███████▊  | 1736/2208 [10:17<02:57,  2.66it/s][A
Epoch 1/5:  79%|███████▊  | 1737/2208 [10:18<02:52,  2.73it/s][A
Epoch 1/5:  79%|███████▊  | 1738/2208 [10:18<02:48,  2.78it/s][A
Epoch 1/5:  79%|███████▉  | 1739/2208 [10:18<02:50,  2.75it/s][A
Epoch 1/5:  79%|███████▉  | 1740/2208 [10:19<02:46,  2.81it/s][A
Epoch 1/5:  79%|███████▉  | 1741/2208 [10:19<02:44,  2.83it/s][A
Epoch 1/5

Batch 1750: Training accuracy = 0.7734, F1 = 0.7577, Precision = 0.7596, Recall = 0.7734



Epoch 1/5:  79%|███████▉  | 1752/2208 [10:23<02:38,  2.88it/s][A
Epoch 1/5:  79%|███████▉  | 1753/2208 [10:23<02:40,  2.83it/s][A
Epoch 1/5:  79%|███████▉  | 1754/2208 [10:24<02:42,  2.80it/s][A
Epoch 1/5:  79%|███████▉  | 1755/2208 [10:24<02:39,  2.85it/s][A
Epoch 1/5:  80%|███████▉  | 1756/2208 [10:24<02:41,  2.79it/s][A
Epoch 1/5:  80%|███████▉  | 1757/2208 [10:25<02:43,  2.77it/s][A
Epoch 1/5:  80%|███████▉  | 1758/2208 [10:25<02:43,  2.74it/s][A
Epoch 1/5:  80%|███████▉  | 1759/2208 [10:26<02:40,  2.80it/s][A
Epoch 1/5:  80%|███████▉  | 1760/2208 [10:26<02:37,  2.84it/s][A
Epoch 1/5:  80%|███████▉  | 1761/2208 [10:26<02:36,  2.86it/s][A
Epoch 1/5:  80%|███████▉  | 1762/2208 [10:27<02:36,  2.85it/s][A
Epoch 1/5:  80%|███████▉  | 1763/2208 [10:27<02:38,  2.81it/s][A
Epoch 1/5:  80%|███████▉  | 1764/2208 [10:27<02:37,  2.81it/s][A
Epoch 1/5:  80%|███████▉  | 1765/2208 [10:28<02:38,  2.79it/s][A
Epoch 1/5:  80%|███████▉  | 1766/2208 [10:28<02:40,  2.76it/s][A
Epoch 1/5

Batch 1775: Training accuracy = 0.7969, F1 = 0.7865, Precision = 0.8021, Recall = 0.7969



Epoch 1/5:  80%|████████  | 1777/2208 [10:32<02:33,  2.80it/s][A
Epoch 1/5:  81%|████████  | 1778/2208 [10:32<02:32,  2.82it/s][A
Epoch 1/5:  81%|████████  | 1779/2208 [10:33<02:30,  2.84it/s][A
Epoch 1/5:  81%|████████  | 1780/2208 [10:33<02:34,  2.78it/s][A
Epoch 1/5:  81%|████████  | 1781/2208 [10:33<02:31,  2.82it/s][A
Epoch 1/5:  81%|████████  | 1782/2208 [10:34<02:29,  2.84it/s][A
Epoch 1/5:  81%|████████  | 1783/2208 [10:34<02:30,  2.82it/s][A
Epoch 1/5:  81%|████████  | 1784/2208 [10:34<02:28,  2.86it/s][A
Epoch 1/5:  81%|████████  | 1785/2208 [10:35<02:26,  2.89it/s][A
Epoch 1/5:  81%|████████  | 1786/2208 [10:35<02:25,  2.89it/s][A
Epoch 1/5:  81%|████████  | 1787/2208 [10:36<02:28,  2.84it/s][A
Epoch 1/5:  81%|████████  | 1788/2208 [10:36<02:29,  2.82it/s][A
Epoch 1/5:  81%|████████  | 1789/2208 [10:36<02:30,  2.78it/s][A
Epoch 1/5:  81%|████████  | 1790/2208 [10:37<02:34,  2.71it/s][A
Epoch 1/5:  81%|████████  | 1791/2208 [10:37<02:33,  2.72it/s][A
Epoch 1/5

Batch 1800: Training accuracy = 0.8516, F1 = 0.8469, Precision = 0.8711, Recall = 0.8516



Epoch 1/5:  82%|████████▏ | 1802/2208 [10:41<02:21,  2.87it/s][A
Epoch 1/5:  82%|████████▏ | 1803/2208 [10:41<02:19,  2.90it/s][A
Epoch 1/5:  82%|████████▏ | 1804/2208 [10:42<02:22,  2.84it/s][A
Epoch 1/5:  82%|████████▏ | 1805/2208 [10:42<02:21,  2.85it/s][A
Epoch 1/5:  82%|████████▏ | 1806/2208 [10:42<02:20,  2.87it/s][A
Epoch 1/5:  82%|████████▏ | 1807/2208 [10:43<02:19,  2.88it/s][A
Epoch 1/5:  82%|████████▏ | 1808/2208 [10:43<02:22,  2.80it/s][A
Epoch 1/5:  82%|████████▏ | 1809/2208 [10:43<02:25,  2.74it/s][A
Epoch 1/5:  82%|████████▏ | 1810/2208 [10:44<02:24,  2.74it/s][A
Epoch 1/5:  82%|████████▏ | 1811/2208 [10:44<02:25,  2.73it/s][A
Epoch 1/5:  82%|████████▏ | 1812/2208 [10:44<02:26,  2.70it/s][A
Epoch 1/5:  82%|████████▏ | 1813/2208 [10:45<02:24,  2.74it/s][A
Epoch 1/5:  82%|████████▏ | 1814/2208 [10:45<02:23,  2.75it/s][A
Epoch 1/5:  82%|████████▏ | 1815/2208 [10:45<02:20,  2.79it/s][A
Epoch 1/5:  82%|████████▏ | 1816/2208 [10:46<02:21,  2.77it/s][A
Epoch 1/5

Batch 1825: Training accuracy = 0.8594, F1 = 0.8408, Precision = 0.8372, Recall = 0.8594



Epoch 1/5:  83%|████████▎ | 1827/2208 [10:50<02:18,  2.74it/s][A
Epoch 1/5:  83%|████████▎ | 1828/2208 [10:50<02:18,  2.74it/s][A
Epoch 1/5:  83%|████████▎ | 1829/2208 [10:51<02:22,  2.67it/s][A
Epoch 1/5:  83%|████████▎ | 1830/2208 [10:51<02:20,  2.68it/s][A
Epoch 1/5:  83%|████████▎ | 1831/2208 [10:51<02:17,  2.75it/s][A
Epoch 1/5:  83%|████████▎ | 1832/2208 [10:52<02:14,  2.80it/s][A
Epoch 1/5:  83%|████████▎ | 1833/2208 [10:52<02:12,  2.83it/s][A
Epoch 1/5:  83%|████████▎ | 1834/2208 [10:52<02:15,  2.77it/s][A
Epoch 1/5:  83%|████████▎ | 1835/2208 [10:53<02:12,  2.82it/s][A
Epoch 1/5:  83%|████████▎ | 1836/2208 [10:53<02:11,  2.84it/s][A
Epoch 1/5:  83%|████████▎ | 1837/2208 [10:53<02:13,  2.77it/s][A
Epoch 1/5:  83%|████████▎ | 1838/2208 [10:54<02:16,  2.71it/s][A
Epoch 1/5:  83%|████████▎ | 1839/2208 [10:54<02:16,  2.71it/s][A
Epoch 1/5:  83%|████████▎ | 1840/2208 [10:55<02:14,  2.74it/s][A
Epoch 1/5:  83%|████████▎ | 1841/2208 [10:55<02:11,  2.80it/s][A
Epoch 1/5

Batch 1850: Training accuracy = 0.8672, F1 = 0.8484, Precision = 0.8424, Recall = 0.8672



Epoch 1/5:  84%|████████▍ | 1852/2208 [10:59<02:06,  2.82it/s][A
Epoch 1/5:  84%|████████▍ | 1853/2208 [10:59<02:07,  2.78it/s][A
Epoch 1/5:  84%|████████▍ | 1854/2208 [10:59<02:09,  2.74it/s][A
Epoch 1/5:  84%|████████▍ | 1855/2208 [11:00<02:08,  2.74it/s][A
Epoch 1/5:  84%|████████▍ | 1856/2208 [11:00<02:11,  2.68it/s][A
Epoch 1/5:  84%|████████▍ | 1857/2208 [11:01<02:07,  2.76it/s][A
Epoch 1/5:  84%|████████▍ | 1858/2208 [11:01<02:07,  2.75it/s][A
Epoch 1/5:  84%|████████▍ | 1859/2208 [11:01<02:11,  2.66it/s][A
Epoch 1/5:  84%|████████▍ | 1860/2208 [11:02<02:09,  2.70it/s][A
Epoch 1/5:  84%|████████▍ | 1861/2208 [11:02<02:08,  2.70it/s][A
Epoch 1/5:  84%|████████▍ | 1862/2208 [11:02<02:08,  2.70it/s][A
Epoch 1/5:  84%|████████▍ | 1863/2208 [11:03<02:10,  2.65it/s][A
Epoch 1/5:  84%|████████▍ | 1864/2208 [11:03<02:09,  2.66it/s][A
Epoch 1/5:  84%|████████▍ | 1865/2208 [11:04<02:05,  2.74it/s][A
Epoch 1/5:  85%|████████▍ | 1866/2208 [11:04<02:05,  2.74it/s][A
Epoch 1/5

Batch 1875: Training accuracy = 0.7891, F1 = 0.7600, Precision = 0.7523, Recall = 0.7891



Epoch 1/5:  85%|████████▌ | 1877/2208 [11:08<02:02,  2.71it/s][A
Epoch 1/5:  85%|████████▌ | 1878/2208 [11:08<01:58,  2.77it/s][A
Epoch 1/5:  85%|████████▌ | 1879/2208 [11:09<02:01,  2.71it/s][A
Epoch 1/5:  85%|████████▌ | 1880/2208 [11:09<01:59,  2.74it/s][A
Epoch 1/5:  85%|████████▌ | 1881/2208 [11:09<01:56,  2.81it/s][A
Epoch 1/5:  85%|████████▌ | 1882/2208 [11:10<01:54,  2.85it/s][A
Epoch 1/5:  85%|████████▌ | 1883/2208 [11:10<01:52,  2.88it/s][A
Epoch 1/5:  85%|████████▌ | 1884/2208 [11:10<01:54,  2.83it/s][A
Epoch 1/5:  85%|████████▌ | 1885/2208 [11:11<01:53,  2.84it/s][A
Epoch 1/5:  85%|████████▌ | 1886/2208 [11:11<01:55,  2.80it/s][A
Epoch 1/5:  85%|████████▌ | 1887/2208 [11:11<01:56,  2.76it/s][A
Epoch 1/5:  86%|████████▌ | 1888/2208 [11:12<01:57,  2.73it/s][A
Epoch 1/5:  86%|████████▌ | 1889/2208 [11:12<01:57,  2.71it/s][A
Epoch 1/5:  86%|████████▌ | 1890/2208 [11:12<01:54,  2.77it/s][A
Epoch 1/5:  86%|████████▌ | 1891/2208 [11:13<01:53,  2.80it/s][A
Epoch 1/5

Batch 1900: Training accuracy = 0.8594, F1 = 0.8302, Precision = 0.8242, Recall = 0.8594



Epoch 1/5:  86%|████████▌ | 1902/2208 [11:17<01:46,  2.86it/s][A
Epoch 1/5:  86%|████████▌ | 1903/2208 [11:17<01:45,  2.90it/s][A
Epoch 1/5:  86%|████████▌ | 1904/2208 [11:17<01:46,  2.86it/s][A
Epoch 1/5:  86%|████████▋ | 1905/2208 [11:18<01:45,  2.87it/s][A
Epoch 1/5:  86%|████████▋ | 1906/2208 [11:18<01:45,  2.87it/s][A
Epoch 1/5:  86%|████████▋ | 1907/2208 [11:18<01:43,  2.90it/s][A
Epoch 1/5:  86%|████████▋ | 1908/2208 [11:19<01:42,  2.92it/s][A
Epoch 1/5:  86%|████████▋ | 1909/2208 [11:19<01:44,  2.86it/s][A
Epoch 1/5:  87%|████████▋ | 1910/2208 [11:19<01:43,  2.89it/s][A
Epoch 1/5:  87%|████████▋ | 1911/2208 [11:20<01:41,  2.91it/s][A
Epoch 1/5:  87%|████████▋ | 1912/2208 [11:20<01:41,  2.93it/s][A
Epoch 1/5:  87%|████████▋ | 1913/2208 [11:20<01:40,  2.94it/s][A
Epoch 1/5:  87%|████████▋ | 1914/2208 [11:21<01:44,  2.81it/s][A
Epoch 1/5:  87%|████████▋ | 1915/2208 [11:21<01:45,  2.79it/s][A
Epoch 1/5:  87%|████████▋ | 1916/2208 [11:22<01:42,  2.84it/s][A
Epoch 1/5

Batch 1925: Training accuracy = 0.8203, F1 = 0.8060, Precision = 0.8079, Recall = 0.8203



Epoch 1/5:  87%|████████▋ | 1927/2208 [11:25<01:36,  2.90it/s][A
Epoch 1/5:  87%|████████▋ | 1928/2208 [11:26<01:38,  2.84it/s][A
Epoch 1/5:  87%|████████▋ | 1929/2208 [11:26<01:37,  2.86it/s][A
Epoch 1/5:  87%|████████▋ | 1930/2208 [11:26<01:35,  2.90it/s][A
Epoch 1/5:  87%|████████▋ | 1931/2208 [11:27<01:34,  2.92it/s][A
Epoch 1/5:  88%|████████▊ | 1932/2208 [11:27<01:36,  2.85it/s][A
Epoch 1/5:  88%|████████▊ | 1933/2208 [11:28<01:35,  2.88it/s][A
Epoch 1/5:  88%|████████▊ | 1934/2208 [11:28<01:34,  2.89it/s][A
Epoch 1/5:  88%|████████▊ | 1935/2208 [11:28<01:34,  2.87it/s][A
Epoch 1/5:  88%|████████▊ | 1936/2208 [11:29<01:35,  2.84it/s][A
Epoch 1/5:  88%|████████▊ | 1937/2208 [11:29<01:34,  2.87it/s][A
Epoch 1/5:  88%|████████▊ | 1938/2208 [11:29<01:36,  2.81it/s][A
Epoch 1/5:  88%|████████▊ | 1939/2208 [11:30<01:38,  2.72it/s][A
Epoch 1/5:  88%|████████▊ | 1940/2208 [11:30<01:38,  2.72it/s][A
Epoch 1/5:  88%|████████▊ | 1941/2208 [11:30<01:36,  2.77it/s][A
Epoch 1/5

Batch 1950: Training accuracy = 0.7500, F1 = 0.7448, Precision = 0.7617, Recall = 0.7500



Epoch 1/5:  88%|████████▊ | 1952/2208 [11:34<01:29,  2.86it/s][A
Epoch 1/5:  88%|████████▊ | 1953/2208 [11:35<01:32,  2.77it/s][A
Epoch 1/5:  88%|████████▊ | 1954/2208 [11:35<01:31,  2.78it/s][A
Epoch 1/5:  89%|████████▊ | 1955/2208 [11:35<01:29,  2.82it/s][A
Epoch 1/5:  89%|████████▊ | 1956/2208 [11:36<01:28,  2.86it/s][A
Epoch 1/5:  89%|████████▊ | 1957/2208 [11:36<01:27,  2.88it/s][A
Epoch 1/5:  89%|████████▊ | 1958/2208 [11:36<01:26,  2.91it/s][A
Epoch 1/5:  89%|████████▊ | 1959/2208 [11:37<01:26,  2.86it/s][A
Epoch 1/5:  89%|████████▉ | 1960/2208 [11:37<01:25,  2.89it/s][A
Epoch 1/5:  89%|████████▉ | 1961/2208 [11:37<01:25,  2.88it/s][A
Epoch 1/5:  89%|████████▉ | 1962/2208 [11:38<01:24,  2.90it/s][A
Epoch 1/5:  89%|████████▉ | 1963/2208 [11:38<01:24,  2.90it/s][A
Epoch 1/5:  89%|████████▉ | 1964/2208 [11:38<01:23,  2.91it/s][A
Epoch 1/5:  89%|████████▉ | 1965/2208 [11:39<01:24,  2.89it/s][A
Epoch 1/5:  89%|████████▉ | 1966/2208 [11:39<01:23,  2.89it/s][A
Epoch 1/5

Batch 1975: Training accuracy = 0.7969, F1 = 0.7716, Precision = 0.7650, Recall = 0.7969



Epoch 1/5:  90%|████████▉ | 1977/2208 [11:43<01:21,  2.82it/s][A
Epoch 1/5:  90%|████████▉ | 1978/2208 [11:43<01:21,  2.84it/s][A
Epoch 1/5:  90%|████████▉ | 1979/2208 [11:44<01:20,  2.86it/s][A
Epoch 1/5:  90%|████████▉ | 1980/2208 [11:44<01:22,  2.77it/s][A
Epoch 1/5:  90%|████████▉ | 1981/2208 [11:44<01:21,  2.79it/s][A
Epoch 1/5:  90%|████████▉ | 1982/2208 [11:45<01:20,  2.82it/s][A
Epoch 1/5:  90%|████████▉ | 1983/2208 [11:45<01:21,  2.78it/s][A
Epoch 1/5:  90%|████████▉ | 1984/2208 [11:45<01:19,  2.83it/s][A
Epoch 1/5:  90%|████████▉ | 1985/2208 [11:46<01:18,  2.84it/s][A
Epoch 1/5:  90%|████████▉ | 1986/2208 [11:46<01:19,  2.79it/s][A
Epoch 1/5:  90%|████████▉ | 1987/2208 [11:47<01:17,  2.84it/s][A
Epoch 1/5:  90%|█████████ | 1988/2208 [11:47<01:19,  2.76it/s][A
Epoch 1/5:  90%|█████████ | 1989/2208 [11:47<01:19,  2.77it/s][A
Epoch 1/5:  90%|█████████ | 1990/2208 [11:48<01:19,  2.75it/s][A
Epoch 1/5:  90%|█████████ | 1991/2208 [11:48<01:18,  2.76it/s][A
Epoch 1/5

Batch 2000: Training accuracy = 0.7891, F1 = 0.7652, Precision = 0.7737, Recall = 0.7891



Epoch 1/5:  91%|█████████ | 2002/2208 [11:52<01:13,  2.80it/s][A
Epoch 1/5:  91%|█████████ | 2003/2208 [11:52<01:12,  2.83it/s][A
Epoch 1/5:  91%|█████████ | 2004/2208 [11:53<01:12,  2.81it/s][A
Epoch 1/5:  91%|█████████ | 2005/2208 [11:53<01:11,  2.86it/s][A
Epoch 1/5:  91%|█████████ | 2006/2208 [11:53<01:09,  2.89it/s][A
Epoch 1/5:  91%|█████████ | 2007/2208 [11:54<01:08,  2.92it/s][A
Epoch 1/5:  91%|█████████ | 2008/2208 [11:54<01:08,  2.92it/s][A
Epoch 1/5:  91%|█████████ | 2009/2208 [11:54<01:08,  2.92it/s][A
Epoch 1/5:  91%|█████████ | 2010/2208 [11:55<01:08,  2.90it/s][A
Epoch 1/5:  91%|█████████ | 2011/2208 [11:55<01:07,  2.90it/s][A
Epoch 1/5:  91%|█████████ | 2012/2208 [11:55<01:08,  2.84it/s][A
Epoch 1/5:  91%|█████████ | 2013/2208 [11:56<01:08,  2.87it/s][A
Epoch 1/5:  91%|█████████ | 2014/2208 [11:56<01:08,  2.82it/s][A
Epoch 1/5:  91%|█████████▏| 2015/2208 [11:56<01:07,  2.85it/s][A
Epoch 1/5:  91%|█████████▏| 2016/2208 [11:57<01:06,  2.88it/s][A
Epoch 1/5

Batch 2025: Training accuracy = 0.8125, F1 = 0.7995, Precision = 0.8115, Recall = 0.8125



Epoch 1/5:  92%|█████████▏| 2027/2208 [12:01<01:04,  2.82it/s][A
Epoch 1/5:  92%|█████████▏| 2028/2208 [12:01<01:02,  2.86it/s][A
Epoch 1/5:  92%|█████████▏| 2029/2208 [12:01<01:02,  2.87it/s][A
Epoch 1/5:  92%|█████████▏| 2030/2208 [12:02<01:04,  2.77it/s][A
Epoch 1/5:  92%|█████████▏| 2031/2208 [12:02<01:04,  2.76it/s][A
Epoch 1/5:  92%|█████████▏| 2032/2208 [12:02<01:02,  2.79it/s][A
Epoch 1/5:  92%|█████████▏| 2033/2208 [12:03<01:01,  2.84it/s][A
Epoch 1/5:  92%|█████████▏| 2034/2208 [12:03<01:00,  2.87it/s][A
Epoch 1/5:  92%|█████████▏| 2035/2208 [12:03<01:00,  2.88it/s][A
Epoch 1/5:  92%|█████████▏| 2036/2208 [12:04<00:59,  2.90it/s][A
Epoch 1/5:  92%|█████████▏| 2037/2208 [12:04<00:58,  2.90it/s][A
Epoch 1/5:  92%|█████████▏| 2038/2208 [12:05<01:00,  2.83it/s][A
Epoch 1/5:  92%|█████████▏| 2039/2208 [12:05<01:00,  2.78it/s][A
Epoch 1/5:  92%|█████████▏| 2040/2208 [12:05<00:59,  2.80it/s][A
Epoch 1/5:  92%|█████████▏| 2041/2208 [12:06<00:58,  2.85it/s][A
Epoch 1/5

Batch 2050: Training accuracy = 0.8359, F1 = 0.8185, Precision = 0.8216, Recall = 0.8359



Epoch 1/5:  93%|█████████▎| 2052/2208 [12:10<00:54,  2.84it/s][A
Epoch 1/5:  93%|█████████▎| 2053/2208 [12:10<00:53,  2.88it/s][A
Epoch 1/5:  93%|█████████▎| 2054/2208 [12:10<00:53,  2.89it/s][A
Epoch 1/5:  93%|█████████▎| 2055/2208 [12:11<00:52,  2.91it/s][A
Epoch 1/5:  93%|█████████▎| 2056/2208 [12:11<00:51,  2.92it/s][A
Epoch 1/5:  93%|█████████▎| 2057/2208 [12:11<00:51,  2.92it/s][A
Epoch 1/5:  93%|█████████▎| 2058/2208 [12:12<00:51,  2.92it/s][A
Epoch 1/5:  93%|█████████▎| 2059/2208 [12:12<00:50,  2.93it/s][A
Epoch 1/5:  93%|█████████▎| 2060/2208 [12:12<00:51,  2.89it/s][A
Epoch 1/5:  93%|█████████▎| 2061/2208 [12:13<00:51,  2.88it/s][A
Epoch 1/5:  93%|█████████▎| 2062/2208 [12:13<00:50,  2.87it/s][A
Epoch 1/5:  93%|█████████▎| 2063/2208 [12:13<00:50,  2.88it/s][A
Epoch 1/5:  93%|█████████▎| 2064/2208 [12:14<00:50,  2.83it/s][A
Epoch 1/5:  94%|█████████▎| 2065/2208 [12:14<00:50,  2.85it/s][A
Epoch 1/5:  94%|█████████▎| 2066/2208 [12:14<00:49,  2.88it/s][A
Epoch 1/5

Batch 2075: Training accuracy = 0.8125, F1 = 0.7971, Precision = 0.7969, Recall = 0.8125



Epoch 1/5:  94%|█████████▍| 2077/2208 [12:18<00:45,  2.88it/s][A
Epoch 1/5:  94%|█████████▍| 2078/2208 [12:19<00:44,  2.90it/s][A
Epoch 1/5:  94%|█████████▍| 2079/2208 [12:19<00:44,  2.92it/s][A
Epoch 1/5:  94%|█████████▍| 2080/2208 [12:19<00:43,  2.93it/s][A
Epoch 1/5:  94%|█████████▍| 2081/2208 [12:20<00:43,  2.93it/s][A
Epoch 1/5:  94%|█████████▍| 2082/2208 [12:20<00:43,  2.89it/s][A
Epoch 1/5:  94%|█████████▍| 2083/2208 [12:20<00:44,  2.83it/s][A
Epoch 1/5:  94%|█████████▍| 2084/2208 [12:21<00:44,  2.80it/s][A
Epoch 1/5:  94%|█████████▍| 2085/2208 [12:21<00:43,  2.82it/s][A
Epoch 1/5:  94%|█████████▍| 2086/2208 [12:21<00:43,  2.80it/s][A
Epoch 1/5:  95%|█████████▍| 2087/2208 [12:22<00:43,  2.76it/s][A
Epoch 1/5:  95%|█████████▍| 2088/2208 [12:22<00:42,  2.81it/s][A
Epoch 1/5:  95%|█████████▍| 2089/2208 [12:22<00:41,  2.85it/s][A
Epoch 1/5:  95%|█████████▍| 2090/2208 [12:23<00:41,  2.87it/s][A
Epoch 1/5:  95%|█████████▍| 2091/2208 [12:23<00:40,  2.86it/s][A
Epoch 1/5

Batch 2100: Training accuracy = 0.8672, F1 = 0.8536, Precision = 0.8542, Recall = 0.8672



Epoch 1/5:  95%|█████████▌| 2102/2208 [12:27<00:37,  2.86it/s][A
Epoch 1/5:  95%|█████████▌| 2103/2208 [12:27<00:36,  2.88it/s][A
Epoch 1/5:  95%|█████████▌| 2104/2208 [12:28<00:35,  2.90it/s][A
Epoch 1/5:  95%|█████████▌| 2105/2208 [12:28<00:35,  2.89it/s][A
Epoch 1/5:  95%|█████████▌| 2106/2208 [12:28<00:36,  2.82it/s][A
Epoch 1/5:  95%|█████████▌| 2107/2208 [12:29<00:36,  2.78it/s][A
Epoch 1/5:  95%|█████████▌| 2108/2208 [12:29<00:35,  2.78it/s][A
Epoch 1/5:  96%|█████████▌| 2109/2208 [12:29<00:35,  2.81it/s][A
Epoch 1/5:  96%|█████████▌| 2110/2208 [12:30<00:34,  2.85it/s][A
Epoch 1/5:  96%|█████████▌| 2111/2208 [12:30<00:34,  2.82it/s][A
Epoch 1/5:  96%|█████████▌| 2112/2208 [12:31<00:34,  2.82it/s][A
Epoch 1/5:  96%|█████████▌| 2113/2208 [12:31<00:33,  2.86it/s][A
Epoch 1/5:  96%|█████████▌| 2114/2208 [12:31<00:33,  2.84it/s][A
Epoch 1/5:  96%|█████████▌| 2115/2208 [12:32<00:32,  2.85it/s][A
Epoch 1/5:  96%|█████████▌| 2116/2208 [12:32<00:32,  2.85it/s][A
Epoch 1/5

Batch 2125: Training accuracy = 0.7969, F1 = 0.7647, Precision = 0.7513, Recall = 0.7969



Epoch 1/5:  96%|█████████▋| 2127/2208 [12:36<00:29,  2.77it/s][A
Epoch 1/5:  96%|█████████▋| 2128/2208 [12:36<00:28,  2.82it/s][A
Epoch 1/5:  96%|█████████▋| 2129/2208 [12:37<00:28,  2.75it/s][A
Epoch 1/5:  96%|█████████▋| 2130/2208 [12:37<00:27,  2.80it/s][A
Epoch 1/5:  97%|█████████▋| 2131/2208 [12:37<00:27,  2.83it/s][A
Epoch 1/5:  97%|█████████▋| 2132/2208 [12:38<00:26,  2.87it/s][A
Epoch 1/5:  97%|█████████▋| 2133/2208 [12:38<00:25,  2.89it/s][A
Epoch 1/5:  97%|█████████▋| 2134/2208 [12:38<00:26,  2.83it/s][A
Epoch 1/5:  97%|█████████▋| 2135/2208 [12:39<00:25,  2.86it/s][A
Epoch 1/5:  97%|█████████▋| 2136/2208 [12:39<00:24,  2.90it/s][A
Epoch 1/5:  97%|█████████▋| 2137/2208 [12:39<00:24,  2.91it/s][A
Epoch 1/5:  97%|█████████▋| 2138/2208 [12:40<00:23,  2.93it/s][A
Epoch 1/5:  97%|█████████▋| 2139/2208 [12:40<00:23,  2.93it/s][A
Epoch 1/5:  97%|█████████▋| 2140/2208 [12:40<00:23,  2.94it/s][A
Epoch 1/5:  97%|█████████▋| 2141/2208 [12:41<00:23,  2.90it/s][A
Epoch 1/5

Batch 2150: Training accuracy = 0.8906, F1 = 0.8828, Precision = 0.8828, Recall = 0.8906



Epoch 1/5:  97%|█████████▋| 2152/2208 [12:45<00:20,  2.69it/s][A
Epoch 1/5:  98%|█████████▊| 2153/2208 [12:45<00:19,  2.76it/s][A
Epoch 1/5:  98%|█████████▊| 2154/2208 [12:45<00:20,  2.67it/s][A
Epoch 1/5:  98%|█████████▊| 2155/2208 [12:46<00:20,  2.62it/s][A
Epoch 1/5:  98%|█████████▊| 2156/2208 [12:46<00:19,  2.70it/s][A
Epoch 1/5:  98%|█████████▊| 2157/2208 [12:47<00:18,  2.70it/s][A
Epoch 1/5:  98%|█████████▊| 2158/2208 [12:47<00:18,  2.77it/s][A
Epoch 1/5:  98%|█████████▊| 2159/2208 [12:47<00:17,  2.82it/s][A
Epoch 1/5:  98%|█████████▊| 2160/2208 [12:48<00:16,  2.84it/s][A
Epoch 1/5:  98%|█████████▊| 2161/2208 [12:48<00:17,  2.76it/s][A
Epoch 1/5:  98%|█████████▊| 2162/2208 [12:48<00:16,  2.77it/s][A
Epoch 1/5:  98%|█████████▊| 2163/2208 [12:49<00:16,  2.81it/s][A
Epoch 1/5:  98%|█████████▊| 2164/2208 [12:49<00:15,  2.85it/s][A
Epoch 1/5:  98%|█████████▊| 2165/2208 [12:49<00:15,  2.75it/s][A
Epoch 1/5:  98%|█████████▊| 2166/2208 [12:50<00:14,  2.81it/s][A
Epoch 1/5

Batch 2175: Training accuracy = 0.7891, F1 = 0.7807, Precision = 0.7930, Recall = 0.7891



Epoch 1/5:  99%|█████████▊| 2177/2208 [12:54<00:11,  2.79it/s][A
Epoch 1/5:  99%|█████████▊| 2178/2208 [12:54<00:10,  2.82it/s][A
Epoch 1/5:  99%|█████████▊| 2179/2208 [12:54<00:10,  2.73it/s][A
Epoch 1/5:  99%|█████████▊| 2180/2208 [12:55<00:10,  2.77it/s][A
Epoch 1/5:  99%|█████████▉| 2181/2208 [12:55<00:09,  2.82it/s][A
Epoch 1/5:  99%|█████████▉| 2182/2208 [12:56<00:09,  2.79it/s][A
Epoch 1/5:  99%|█████████▉| 2183/2208 [12:56<00:08,  2.78it/s][A
Epoch 1/5:  99%|█████████▉| 2184/2208 [12:56<00:08,  2.83it/s][A
Epoch 1/5:  99%|█████████▉| 2185/2208 [12:57<00:08,  2.85it/s][A
Epoch 1/5:  99%|█████████▉| 2186/2208 [12:57<00:07,  2.88it/s][A
Epoch 1/5:  99%|█████████▉| 2187/2208 [12:57<00:07,  2.84it/s][A
Epoch 1/5:  99%|█████████▉| 2188/2208 [12:58<00:07,  2.78it/s][A
Epoch 1/5:  99%|█████████▉| 2189/2208 [12:58<00:06,  2.80it/s][A
Epoch 1/5:  99%|█████████▉| 2190/2208 [12:58<00:06,  2.80it/s][A
Epoch 1/5:  99%|█████████▉| 2191/2208 [12:59<00:06,  2.79it/s][A
Epoch 1/5

Batch 2200: Training accuracy = 0.8359, F1 = 0.8318, Precision = 0.8438, Recall = 0.8359



Epoch 1/5: 100%|█████████▉| 2202/2208 [13:03<00:02,  2.86it/s][A
Epoch 1/5: 100%|█████████▉| 2203/2208 [13:03<00:01,  2.88it/s][A
Epoch 1/5: 100%|█████████▉| 2204/2208 [13:03<00:01,  2.88it/s][A
Epoch 1/5: 100%|█████████▉| 2205/2208 [13:04<00:01,  2.90it/s][A
Epoch 1/5: 100%|█████████▉| 2206/2208 [13:04<00:00,  2.91it/s][A
Epoch 1/5: 100%|█████████▉| 2207/2208 [13:04<00:00,  2.91it/s][A
Epoch 1/5: 100%|██████████| 2208/2208 [13:05<00:00,  2.93it/s][A
                                                              [A


Epoch 1 training accuracy: 0.74%
Epoch 1 training F1 score: 0.7486
Epoch 1 training precision: 0.7604
Epoch 1 training recall: 0.7444

Starting validation...



Validation:   0%|          | 0/552 [00:00<?, ?it/s][A
Validation:   0%|          | 1/552 [00:01<15:27,  1.68s/it][A
Validation:   1%|          | 4/552 [00:01<03:11,  2.87it/s][A
Validation:   1%|          | 6/552 [00:01<02:06,  4.32it/s][A
Validation:   1%|▏         | 8/552 [00:02<01:28,  6.12it/s][A
Validation:   2%|▏         | 10/552 [00:02<01:15,  7.17it/s][A
Validation:   2%|▏         | 12/552 [00:02<00:59,  9.05it/s][A
Validation:   3%|▎         | 14/552 [00:02<00:52, 10.24it/s][A
Validation:   3%|▎         | 16/552 [00:02<00:49, 10.73it/s][A
Validation:   3%|▎         | 18/552 [00:02<00:52, 10.24it/s][A
Validation:   4%|▎         | 20/552 [00:03<00:58,  9.08it/s][A
Validation:   4%|▍         | 23/552 [00:03<00:42, 12.55it/s][A
Validation:   5%|▍         | 25/552 [00:03<00:44, 11.88it/s][A
Validation:   5%|▌         | 28/552 [00:03<00:34, 14.99it/s][A
Validation:   5%|▌         | 30/552 [00:03<00:37, 13.88it/s][A
Validation:   6%|▌         | 32/552 [00:04<00:45, 11

Validation accuracy: 0.65%
Validation F1 score: 0.6672
Validation precision: 0.7966
Validation recall: 0.6512

Starting epoch 2/5



  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))

Epoch 2/5:   0%|          | 1/2208 [00:01<1:12:46,  1.98s/it][A

Batch 0: Training accuracy = 0.8203, F1 = 0.8099, Precision = 0.8177, Recall = 0.8203



Epoch 2/5:   0%|          | 2/2208 [00:02<37:17,  1.01s/it]  [A
Epoch 2/5:   0%|          | 3/2208 [00:02<25:56,  1.42it/s][A
Epoch 2/5:   0%|          | 4/2208 [00:02<20:34,  1.79it/s][A
Epoch 2/5:   0%|          | 5/2208 [00:03<18:01,  2.04it/s][A
Epoch 2/5:   0%|          | 6/2208 [00:03<16:11,  2.27it/s][A
Epoch 2/5:   0%|          | 7/2208 [00:04<14:57,  2.45it/s][A
Epoch 2/5:   0%|          | 8/2208 [00:04<14:09,  2.59it/s][A
Epoch 2/5:   0%|          | 9/2208 [00:04<13:36,  2.69it/s][A
Epoch 2/5:   0%|          | 10/2208 [00:05<13:16,  2.76it/s][A
Epoch 2/5:   0%|          | 11/2208 [00:05<13:00,  2.82it/s][A
Epoch 2/5:   1%|          | 12/2208 [00:05<12:49,  2.85it/s][A
Epoch 2/5:   1%|          | 13/2208 [00:06<12:40,  2.89it/s][A
Epoch 2/5:   1%|          | 14/2208 [00:06<12:35,  2.90it/s][A
Epoch 2/5:   1%|          | 15/2208 [00:06<12:31,  2.92it/s][A
Epoch 2/5:   1%|          | 16/2208 [00:07<12:31,  2.92it/s][A
Epoch 2/5:   1%|          | 17/2208 [00:07<12

Batch 25: Training accuracy = 0.8750, F1 = 0.8724, Precision = 0.8750, Recall = 0.8750



Epoch 2/5:   1%|          | 27/2208 [00:10<12:55,  2.81it/s][A
Epoch 2/5:   1%|▏         | 28/2208 [00:11<12:44,  2.85it/s][A
Epoch 2/5:   1%|▏         | 29/2208 [00:11<12:46,  2.84it/s][A
Epoch 2/5:   1%|▏         | 30/2208 [00:12<12:45,  2.84it/s][A
Epoch 2/5:   1%|▏         | 31/2208 [00:12<12:43,  2.85it/s][A
Epoch 2/5:   1%|▏         | 32/2208 [00:12<12:51,  2.82it/s][A
Epoch 2/5:   1%|▏         | 33/2208 [00:13<13:05,  2.77it/s][A
Epoch 2/5:   2%|▏         | 34/2208 [00:13<12:55,  2.80it/s][A
Epoch 2/5:   2%|▏         | 35/2208 [00:13<12:45,  2.84it/s][A
Epoch 2/5:   2%|▏         | 36/2208 [00:14<12:39,  2.86it/s][A
Epoch 2/5:   2%|▏         | 37/2208 [00:14<12:59,  2.79it/s][A
Epoch 2/5:   2%|▏         | 38/2208 [00:14<12:57,  2.79it/s][A
Epoch 2/5:   2%|▏         | 39/2208 [00:15<12:51,  2.81it/s][A
Epoch 2/5:   2%|▏         | 40/2208 [00:15<12:45,  2.83it/s][A
Epoch 2/5:   2%|▏         | 41/2208 [00:15<12:36,  2.86it/s][A
Epoch 2/5:   2%|▏         | 42/2208 [00

Batch 50: Training accuracy = 0.8438, F1 = 0.8230, Precision = 0.8161, Recall = 0.8438



Epoch 2/5:   2%|▏         | 52/2208 [00:19<12:45,  2.82it/s][A
Epoch 2/5:   2%|▏         | 53/2208 [00:20<12:34,  2.86it/s][A
Epoch 2/5:   2%|▏         | 54/2208 [00:20<12:42,  2.82it/s][A
Epoch 2/5:   2%|▏         | 55/2208 [00:20<13:08,  2.73it/s][A
Epoch 2/5:   3%|▎         | 56/2208 [00:21<13:09,  2.73it/s][A
Epoch 2/5:   3%|▎         | 57/2208 [00:21<13:05,  2.74it/s][A
Epoch 2/5:   3%|▎         | 58/2208 [00:21<13:03,  2.74it/s][A
Epoch 2/5:   3%|▎         | 59/2208 [00:22<12:50,  2.79it/s][A
Epoch 2/5:   3%|▎         | 60/2208 [00:22<12:41,  2.82it/s][A
Epoch 2/5:   3%|▎         | 61/2208 [00:23<12:42,  2.82it/s][A
Epoch 2/5:   3%|▎         | 62/2208 [00:23<12:35,  2.84it/s][A
Epoch 2/5:   3%|▎         | 63/2208 [00:23<12:24,  2.88it/s][A
Epoch 2/5:   3%|▎         | 64/2208 [00:24<12:41,  2.82it/s][A
Epoch 2/5:   3%|▎         | 65/2208 [00:24<12:55,  2.76it/s][A
Epoch 2/5:   3%|▎         | 66/2208 [00:24<12:46,  2.79it/s][A
Epoch 2/5:   3%|▎         | 67/2208 [00

Batch 75: Training accuracy = 0.8125, F1 = 0.7930, Precision = 0.7965, Recall = 0.8125



Epoch 2/5:   3%|▎         | 77/2208 [00:28<12:37,  2.81it/s][A
Epoch 2/5:   4%|▎         | 78/2208 [00:29<12:26,  2.85it/s][A
Epoch 2/5:   4%|▎         | 79/2208 [00:29<12:23,  2.86it/s][A
Epoch 2/5:   4%|▎         | 80/2208 [00:29<12:29,  2.84it/s][A
Epoch 2/5:   4%|▎         | 81/2208 [00:30<12:27,  2.85it/s][A
Epoch 2/5:   4%|▎         | 82/2208 [00:30<12:47,  2.77it/s][A
Epoch 2/5:   4%|▍         | 83/2208 [00:30<12:34,  2.82it/s][A
Epoch 2/5:   4%|▍         | 84/2208 [00:31<12:44,  2.78it/s][A
Epoch 2/5:   4%|▍         | 85/2208 [00:31<12:30,  2.83it/s][A
Epoch 2/5:   4%|▍         | 86/2208 [00:31<12:38,  2.80it/s][A
Epoch 2/5:   4%|▍         | 87/2208 [00:32<12:28,  2.83it/s][A
Epoch 2/5:   4%|▍         | 88/2208 [00:32<12:22,  2.85it/s][A
Epoch 2/5:   4%|▍         | 89/2208 [00:32<12:22,  2.86it/s][A
Epoch 2/5:   4%|▍         | 90/2208 [00:33<12:20,  2.86it/s][A
Epoch 2/5:   4%|▍         | 91/2208 [00:33<12:14,  2.88it/s][A
Epoch 2/5:   4%|▍         | 92/2208 [00

Batch 100: Training accuracy = 0.8359, F1 = 0.8260, Precision = 0.8340, Recall = 0.8359



Epoch 2/5:   5%|▍         | 102/2208 [00:37<12:20,  2.85it/s][A
Epoch 2/5:   5%|▍         | 103/2208 [00:37<12:29,  2.81it/s][A
Epoch 2/5:   5%|▍         | 104/2208 [00:38<12:17,  2.85it/s][A
Epoch 2/5:   5%|▍         | 105/2208 [00:38<12:17,  2.85it/s][A
Epoch 2/5:   5%|▍         | 106/2208 [00:38<12:17,  2.85it/s][A
Epoch 2/5:   5%|▍         | 107/2208 [00:39<12:15,  2.86it/s][A
Epoch 2/5:   5%|▍         | 108/2208 [00:39<12:11,  2.87it/s][A
Epoch 2/5:   5%|▍         | 109/2208 [00:39<12:23,  2.82it/s][A
Epoch 2/5:   5%|▍         | 110/2208 [00:40<12:17,  2.85it/s][A
Epoch 2/5:   5%|▌         | 111/2208 [00:40<12:12,  2.86it/s][A
Epoch 2/5:   5%|▌         | 112/2208 [00:41<12:08,  2.88it/s][A
Epoch 2/5:   5%|▌         | 113/2208 [00:41<12:08,  2.88it/s][A
Epoch 2/5:   5%|▌         | 114/2208 [00:41<12:24,  2.81it/s][A
Epoch 2/5:   5%|▌         | 115/2208 [00:42<12:37,  2.76it/s][A
Epoch 2/5:   5%|▌         | 116/2208 [00:42<12:44,  2.74it/s][A
Epoch 2/5:   5%|▌       

Batch 125: Training accuracy = 0.8203, F1 = 0.7917, Precision = 0.7906, Recall = 0.8203



Epoch 2/5:   6%|▌         | 127/2208 [00:46<12:32,  2.76it/s][A
Epoch 2/5:   6%|▌         | 128/2208 [00:46<12:20,  2.81it/s][A
Epoch 2/5:   6%|▌         | 129/2208 [00:47<12:07,  2.86it/s][A
Epoch 2/5:   6%|▌         | 130/2208 [00:47<12:03,  2.87it/s][A
Epoch 2/5:   6%|▌         | 131/2208 [00:47<12:04,  2.87it/s][A
Epoch 2/5:   6%|▌         | 132/2208 [00:48<12:09,  2.85it/s][A
Epoch 2/5:   6%|▌         | 133/2208 [00:48<12:03,  2.87it/s][A
Epoch 2/5:   6%|▌         | 134/2208 [00:48<12:07,  2.85it/s][A
Epoch 2/5:   6%|▌         | 135/2208 [00:49<11:59,  2.88it/s][A
Epoch 2/5:   6%|▌         | 136/2208 [00:49<11:51,  2.91it/s][A
Epoch 2/5:   6%|▌         | 137/2208 [00:49<12:04,  2.86it/s][A
Epoch 2/5:   6%|▋         | 138/2208 [00:50<11:57,  2.89it/s][A
Epoch 2/5:   6%|▋         | 139/2208 [00:50<11:55,  2.89it/s][A
Epoch 2/5:   6%|▋         | 140/2208 [00:50<11:54,  2.89it/s][A
Epoch 2/5:   6%|▋         | 141/2208 [00:51<11:57,  2.88it/s][A
Epoch 2/5:   6%|▋       

Batch 150: Training accuracy = 0.8438, F1 = 0.8234, Precision = 0.8301, Recall = 0.8438



Epoch 2/5:   7%|▋         | 152/2208 [00:55<12:00,  2.85it/s][A
Epoch 2/5:   7%|▋         | 153/2208 [00:55<11:54,  2.87it/s][A
Epoch 2/5:   7%|▋         | 154/2208 [00:55<12:06,  2.83it/s][A
Epoch 2/5:   7%|▋         | 155/2208 [00:56<12:04,  2.83it/s][A
Epoch 2/5:   7%|▋         | 156/2208 [00:56<12:21,  2.77it/s][A
Epoch 2/5:   7%|▋         | 157/2208 [00:56<12:16,  2.79it/s][A
Epoch 2/5:   7%|▋         | 158/2208 [00:57<12:08,  2.81it/s][A
Epoch 2/5:   7%|▋         | 159/2208 [00:57<12:01,  2.84it/s][A
Epoch 2/5:   7%|▋         | 160/2208 [00:58<12:06,  2.82it/s][A
Epoch 2/5:   7%|▋         | 161/2208 [00:58<12:03,  2.83it/s][A
Epoch 2/5:   7%|▋         | 162/2208 [00:58<12:37,  2.70it/s][A
Epoch 2/5:   7%|▋         | 163/2208 [00:59<12:43,  2.68it/s][A
Epoch 2/5:   7%|▋         | 164/2208 [00:59<12:35,  2.70it/s][A
Epoch 2/5:   7%|▋         | 165/2208 [00:59<12:16,  2.78it/s][A
Epoch 2/5:   8%|▊         | 166/2208 [01:00<12:05,  2.81it/s][A
Epoch 2/5:   8%|▊       

Batch 175: Training accuracy = 0.8125, F1 = 0.8107, Precision = 0.8255, Recall = 0.8125



Epoch 2/5:   8%|▊         | 177/2208 [01:04<12:32,  2.70it/s][A
Epoch 2/5:   8%|▊         | 178/2208 [01:04<12:13,  2.77it/s][A
Epoch 2/5:   8%|▊         | 179/2208 [01:04<11:58,  2.82it/s][A
Epoch 2/5:   8%|▊         | 180/2208 [01:05<11:48,  2.86it/s][A
Epoch 2/5:   8%|▊         | 181/2208 [01:05<11:42,  2.88it/s][A
Epoch 2/5:   8%|▊         | 182/2208 [01:05<11:56,  2.83it/s][A
Epoch 2/5:   8%|▊         | 183/2208 [01:06<11:57,  2.82it/s][A
Epoch 2/5:   8%|▊         | 184/2208 [01:06<11:54,  2.83it/s][A
Epoch 2/5:   8%|▊         | 185/2208 [01:07<11:54,  2.83it/s][A
Epoch 2/5:   8%|▊         | 186/2208 [01:07<12:01,  2.80it/s][A
Epoch 2/5:   8%|▊         | 187/2208 [01:07<11:53,  2.83it/s][A
Epoch 2/5:   9%|▊         | 188/2208 [01:08<11:45,  2.86it/s][A
Epoch 2/5:   9%|▊         | 189/2208 [01:08<11:42,  2.87it/s][A
Epoch 2/5:   9%|▊         | 190/2208 [01:08<11:34,  2.90it/s][A
Epoch 2/5:   9%|▊         | 191/2208 [01:09<11:48,  2.85it/s][A
Epoch 2/5:   9%|▊       

Batch 200: Training accuracy = 0.8438, F1 = 0.8294, Precision = 0.8307, Recall = 0.8438



Epoch 2/5:   9%|▉         | 202/2208 [01:12<11:45,  2.84it/s][A
Epoch 2/5:   9%|▉         | 203/2208 [01:13<12:00,  2.78it/s][A
Epoch 2/5:   9%|▉         | 204/2208 [01:13<12:07,  2.75it/s][A
Epoch 2/5:   9%|▉         | 205/2208 [01:14<11:58,  2.79it/s][A
Epoch 2/5:   9%|▉         | 206/2208 [01:14<11:51,  2.81it/s][A
Epoch 2/5:   9%|▉         | 207/2208 [01:14<11:49,  2.82it/s][A
Epoch 2/5:   9%|▉         | 208/2208 [01:15<11:50,  2.82it/s][A
Epoch 2/5:   9%|▉         | 209/2208 [01:15<11:45,  2.83it/s][A
Epoch 2/5:  10%|▉         | 210/2208 [01:15<11:36,  2.87it/s][A
Epoch 2/5:  10%|▉         | 211/2208 [01:16<11:37,  2.86it/s][A
Epoch 2/5:  10%|▉         | 212/2208 [01:16<11:47,  2.82it/s][A
Epoch 2/5:  10%|▉         | 213/2208 [01:16<11:56,  2.78it/s][A
Epoch 2/5:  10%|▉         | 214/2208 [01:17<11:44,  2.83it/s][A
Epoch 2/5:  10%|▉         | 215/2208 [01:17<11:37,  2.86it/s][A
Epoch 2/5:  10%|▉         | 216/2208 [01:17<11:53,  2.79it/s][A
Epoch 2/5:  10%|▉       

Batch 225: Training accuracy = 0.7969, F1 = 0.7781, Precision = 0.7799, Recall = 0.7969



Epoch 2/5:  10%|█         | 227/2208 [01:21<11:51,  2.78it/s][A
Epoch 2/5:  10%|█         | 228/2208 [01:22<12:02,  2.74it/s][A
Epoch 2/5:  10%|█         | 229/2208 [01:22<11:48,  2.79it/s][A
Epoch 2/5:  10%|█         | 230/2208 [01:23<11:37,  2.83it/s][A
Epoch 2/5:  10%|█         | 231/2208 [01:23<11:32,  2.86it/s][A
Epoch 2/5:  11%|█         | 232/2208 [01:23<11:38,  2.83it/s][A
Epoch 2/5:  11%|█         | 233/2208 [01:24<11:56,  2.75it/s][A
Epoch 2/5:  11%|█         | 234/2208 [01:24<11:46,  2.80it/s][A
Epoch 2/5:  11%|█         | 235/2208 [01:24<12:00,  2.74it/s][A
Epoch 2/5:  11%|█         | 236/2208 [01:25<12:15,  2.68it/s][A
Epoch 2/5:  11%|█         | 237/2208 [01:25<12:04,  2.72it/s][A
Epoch 2/5:  11%|█         | 238/2208 [01:25<11:49,  2.78it/s][A
Epoch 2/5:  11%|█         | 239/2208 [01:26<12:12,  2.69it/s][A
Epoch 2/5:  11%|█         | 240/2208 [01:26<11:58,  2.74it/s][A
Epoch 2/5:  11%|█         | 241/2208 [01:27<12:09,  2.70it/s][A
Epoch 2/5:  11%|█       

Batch 250: Training accuracy = 0.7266, F1 = 0.7151, Precision = 0.7240, Recall = 0.7266



Epoch 2/5:  11%|█▏        | 252/2208 [01:31<11:59,  2.72it/s][A
Epoch 2/5:  11%|█▏        | 253/2208 [01:31<12:08,  2.68it/s][A
Epoch 2/5:  12%|█▏        | 254/2208 [01:31<11:58,  2.72it/s][A
Epoch 2/5:  12%|█▏        | 255/2208 [01:32<12:00,  2.71it/s][A
Epoch 2/5:  12%|█▏        | 256/2208 [01:32<11:49,  2.75it/s][A
Epoch 2/5:  12%|█▏        | 257/2208 [01:32<11:34,  2.81it/s][A
Epoch 2/5:  12%|█▏        | 258/2208 [01:33<11:23,  2.85it/s][A
Epoch 2/5:  12%|█▏        | 259/2208 [01:33<11:17,  2.88it/s][A
Epoch 2/5:  12%|█▏        | 260/2208 [01:33<11:15,  2.88it/s][A
Epoch 2/5:  12%|█▏        | 261/2208 [01:34<11:11,  2.90it/s][A
Epoch 2/5:  12%|█▏        | 262/2208 [01:34<11:11,  2.90it/s][A
Epoch 2/5:  12%|█▏        | 263/2208 [01:34<11:26,  2.83it/s][A
Epoch 2/5:  12%|█▏        | 264/2208 [01:35<11:19,  2.86it/s][A
Epoch 2/5:  12%|█▏        | 265/2208 [01:35<11:34,  2.80it/s][A
Epoch 2/5:  12%|█▏        | 266/2208 [01:35<11:36,  2.79it/s][A
Epoch 2/5:  12%|█▏      

Batch 275: Training accuracy = 0.8828, F1 = 0.8782, Precision = 0.8861, Recall = 0.8828



Epoch 2/5:  13%|█▎        | 277/2208 [01:39<11:34,  2.78it/s][A
Epoch 2/5:  13%|█▎        | 278/2208 [01:40<11:28,  2.80it/s][A
Epoch 2/5:  13%|█▎        | 279/2208 [01:40<11:27,  2.81it/s][A
Epoch 2/5:  13%|█▎        | 280/2208 [01:40<11:22,  2.83it/s][A
Epoch 2/5:  13%|█▎        | 281/2208 [01:41<11:23,  2.82it/s][A
Epoch 2/5:  13%|█▎        | 282/2208 [01:41<11:19,  2.83it/s][A
Epoch 2/5:  13%|█▎        | 283/2208 [01:41<11:13,  2.86it/s][A
Epoch 2/5:  13%|█▎        | 284/2208 [01:42<11:22,  2.82it/s][A
Epoch 2/5:  13%|█▎        | 285/2208 [01:42<11:48,  2.71it/s][A
Epoch 2/5:  13%|█▎        | 286/2208 [01:43<11:47,  2.72it/s][A
Epoch 2/5:  13%|█▎        | 287/2208 [01:43<11:51,  2.70it/s][A
Epoch 2/5:  13%|█▎        | 288/2208 [01:43<11:52,  2.70it/s][A
Epoch 2/5:  13%|█▎        | 289/2208 [01:44<12:05,  2.65it/s][A
Epoch 2/5:  13%|█▎        | 290/2208 [01:44<12:07,  2.64it/s][A
Epoch 2/5:  13%|█▎        | 291/2208 [01:44<11:57,  2.67it/s][A
Epoch 2/5:  13%|█▎      

Batch 300: Training accuracy = 0.8516, F1 = 0.8346, Precision = 0.8349, Recall = 0.8516



Epoch 2/5:  14%|█▎        | 302/2208 [01:48<11:09,  2.85it/s][A
Epoch 2/5:  14%|█▎        | 303/2208 [01:49<11:02,  2.88it/s][A
Epoch 2/5:  14%|█▍        | 304/2208 [01:49<10:58,  2.89it/s][A
Epoch 2/5:  14%|█▍        | 305/2208 [01:49<10:53,  2.91it/s][A
Epoch 2/5:  14%|█▍        | 306/2208 [01:50<11:09,  2.84it/s][A
Epoch 2/5:  14%|█▍        | 307/2208 [01:50<11:30,  2.75it/s][A
Epoch 2/5:  14%|█▍        | 308/2208 [01:51<11:15,  2.81it/s][A
Epoch 2/5:  14%|█▍        | 309/2208 [01:51<11:25,  2.77it/s][A
Epoch 2/5:  14%|█▍        | 310/2208 [01:51<11:13,  2.82it/s][A
Epoch 2/5:  14%|█▍        | 311/2208 [01:52<11:19,  2.79it/s][A
Epoch 2/5:  14%|█▍        | 312/2208 [01:52<11:09,  2.83it/s][A
Epoch 2/5:  14%|█▍        | 313/2208 [01:52<11:24,  2.77it/s][A
Epoch 2/5:  14%|█▍        | 314/2208 [01:53<11:14,  2.81it/s][A
Epoch 2/5:  14%|█▍        | 315/2208 [01:53<11:08,  2.83it/s][A
Epoch 2/5:  14%|█▍        | 316/2208 [01:53<11:06,  2.84it/s][A
Epoch 2/5:  14%|█▍      

Batch 325: Training accuracy = 0.7969, F1 = 0.7820, Precision = 0.7910, Recall = 0.7969



Epoch 2/5:  15%|█▍        | 327/2208 [01:57<11:06,  2.82it/s][A
Epoch 2/5:  15%|█▍        | 328/2208 [01:58<10:57,  2.86it/s][A
Epoch 2/5:  15%|█▍        | 329/2208 [01:58<10:52,  2.88it/s][A
Epoch 2/5:  15%|█▍        | 330/2208 [01:58<10:59,  2.85it/s][A
Epoch 2/5:  15%|█▍        | 331/2208 [01:59<10:59,  2.85it/s][A
Epoch 2/5:  15%|█▌        | 332/2208 [01:59<11:14,  2.78it/s][A
Epoch 2/5:  15%|█▌        | 333/2208 [01:59<11:05,  2.82it/s][A
Epoch 2/5:  15%|█▌        | 334/2208 [02:00<11:14,  2.78it/s][A
Epoch 2/5:  15%|█▌        | 335/2208 [02:00<11:09,  2.80it/s][A
Epoch 2/5:  15%|█▌        | 336/2208 [02:00<10:59,  2.84it/s][A
Epoch 2/5:  15%|█▌        | 337/2208 [02:01<10:51,  2.87it/s][A
Epoch 2/5:  15%|█▌        | 338/2208 [02:01<10:45,  2.90it/s][A
Epoch 2/5:  15%|█▌        | 339/2208 [02:02<11:09,  2.79it/s][A
Epoch 2/5:  15%|█▌        | 340/2208 [02:02<11:10,  2.78it/s][A
Epoch 2/5:  15%|█▌        | 341/2208 [02:02<10:57,  2.84it/s][A
Epoch 2/5:  15%|█▌      

Batch 350: Training accuracy = 0.8438, F1 = 0.8305, Precision = 0.8307, Recall = 0.8438



Epoch 2/5:  16%|█▌        | 352/2208 [02:06<11:08,  2.78it/s][A
Epoch 2/5:  16%|█▌        | 353/2208 [02:07<11:12,  2.76it/s][A
Epoch 2/5:  16%|█▌        | 354/2208 [02:07<11:08,  2.77it/s][A
Epoch 2/5:  16%|█▌        | 355/2208 [02:07<10:52,  2.84it/s][A
Epoch 2/5:  16%|█▌        | 356/2208 [02:08<10:44,  2.88it/s][A
Epoch 2/5:  16%|█▌        | 357/2208 [02:08<10:40,  2.89it/s][A
Epoch 2/5:  16%|█▌        | 358/2208 [02:08<10:54,  2.83it/s][A
Epoch 2/5:  16%|█▋        | 359/2208 [02:09<11:05,  2.78it/s][A
Epoch 2/5:  16%|█▋        | 360/2208 [02:09<11:07,  2.77it/s][A
Epoch 2/5:  16%|█▋        | 361/2208 [02:09<11:03,  2.78it/s][A
Epoch 2/5:  16%|█▋        | 362/2208 [02:10<10:53,  2.82it/s][A
Epoch 2/5:  16%|█▋        | 363/2208 [02:10<10:59,  2.80it/s][A
Epoch 2/5:  16%|█▋        | 364/2208 [02:10<10:55,  2.81it/s][A
Epoch 2/5:  17%|█▋        | 365/2208 [02:11<10:58,  2.80it/s][A
Epoch 2/5:  17%|█▋        | 366/2208 [02:11<10:52,  2.82it/s][A
Epoch 2/5:  17%|█▋      

Batch 375: Training accuracy = 0.8438, F1 = 0.8237, Precision = 0.8255, Recall = 0.8438



Epoch 2/5:  17%|█▋        | 377/2208 [02:15<10:49,  2.82it/s][A
Epoch 2/5:  17%|█▋        | 378/2208 [02:15<10:41,  2.85it/s][A
Epoch 2/5:  17%|█▋        | 379/2208 [02:16<10:35,  2.88it/s][A
Epoch 2/5:  17%|█▋        | 380/2208 [02:16<10:33,  2.88it/s][A
Epoch 2/5:  17%|█▋        | 381/2208 [02:16<10:48,  2.82it/s][A
Epoch 2/5:  17%|█▋        | 382/2208 [02:17<10:38,  2.86it/s][A
Epoch 2/5:  17%|█▋        | 383/2208 [02:17<10:32,  2.88it/s][A
Epoch 2/5:  17%|█▋        | 384/2208 [02:18<10:47,  2.82it/s][A
Epoch 2/5:  17%|█▋        | 385/2208 [02:18<10:54,  2.79it/s][A
Epoch 2/5:  17%|█▋        | 386/2208 [02:18<10:43,  2.83it/s][A
Epoch 2/5:  18%|█▊        | 387/2208 [02:19<10:41,  2.84it/s][A
Epoch 2/5:  18%|█▊        | 388/2208 [02:19<10:35,  2.86it/s][A
Epoch 2/5:  18%|█▊        | 389/2208 [02:19<10:29,  2.89it/s][A
Epoch 2/5:  18%|█▊        | 390/2208 [02:20<10:27,  2.90it/s][A
Epoch 2/5:  18%|█▊        | 391/2208 [02:20<10:42,  2.83it/s][A
Epoch 2/5:  18%|█▊      

Batch 400: Training accuracy = 0.8984, F1 = 0.8789, Precision = 0.8698, Recall = 0.8984



Epoch 2/5:  18%|█▊        | 402/2208 [02:24<10:23,  2.90it/s][A
Epoch 2/5:  18%|█▊        | 403/2208 [02:24<10:27,  2.88it/s][A
Epoch 2/5:  18%|█▊        | 404/2208 [02:25<10:26,  2.88it/s][A
Epoch 2/5:  18%|█▊        | 405/2208 [02:25<10:29,  2.86it/s][A
Epoch 2/5:  18%|█▊        | 406/2208 [02:25<10:59,  2.73it/s][A
Epoch 2/5:  18%|█▊        | 407/2208 [02:26<11:01,  2.72it/s][A
Epoch 2/5:  18%|█▊        | 408/2208 [02:26<11:09,  2.69it/s][A
Epoch 2/5:  19%|█▊        | 409/2208 [02:26<10:58,  2.73it/s][A
Epoch 2/5:  19%|█▊        | 410/2208 [02:27<11:07,  2.70it/s][A
Epoch 2/5:  19%|█▊        | 411/2208 [02:27<11:15,  2.66it/s][A
Epoch 2/5:  19%|█▊        | 412/2208 [02:28<10:59,  2.72it/s][A
Epoch 2/5:  19%|█▊        | 413/2208 [02:28<11:02,  2.71it/s][A
Epoch 2/5:  19%|█▉        | 414/2208 [02:28<11:07,  2.69it/s][A
Epoch 2/5:  19%|█▉        | 415/2208 [02:29<11:07,  2.69it/s][A
Epoch 2/5:  19%|█▉        | 416/2208 [02:29<10:51,  2.75it/s][A
Epoch 2/5:  19%|█▉      

Batch 425: Training accuracy = 0.8516, F1 = 0.8372, Precision = 0.8372, Recall = 0.8516



Epoch 2/5:  19%|█▉        | 427/2208 [02:33<10:39,  2.78it/s][A
Epoch 2/5:  19%|█▉        | 428/2208 [02:33<10:50,  2.74it/s][A
Epoch 2/5:  19%|█▉        | 429/2208 [02:34<10:37,  2.79it/s][A
Epoch 2/5:  19%|█▉        | 430/2208 [02:34<10:32,  2.81it/s][A
Epoch 2/5:  20%|█▉        | 431/2208 [02:34<10:25,  2.84it/s][A
Epoch 2/5:  20%|█▉        | 432/2208 [02:35<10:20,  2.86it/s][A
Epoch 2/5:  20%|█▉        | 433/2208 [02:35<10:21,  2.86it/s][A
Epoch 2/5:  20%|█▉        | 434/2208 [02:35<10:17,  2.87it/s][A
Epoch 2/5:  20%|█▉        | 435/2208 [02:36<10:15,  2.88it/s][A
Epoch 2/5:  20%|█▉        | 436/2208 [02:36<10:12,  2.89it/s][A
Epoch 2/5:  20%|█▉        | 437/2208 [02:36<10:08,  2.91it/s][A
Epoch 2/5:  20%|█▉        | 438/2208 [02:37<10:12,  2.89it/s][A
Epoch 2/5:  20%|█▉        | 439/2208 [02:37<10:13,  2.88it/s][A
Epoch 2/5:  20%|█▉        | 440/2208 [02:37<10:10,  2.90it/s][A
Epoch 2/5:  20%|█▉        | 441/2208 [02:38<10:10,  2.89it/s][A
Epoch 2/5:  20%|██      

Batch 450: Training accuracy = 0.8438, F1 = 0.8398, Precision = 0.8607, Recall = 0.8438



Epoch 2/5:  20%|██        | 452/2208 [02:42<10:31,  2.78it/s][A
Epoch 2/5:  21%|██        | 453/2208 [02:42<10:36,  2.76it/s][A
Epoch 2/5:  21%|██        | 454/2208 [02:42<10:44,  2.72it/s][A
Epoch 2/5:  21%|██        | 455/2208 [02:43<10:48,  2.71it/s][A
Epoch 2/5:  21%|██        | 456/2208 [02:43<10:45,  2.71it/s][A
Epoch 2/5:  21%|██        | 457/2208 [02:43<10:35,  2.75it/s][A
Epoch 2/5:  21%|██        | 458/2208 [02:44<10:25,  2.80it/s][A
Epoch 2/5:  21%|██        | 459/2208 [02:44<10:17,  2.83it/s][A
Epoch 2/5:  21%|██        | 460/2208 [02:45<10:11,  2.86it/s][A
Epoch 2/5:  21%|██        | 461/2208 [02:45<10:24,  2.80it/s][A
Epoch 2/5:  21%|██        | 462/2208 [02:45<10:14,  2.84it/s][A
Epoch 2/5:  21%|██        | 463/2208 [02:46<10:06,  2.88it/s][A
Epoch 2/5:  21%|██        | 464/2208 [02:46<10:05,  2.88it/s][A
Epoch 2/5:  21%|██        | 465/2208 [02:46<10:00,  2.90it/s][A
Epoch 2/5:  21%|██        | 466/2208 [02:47<09:56,  2.92it/s][A
Epoch 2/5:  21%|██      

Batch 475: Training accuracy = 0.8125, F1 = 0.7938, Precision = 0.7949, Recall = 0.8125



Epoch 2/5:  22%|██▏       | 477/2208 [02:50<09:58,  2.89it/s][A
Epoch 2/5:  22%|██▏       | 478/2208 [02:51<09:55,  2.90it/s][A
Epoch 2/5:  22%|██▏       | 479/2208 [02:51<09:59,  2.88it/s][A
Epoch 2/5:  22%|██▏       | 480/2208 [02:51<09:59,  2.88it/s][A
Epoch 2/5:  22%|██▏       | 481/2208 [02:52<09:58,  2.89it/s][A
Epoch 2/5:  22%|██▏       | 482/2208 [02:52<10:13,  2.81it/s][A
Epoch 2/5:  22%|██▏       | 483/2208 [02:52<10:05,  2.85it/s][A
Epoch 2/5:  22%|██▏       | 484/2208 [02:53<09:59,  2.88it/s][A
Epoch 2/5:  22%|██▏       | 485/2208 [02:53<09:55,  2.89it/s][A
Epoch 2/5:  22%|██▏       | 486/2208 [02:54<10:07,  2.83it/s][A
Epoch 2/5:  22%|██▏       | 487/2208 [02:54<10:15,  2.80it/s][A
Epoch 2/5:  22%|██▏       | 488/2208 [02:54<10:07,  2.83it/s][A
Epoch 2/5:  22%|██▏       | 489/2208 [02:55<10:04,  2.84it/s][A
Epoch 2/5:  22%|██▏       | 490/2208 [02:55<10:08,  2.83it/s][A
Epoch 2/5:  22%|██▏       | 491/2208 [02:55<10:25,  2.74it/s][A
Epoch 2/5:  22%|██▏     

Batch 500: Training accuracy = 0.8125, F1 = 0.7896, Precision = 0.7831, Recall = 0.8125



Epoch 2/5:  23%|██▎       | 502/2208 [02:59<09:53,  2.87it/s][A
Epoch 2/5:  23%|██▎       | 503/2208 [03:00<09:49,  2.89it/s][A
Epoch 2/5:  23%|██▎       | 504/2208 [03:00<09:46,  2.91it/s][A
Epoch 2/5:  23%|██▎       | 505/2208 [03:00<09:59,  2.84it/s][A
Epoch 2/5:  23%|██▎       | 506/2208 [03:01<09:58,  2.84it/s][A
Epoch 2/5:  23%|██▎       | 507/2208 [03:01<09:52,  2.87it/s][A
Epoch 2/5:  23%|██▎       | 508/2208 [03:01<09:49,  2.88it/s][A
Epoch 2/5:  23%|██▎       | 509/2208 [03:02<09:46,  2.90it/s][A
Epoch 2/5:  23%|██▎       | 510/2208 [03:02<09:44,  2.91it/s][A
Epoch 2/5:  23%|██▎       | 511/2208 [03:02<09:54,  2.85it/s][A
Epoch 2/5:  23%|██▎       | 512/2208 [03:03<09:48,  2.88it/s][A
Epoch 2/5:  23%|██▎       | 513/2208 [03:03<10:02,  2.81it/s][A
Epoch 2/5:  23%|██▎       | 514/2208 [03:03<09:54,  2.85it/s][A
Epoch 2/5:  23%|██▎       | 515/2208 [03:04<10:03,  2.80it/s][A
Epoch 2/5:  23%|██▎       | 516/2208 [03:04<09:53,  2.85it/s][A
Epoch 2/5:  23%|██▎     

Batch 525: Training accuracy = 0.8203, F1 = 0.8167, Precision = 0.8294, Recall = 0.8203



Epoch 2/5:  24%|██▍       | 527/2208 [03:08<10:00,  2.80it/s][A
Epoch 2/5:  24%|██▍       | 528/2208 [03:08<09:49,  2.85it/s][A
Epoch 2/5:  24%|██▍       | 529/2208 [03:09<09:46,  2.86it/s][A
Epoch 2/5:  24%|██▍       | 530/2208 [03:09<09:51,  2.84it/s][A
Epoch 2/5:  24%|██▍       | 531/2208 [03:09<09:44,  2.87it/s][A
Epoch 2/5:  24%|██▍       | 532/2208 [03:10<09:53,  2.83it/s][A
Epoch 2/5:  24%|██▍       | 533/2208 [03:10<09:52,  2.82it/s][A
Epoch 2/5:  24%|██▍       | 534/2208 [03:11<09:56,  2.81it/s][A
Epoch 2/5:  24%|██▍       | 535/2208 [03:11<09:48,  2.84it/s][A
Epoch 2/5:  24%|██▍       | 536/2208 [03:11<10:04,  2.77it/s][A
Epoch 2/5:  24%|██▍       | 537/2208 [03:12<10:10,  2.74it/s][A
Epoch 2/5:  24%|██▍       | 538/2208 [03:12<09:59,  2.78it/s][A
Epoch 2/5:  24%|██▍       | 539/2208 [03:12<10:04,  2.76it/s][A
Epoch 2/5:  24%|██▍       | 540/2208 [03:13<09:53,  2.81it/s][A
Epoch 2/5:  25%|██▍       | 541/2208 [03:13<09:51,  2.82it/s][A
Epoch 2/5:  25%|██▍     

Batch 550: Training accuracy = 0.8281, F1 = 0.8124, Precision = 0.8294, Recall = 0.8281



Epoch 2/5:  25%|██▌       | 552/2208 [03:17<10:03,  2.74it/s][A
Epoch 2/5:  25%|██▌       | 553/2208 [03:17<09:57,  2.77it/s][A
Epoch 2/5:  25%|██▌       | 554/2208 [03:18<10:01,  2.75it/s][A
Epoch 2/5:  25%|██▌       | 555/2208 [03:18<10:08,  2.72it/s][A
Epoch 2/5:  25%|██▌       | 556/2208 [03:18<09:57,  2.77it/s][A
Epoch 2/5:  25%|██▌       | 557/2208 [03:19<09:53,  2.78it/s][A
Epoch 2/5:  25%|██▌       | 558/2208 [03:19<09:55,  2.77it/s][A
Epoch 2/5:  25%|██▌       | 559/2208 [03:20<09:52,  2.78it/s][A
Epoch 2/5:  25%|██▌       | 560/2208 [03:20<09:44,  2.82it/s][A
Epoch 2/5:  25%|██▌       | 561/2208 [03:20<09:36,  2.86it/s][A
Epoch 2/5:  25%|██▌       | 562/2208 [03:21<09:29,  2.89it/s][A
Epoch 2/5:  25%|██▌       | 563/2208 [03:21<09:26,  2.91it/s][A
Epoch 2/5:  26%|██▌       | 564/2208 [03:21<09:26,  2.90it/s][A
Epoch 2/5:  26%|██▌       | 565/2208 [03:22<09:24,  2.91it/s][A
Epoch 2/5:  26%|██▌       | 566/2208 [03:22<09:22,  2.92it/s][A
Epoch 2/5:  26%|██▌     

Batch 575: Training accuracy = 0.8281, F1 = 0.7987, Precision = 0.7917, Recall = 0.8281



Epoch 2/5:  26%|██▌       | 577/2208 [03:26<09:37,  2.82it/s][A
Epoch 2/5:  26%|██▌       | 578/2208 [03:26<09:29,  2.86it/s][A
Epoch 2/5:  26%|██▌       | 579/2208 [03:27<09:38,  2.82it/s][A
Epoch 2/5:  26%|██▋       | 580/2208 [03:27<09:34,  2.83it/s][A
Epoch 2/5:  26%|██▋       | 581/2208 [03:27<09:31,  2.85it/s][A
Epoch 2/5:  26%|██▋       | 582/2208 [03:28<09:45,  2.78it/s][A
Epoch 2/5:  26%|██▋       | 583/2208 [03:28<10:03,  2.69it/s][A
Epoch 2/5:  26%|██▋       | 584/2208 [03:28<10:05,  2.68it/s][A
Epoch 2/5:  26%|██▋       | 585/2208 [03:29<10:07,  2.67it/s][A
Epoch 2/5:  27%|██▋       | 586/2208 [03:29<09:52,  2.74it/s][A
Epoch 2/5:  27%|██▋       | 587/2208 [03:29<09:50,  2.74it/s][A
Epoch 2/5:  27%|██▋       | 588/2208 [03:30<09:43,  2.77it/s][A
Epoch 2/5:  27%|██▋       | 589/2208 [03:30<09:32,  2.83it/s][A
Epoch 2/5:  27%|██▋       | 590/2208 [03:30<09:30,  2.84it/s][A
Epoch 2/5:  27%|██▋       | 591/2208 [03:31<09:37,  2.80it/s][A
Epoch 2/5:  27%|██▋     

Batch 600: Training accuracy = 0.8281, F1 = 0.7982, Precision = 0.7871, Recall = 0.8281



Epoch 2/5:  27%|██▋       | 602/2208 [03:35<09:23,  2.85it/s][A
Epoch 2/5:  27%|██▋       | 603/2208 [03:35<09:18,  2.87it/s][A
Epoch 2/5:  27%|██▋       | 604/2208 [03:35<09:14,  2.89it/s][A
Epoch 2/5:  27%|██▋       | 605/2208 [03:36<09:11,  2.91it/s][A
Epoch 2/5:  27%|██▋       | 606/2208 [03:36<09:12,  2.90it/s][A
Epoch 2/5:  27%|██▋       | 607/2208 [03:36<09:18,  2.87it/s][A
Epoch 2/5:  28%|██▊       | 608/2208 [03:37<09:14,  2.88it/s][A
Epoch 2/5:  28%|██▊       | 609/2208 [03:37<09:12,  2.89it/s][A
Epoch 2/5:  28%|██▊       | 610/2208 [03:38<09:17,  2.86it/s][A
Epoch 2/5:  28%|██▊       | 611/2208 [03:38<09:15,  2.87it/s][A
Epoch 2/5:  28%|██▊       | 612/2208 [03:38<09:20,  2.85it/s][A
Epoch 2/5:  28%|██▊       | 613/2208 [03:39<09:33,  2.78it/s][A
Epoch 2/5:  28%|██▊       | 614/2208 [03:39<09:24,  2.82it/s][A
Epoch 2/5:  28%|██▊       | 615/2208 [03:39<09:33,  2.78it/s][A
Epoch 2/5:  28%|██▊       | 616/2208 [03:40<09:32,  2.78it/s][A
Epoch 2/5:  28%|██▊     

Batch 625: Training accuracy = 0.8672, F1 = 0.8506, Precision = 0.8480, Recall = 0.8672



Epoch 2/5:  28%|██▊       | 627/2208 [03:43<09:13,  2.85it/s][A
Epoch 2/5:  28%|██▊       | 628/2208 [03:44<09:09,  2.88it/s][A
Epoch 2/5:  28%|██▊       | 629/2208 [03:44<09:16,  2.84it/s][A
Epoch 2/5:  29%|██▊       | 630/2208 [03:45<09:35,  2.74it/s][A
Epoch 2/5:  29%|██▊       | 631/2208 [03:45<09:26,  2.78it/s][A
Epoch 2/5:  29%|██▊       | 632/2208 [03:45<09:31,  2.76it/s][A
Epoch 2/5:  29%|██▊       | 633/2208 [03:46<09:20,  2.81it/s][A
Epoch 2/5:  29%|██▊       | 634/2208 [03:46<09:15,  2.83it/s][A
Epoch 2/5:  29%|██▉       | 635/2208 [03:46<09:08,  2.87it/s][A
Epoch 2/5:  29%|██▉       | 636/2208 [03:47<09:17,  2.82it/s][A
Epoch 2/5:  29%|██▉       | 637/2208 [03:47<09:15,  2.83it/s][A
Epoch 2/5:  29%|██▉       | 638/2208 [03:47<09:08,  2.86it/s][A
Epoch 2/5:  29%|██▉       | 639/2208 [03:48<09:17,  2.81it/s][A
Epoch 2/5:  29%|██▉       | 640/2208 [03:48<09:16,  2.82it/s][A
Epoch 2/5:  29%|██▉       | 641/2208 [03:48<09:27,  2.76it/s][A
Epoch 2/5:  29%|██▉     

Batch 650: Training accuracy = 0.8281, F1 = 0.8273, Precision = 0.8509, Recall = 0.8281



Epoch 2/5:  30%|██▉       | 652/2208 [03:52<09:04,  2.86it/s][A
Epoch 2/5:  30%|██▉       | 653/2208 [03:53<09:00,  2.87it/s][A
Epoch 2/5:  30%|██▉       | 654/2208 [03:53<09:19,  2.78it/s][A
Epoch 2/5:  30%|██▉       | 655/2208 [03:53<09:18,  2.78it/s][A
Epoch 2/5:  30%|██▉       | 656/2208 [03:54<09:11,  2.81it/s][A
Epoch 2/5:  30%|██▉       | 657/2208 [03:54<09:06,  2.84it/s][A
Epoch 2/5:  30%|██▉       | 658/2208 [03:54<09:10,  2.82it/s][A
Epoch 2/5:  30%|██▉       | 659/2208 [03:55<09:01,  2.86it/s][A
Epoch 2/5:  30%|██▉       | 660/2208 [03:55<09:03,  2.85it/s][A
Epoch 2/5:  30%|██▉       | 661/2208 [03:56<09:01,  2.86it/s][A
Epoch 2/5:  30%|██▉       | 662/2208 [03:56<08:57,  2.87it/s][A
Epoch 2/5:  30%|███       | 663/2208 [03:56<09:11,  2.80it/s][A
Epoch 2/5:  30%|███       | 664/2208 [03:57<09:19,  2.76it/s][A
Epoch 2/5:  30%|███       | 665/2208 [03:57<09:24,  2.74it/s][A
Epoch 2/5:  30%|███       | 666/2208 [03:57<09:27,  2.72it/s][A
Epoch 2/5:  30%|███     

Batch 675: Training accuracy = 0.8281, F1 = 0.8065, Precision = 0.8017, Recall = 0.8281



Epoch 2/5:  31%|███       | 677/2208 [04:01<09:10,  2.78it/s][A
Epoch 2/5:  31%|███       | 678/2208 [04:02<09:04,  2.81it/s][A
Epoch 2/5:  31%|███       | 679/2208 [04:02<09:14,  2.76it/s][A
Epoch 2/5:  31%|███       | 680/2208 [04:02<09:20,  2.73it/s][A
Epoch 2/5:  31%|███       | 681/2208 [04:03<09:25,  2.70it/s][A
Epoch 2/5:  31%|███       | 682/2208 [04:03<09:22,  2.71it/s][A
Epoch 2/5:  31%|███       | 683/2208 [04:04<09:07,  2.78it/s][A
Epoch 2/5:  31%|███       | 684/2208 [04:04<08:58,  2.83it/s][A
Epoch 2/5:  31%|███       | 685/2208 [04:04<09:06,  2.79it/s][A
Epoch 2/5:  31%|███       | 686/2208 [04:05<09:12,  2.76it/s][A
Epoch 2/5:  31%|███       | 687/2208 [04:05<09:02,  2.80it/s][A
Epoch 2/5:  31%|███       | 688/2208 [04:05<09:06,  2.78it/s][A
Epoch 2/5:  31%|███       | 689/2208 [04:06<08:58,  2.82it/s][A
Epoch 2/5:  31%|███▏      | 690/2208 [04:06<08:59,  2.81it/s][A
Epoch 2/5:  31%|███▏      | 691/2208 [04:06<08:50,  2.86it/s][A
Epoch 2/5:  31%|███▏    

Batch 700: Training accuracy = 0.8359, F1 = 0.8251, Precision = 0.8418, Recall = 0.8359



Epoch 2/5:  32%|███▏      | 702/2208 [04:10<08:55,  2.81it/s][A
Epoch 2/5:  32%|███▏      | 703/2208 [04:11<08:52,  2.83it/s][A
Epoch 2/5:  32%|███▏      | 704/2208 [04:11<08:51,  2.83it/s][A
Epoch 2/5:  32%|███▏      | 705/2208 [04:11<09:07,  2.74it/s][A
Epoch 2/5:  32%|███▏      | 706/2208 [04:12<09:03,  2.76it/s][A
Epoch 2/5:  32%|███▏      | 707/2208 [04:12<09:10,  2.73it/s][A
Epoch 2/5:  32%|███▏      | 708/2208 [04:13<09:12,  2.72it/s][A
Epoch 2/5:  32%|███▏      | 709/2208 [04:13<09:01,  2.77it/s][A
Epoch 2/5:  32%|███▏      | 710/2208 [04:13<08:53,  2.81it/s][A
Epoch 2/5:  32%|███▏      | 711/2208 [04:14<08:48,  2.83it/s][A
Epoch 2/5:  32%|███▏      | 712/2208 [04:14<08:45,  2.85it/s][A
Epoch 2/5:  32%|███▏      | 713/2208 [04:14<08:39,  2.88it/s][A
Epoch 2/5:  32%|███▏      | 714/2208 [04:15<08:48,  2.82it/s][A
Epoch 2/5:  32%|███▏      | 715/2208 [04:15<08:44,  2.85it/s][A
Epoch 2/5:  32%|███▏      | 716/2208 [04:15<08:40,  2.87it/s][A
Epoch 2/5:  32%|███▏    

Batch 725: Training accuracy = 0.8750, F1 = 0.8609, Precision = 0.8607, Recall = 0.8750



Epoch 2/5:  33%|███▎      | 727/2208 [04:19<08:36,  2.87it/s][A
Epoch 2/5:  33%|███▎      | 728/2208 [04:20<08:38,  2.86it/s][A
Epoch 2/5:  33%|███▎      | 729/2208 [04:20<08:52,  2.78it/s][A
Epoch 2/5:  33%|███▎      | 730/2208 [04:20<08:55,  2.76it/s][A
Epoch 2/5:  33%|███▎      | 731/2208 [04:21<08:45,  2.81it/s][A
Epoch 2/5:  33%|███▎      | 732/2208 [04:21<08:53,  2.77it/s][A
Epoch 2/5:  33%|███▎      | 733/2208 [04:21<08:45,  2.81it/s][A
Epoch 2/5:  33%|███▎      | 734/2208 [04:22<08:37,  2.85it/s][A
Epoch 2/5:  33%|███▎      | 735/2208 [04:22<08:33,  2.87it/s][A
Epoch 2/5:  33%|███▎      | 736/2208 [04:22<08:30,  2.88it/s][A
Epoch 2/5:  33%|███▎      | 737/2208 [04:23<08:28,  2.89it/s][A
Epoch 2/5:  33%|███▎      | 738/2208 [04:23<08:34,  2.86it/s][A
Epoch 2/5:  33%|███▎      | 739/2208 [04:23<08:28,  2.89it/s][A
Epoch 2/5:  34%|███▎      | 740/2208 [04:24<08:34,  2.85it/s][A
Epoch 2/5:  34%|███▎      | 741/2208 [04:24<08:38,  2.83it/s][A
Epoch 2/5:  34%|███▎    

Batch 750: Training accuracy = 0.7734, F1 = 0.7677, Precision = 0.7754, Recall = 0.7734



Epoch 2/5:  34%|███▍      | 752/2208 [04:28<08:40,  2.80it/s][A
Epoch 2/5:  34%|███▍      | 753/2208 [04:28<08:31,  2.84it/s][A
Epoch 2/5:  34%|███▍      | 754/2208 [04:29<08:24,  2.88it/s][A
Epoch 2/5:  34%|███▍      | 755/2208 [04:29<08:32,  2.84it/s][A
Epoch 2/5:  34%|███▍      | 756/2208 [04:29<08:24,  2.88it/s][A
Epoch 2/5:  34%|███▍      | 757/2208 [04:30<08:42,  2.78it/s][A
Epoch 2/5:  34%|███▍      | 758/2208 [04:30<08:51,  2.73it/s][A
Epoch 2/5:  34%|███▍      | 759/2208 [04:31<08:40,  2.79it/s][A
Epoch 2/5:  34%|███▍      | 760/2208 [04:31<08:42,  2.77it/s][A
Epoch 2/5:  34%|███▍      | 761/2208 [04:31<08:33,  2.82it/s][A
Epoch 2/5:  35%|███▍      | 762/2208 [04:32<08:42,  2.77it/s][A
Epoch 2/5:  35%|███▍      | 763/2208 [04:32<08:33,  2.82it/s][A
Epoch 2/5:  35%|███▍      | 764/2208 [04:32<08:38,  2.78it/s][A
Epoch 2/5:  35%|███▍      | 765/2208 [04:33<08:47,  2.73it/s][A
Epoch 2/5:  35%|███▍      | 766/2208 [04:33<08:53,  2.70it/s][A
Epoch 2/5:  35%|███▍    

Batch 775: Training accuracy = 0.8594, F1 = 0.8419, Precision = 0.8411, Recall = 0.8594



Epoch 2/5:  35%|███▌      | 777/2208 [04:37<08:23,  2.84it/s][A
Epoch 2/5:  35%|███▌      | 778/2208 [04:37<08:33,  2.78it/s][A
Epoch 2/5:  35%|███▌      | 779/2208 [04:38<08:25,  2.83it/s][A
Epoch 2/5:  35%|███▌      | 780/2208 [04:38<08:43,  2.73it/s][A
Epoch 2/5:  35%|███▌      | 781/2208 [04:39<08:44,  2.72it/s][A
Epoch 2/5:  35%|███▌      | 782/2208 [04:39<08:44,  2.72it/s][A
Epoch 2/5:  35%|███▌      | 783/2208 [04:39<08:34,  2.77it/s][A
Epoch 2/5:  36%|███▌      | 784/2208 [04:40<08:39,  2.74it/s][A
Epoch 2/5:  36%|███▌      | 785/2208 [04:40<08:39,  2.74it/s][A
Epoch 2/5:  36%|███▌      | 786/2208 [04:40<08:38,  2.74it/s][A
Epoch 2/5:  36%|███▌      | 787/2208 [04:41<08:40,  2.73it/s][A
Epoch 2/5:  36%|███▌      | 788/2208 [04:41<08:29,  2.79it/s][A
Epoch 2/5:  36%|███▌      | 789/2208 [04:41<08:21,  2.83it/s][A
Epoch 2/5:  36%|███▌      | 790/2208 [04:42<08:16,  2.86it/s][A
Epoch 2/5:  36%|███▌      | 791/2208 [04:42<08:18,  2.84it/s][A
Epoch 2/5:  36%|███▌    

Batch 800: Training accuracy = 0.9219, F1 = 0.9135, Precision = 0.9128, Recall = 0.9219



Epoch 2/5:  36%|███▋      | 802/2208 [04:46<08:10,  2.87it/s][A
Epoch 2/5:  36%|███▋      | 803/2208 [04:46<08:06,  2.89it/s][A
Epoch 2/5:  36%|███▋      | 804/2208 [04:47<08:03,  2.90it/s][A
Epoch 2/5:  36%|███▋      | 805/2208 [04:47<08:03,  2.90it/s][A
Epoch 2/5:  37%|███▋      | 806/2208 [04:47<08:01,  2.91it/s][A
Epoch 2/5:  37%|███▋      | 807/2208 [04:48<07:59,  2.92it/s][A
Epoch 2/5:  37%|███▋      | 808/2208 [04:48<07:59,  2.92it/s][A
Epoch 2/5:  37%|███▋      | 809/2208 [04:48<08:10,  2.85it/s][A
Epoch 2/5:  37%|███▋      | 810/2208 [04:49<08:04,  2.88it/s][A
Epoch 2/5:  37%|███▋      | 811/2208 [04:49<08:02,  2.89it/s][A
Epoch 2/5:  37%|███▋      | 812/2208 [04:49<08:13,  2.83it/s][A
Epoch 2/5:  37%|███▋      | 813/2208 [04:50<08:08,  2.86it/s][A
Epoch 2/5:  37%|███▋      | 814/2208 [04:50<08:05,  2.87it/s][A
Epoch 2/5:  37%|███▋      | 815/2208 [04:50<08:15,  2.81it/s][A
Epoch 2/5:  37%|███▋      | 816/2208 [04:51<08:09,  2.84it/s][A
Epoch 2/5:  37%|███▋    

Batch 825: Training accuracy = 0.8281, F1 = 0.8130, Precision = 0.8206, Recall = 0.8281



Epoch 2/5:  37%|███▋      | 827/2208 [04:55<08:22,  2.75it/s][A
Epoch 2/5:  38%|███▊      | 828/2208 [04:55<08:12,  2.80it/s][A
Epoch 2/5:  38%|███▊      | 829/2208 [04:56<08:21,  2.75it/s][A
Epoch 2/5:  38%|███▊      | 830/2208 [04:56<08:14,  2.79it/s][A
Epoch 2/5:  38%|███▊      | 831/2208 [04:56<08:08,  2.82it/s][A
Epoch 2/5:  38%|███▊      | 832/2208 [04:57<08:06,  2.83it/s][A
Epoch 2/5:  38%|███▊      | 833/2208 [04:57<08:01,  2.85it/s][A
Epoch 2/5:  38%|███▊      | 834/2208 [04:57<07:58,  2.87it/s][A
Epoch 2/5:  38%|███▊      | 835/2208 [04:58<07:56,  2.88it/s][A
Epoch 2/5:  38%|███▊      | 836/2208 [04:58<07:58,  2.87it/s][A
Epoch 2/5:  38%|███▊      | 837/2208 [04:58<07:54,  2.89it/s][A
Epoch 2/5:  38%|███▊      | 838/2208 [04:59<07:52,  2.90it/s][A
Epoch 2/5:  38%|███▊      | 839/2208 [04:59<07:50,  2.91it/s][A
Epoch 2/5:  38%|███▊      | 840/2208 [04:59<07:48,  2.92it/s][A
Epoch 2/5:  38%|███▊      | 841/2208 [05:00<07:50,  2.90it/s][A
Epoch 2/5:  38%|███▊    

Batch 850: Training accuracy = 0.7969, F1 = 0.7967, Precision = 0.8184, Recall = 0.7969



Epoch 2/5:  39%|███▊      | 852/2208 [05:04<07:59,  2.83it/s][A
Epoch 2/5:  39%|███▊      | 853/2208 [05:04<07:55,  2.85it/s][A
Epoch 2/5:  39%|███▊      | 854/2208 [05:04<07:53,  2.86it/s][A
Epoch 2/5:  39%|███▊      | 855/2208 [05:05<07:50,  2.88it/s][A
Epoch 2/5:  39%|███▉      | 856/2208 [05:05<07:54,  2.85it/s][A
Epoch 2/5:  39%|███▉      | 857/2208 [05:05<08:01,  2.81it/s][A
Epoch 2/5:  39%|███▉      | 858/2208 [05:06<07:53,  2.85it/s][A
Epoch 2/5:  39%|███▉      | 859/2208 [05:06<07:50,  2.87it/s][A
Epoch 2/5:  39%|███▉      | 860/2208 [05:06<07:46,  2.89it/s][A
Epoch 2/5:  39%|███▉      | 861/2208 [05:07<07:43,  2.91it/s][A
Epoch 2/5:  39%|███▉      | 862/2208 [05:07<07:45,  2.89it/s][A
Epoch 2/5:  39%|███▉      | 863/2208 [05:07<07:56,  2.82it/s][A
Epoch 2/5:  39%|███▉      | 864/2208 [05:08<08:03,  2.78it/s][A
Epoch 2/5:  39%|███▉      | 865/2208 [05:08<07:59,  2.80it/s][A
Epoch 2/5:  39%|███▉      | 866/2208 [05:08<07:57,  2.81it/s][A
Epoch 2/5:  39%|███▉    

Batch 875: Training accuracy = 0.8281, F1 = 0.8083, Precision = 0.8118, Recall = 0.8281



Epoch 2/5:  40%|███▉      | 877/2208 [05:12<07:59,  2.78it/s][A
Epoch 2/5:  40%|███▉      | 878/2208 [05:13<07:51,  2.82it/s][A
Epoch 2/5:  40%|███▉      | 879/2208 [05:13<07:45,  2.86it/s][A
Epoch 2/5:  40%|███▉      | 880/2208 [05:13<07:41,  2.88it/s][A
Epoch 2/5:  40%|███▉      | 881/2208 [05:14<07:38,  2.89it/s][A
Epoch 2/5:  40%|███▉      | 882/2208 [05:14<07:49,  2.82it/s][A
Epoch 2/5:  40%|███▉      | 883/2208 [05:15<07:54,  2.79it/s][A
Epoch 2/5:  40%|████      | 884/2208 [05:15<07:48,  2.82it/s][A
Epoch 2/5:  40%|████      | 885/2208 [05:15<07:48,  2.82it/s][A
Epoch 2/5:  40%|████      | 886/2208 [05:16<07:43,  2.85it/s][A
Epoch 2/5:  40%|████      | 887/2208 [05:16<07:56,  2.77it/s][A
Epoch 2/5:  40%|████      | 888/2208 [05:16<07:51,  2.80it/s][A
Epoch 2/5:  40%|████      | 889/2208 [05:17<07:44,  2.84it/s][A
Epoch 2/5:  40%|████      | 890/2208 [05:17<07:39,  2.87it/s][A
Epoch 2/5:  40%|████      | 891/2208 [05:17<07:38,  2.88it/s][A
Epoch 2/5:  40%|████    

Batch 900: Training accuracy = 0.8281, F1 = 0.8255, Precision = 0.8438, Recall = 0.8281



Epoch 2/5:  41%|████      | 902/2208 [05:21<07:48,  2.79it/s][A
Epoch 2/5:  41%|████      | 903/2208 [05:22<07:43,  2.81it/s][A
Epoch 2/5:  41%|████      | 904/2208 [05:22<07:47,  2.79it/s][A
Epoch 2/5:  41%|████      | 905/2208 [05:22<07:48,  2.78it/s][A
Epoch 2/5:  41%|████      | 906/2208 [05:23<07:44,  2.80it/s][A
Epoch 2/5:  41%|████      | 907/2208 [05:23<07:39,  2.83it/s][A
Epoch 2/5:  41%|████      | 908/2208 [05:23<07:46,  2.79it/s][A
Epoch 2/5:  41%|████      | 909/2208 [05:24<07:51,  2.76it/s][A
Epoch 2/5:  41%|████      | 910/2208 [05:24<07:51,  2.75it/s][A
Epoch 2/5:  41%|████▏     | 911/2208 [05:24<07:43,  2.80it/s][A
Epoch 2/5:  41%|████▏     | 912/2208 [05:25<07:39,  2.82it/s][A
Epoch 2/5:  41%|████▏     | 913/2208 [05:25<07:32,  2.86it/s][A
Epoch 2/5:  41%|████▏     | 914/2208 [05:26<07:30,  2.87it/s][A
Epoch 2/5:  41%|████▏     | 915/2208 [05:26<07:27,  2.89it/s][A
Epoch 2/5:  41%|████▏     | 916/2208 [05:26<07:32,  2.85it/s][A
Epoch 2/5:  42%|████▏   

Batch 925: Training accuracy = 0.8906, F1 = 0.8784, Precision = 0.8802, Recall = 0.8906



Epoch 2/5:  42%|████▏     | 927/2208 [05:30<07:30,  2.84it/s][A
Epoch 2/5:  42%|████▏     | 928/2208 [05:30<07:24,  2.88it/s][A
Epoch 2/5:  42%|████▏     | 929/2208 [05:31<07:23,  2.89it/s][A
Epoch 2/5:  42%|████▏     | 930/2208 [05:31<07:20,  2.90it/s][A
Epoch 2/5:  42%|████▏     | 931/2208 [05:31<07:17,  2.92it/s][A
Epoch 2/5:  42%|████▏     | 932/2208 [05:32<07:16,  2.93it/s][A
Epoch 2/5:  42%|████▏     | 933/2208 [05:32<07:17,  2.92it/s][A
Epoch 2/5:  42%|████▏     | 934/2208 [05:32<07:16,  2.92it/s][A
Epoch 2/5:  42%|████▏     | 935/2208 [05:33<07:14,  2.93it/s][A
Epoch 2/5:  42%|████▏     | 936/2208 [05:33<07:15,  2.92it/s][A
Epoch 2/5:  42%|████▏     | 937/2208 [05:34<07:15,  2.92it/s][A
Epoch 2/5:  42%|████▏     | 938/2208 [05:34<07:15,  2.91it/s][A
Epoch 2/5:  43%|████▎     | 939/2208 [05:34<07:13,  2.93it/s][A
Epoch 2/5:  43%|████▎     | 940/2208 [05:35<07:11,  2.94it/s][A
Epoch 2/5:  43%|████▎     | 941/2208 [05:35<07:12,  2.93it/s][A
Epoch 2/5:  43%|████▎   

Batch 950: Training accuracy = 0.8203, F1 = 0.8146, Precision = 0.8307, Recall = 0.8203



Epoch 2/5:  43%|████▎     | 952/2208 [05:39<07:23,  2.83it/s][A
Epoch 2/5:  43%|████▎     | 953/2208 [05:39<07:24,  2.82it/s][A
Epoch 2/5:  43%|████▎     | 954/2208 [05:40<07:18,  2.86it/s][A
Epoch 2/5:  43%|████▎     | 955/2208 [05:40<07:19,  2.85it/s][A
Epoch 2/5:  43%|████▎     | 956/2208 [05:40<07:18,  2.86it/s][A
Epoch 2/5:  43%|████▎     | 957/2208 [05:41<07:17,  2.86it/s][A
Epoch 2/5:  43%|████▎     | 958/2208 [05:41<07:17,  2.85it/s][A
Epoch 2/5:  43%|████▎     | 959/2208 [05:41<07:29,  2.78it/s][A
Epoch 2/5:  43%|████▎     | 960/2208 [05:42<07:20,  2.83it/s][A
Epoch 2/5:  44%|████▎     | 961/2208 [05:42<07:27,  2.79it/s][A
Epoch 2/5:  44%|████▎     | 962/2208 [05:42<07:28,  2.78it/s][A
Epoch 2/5:  44%|████▎     | 963/2208 [05:43<07:30,  2.76it/s][A
Epoch 2/5:  44%|████▎     | 964/2208 [05:43<07:22,  2.81it/s][A
Epoch 2/5:  44%|████▎     | 965/2208 [05:43<07:17,  2.84it/s][A
Epoch 2/5:  44%|████▍     | 966/2208 [05:44<07:28,  2.77it/s][A
Epoch 2/5:  44%|████▍   

Batch 975: Training accuracy = 0.8594, F1 = 0.8477, Precision = 0.8503, Recall = 0.8594



Epoch 2/5:  44%|████▍     | 977/2208 [05:48<07:06,  2.89it/s][A
Epoch 2/5:  44%|████▍     | 978/2208 [05:48<07:03,  2.90it/s][A
Epoch 2/5:  44%|████▍     | 979/2208 [05:48<07:01,  2.91it/s][A
Epoch 2/5:  44%|████▍     | 980/2208 [05:49<07:11,  2.84it/s][A
Epoch 2/5:  44%|████▍     | 981/2208 [05:49<07:14,  2.83it/s][A
Epoch 2/5:  44%|████▍     | 982/2208 [05:49<07:26,  2.74it/s][A
Epoch 2/5:  45%|████▍     | 983/2208 [05:50<07:28,  2.73it/s][A
Epoch 2/5:  45%|████▍     | 984/2208 [05:50<07:29,  2.72it/s][A
Epoch 2/5:  45%|████▍     | 985/2208 [05:51<07:19,  2.78it/s][A
Epoch 2/5:  45%|████▍     | 986/2208 [05:51<07:28,  2.72it/s][A
Epoch 2/5:  45%|████▍     | 987/2208 [05:51<07:26,  2.73it/s][A
Epoch 2/5:  45%|████▍     | 988/2208 [05:52<07:23,  2.75it/s][A
Epoch 2/5:  45%|████▍     | 989/2208 [05:52<07:16,  2.80it/s][A
Epoch 2/5:  45%|████▍     | 990/2208 [05:52<07:23,  2.75it/s][A
Epoch 2/5:  45%|████▍     | 991/2208 [05:53<07:14,  2.80it/s][A
Epoch 2/5:  45%|████▍   

Batch 1000: Training accuracy = 0.8438, F1 = 0.8321, Precision = 0.8461, Recall = 0.8438



Epoch 2/5:  45%|████▌     | 1002/2208 [05:57<07:07,  2.82it/s][A
Epoch 2/5:  45%|████▌     | 1003/2208 [05:57<07:06,  2.83it/s][A
Epoch 2/5:  45%|████▌     | 1004/2208 [05:57<07:03,  2.85it/s][A
Epoch 2/5:  46%|████▌     | 1005/2208 [05:58<07:00,  2.86it/s][A
Epoch 2/5:  46%|████▌     | 1006/2208 [05:58<06:58,  2.87it/s][A
Epoch 2/5:  46%|████▌     | 1007/2208 [05:58<07:03,  2.84it/s][A
Epoch 2/5:  46%|████▌     | 1008/2208 [05:59<06:57,  2.87it/s][A
Epoch 2/5:  46%|████▌     | 1009/2208 [05:59<06:55,  2.89it/s][A
Epoch 2/5:  46%|████▌     | 1010/2208 [05:59<07:07,  2.81it/s][A
Epoch 2/5:  46%|████▌     | 1011/2208 [06:00<07:02,  2.84it/s][A
Epoch 2/5:  46%|████▌     | 1012/2208 [06:00<07:08,  2.79it/s][A
Epoch 2/5:  46%|████▌     | 1013/2208 [06:00<07:01,  2.83it/s][A
Epoch 2/5:  46%|████▌     | 1014/2208 [06:01<07:02,  2.82it/s][A
Epoch 2/5:  46%|████▌     | 1015/2208 [06:01<07:04,  2.81it/s][A
Epoch 2/5:  46%|████▌     | 1016/2208 [06:02<07:00,  2.84it/s][A
Epoch 2/5

Batch 1025: Training accuracy = 0.8438, F1 = 0.8229, Precision = 0.8141, Recall = 0.8438



Epoch 2/5:  47%|████▋     | 1027/2208 [06:05<06:59,  2.81it/s][A
Epoch 2/5:  47%|████▋     | 1028/2208 [06:06<07:04,  2.78it/s][A
Epoch 2/5:  47%|████▋     | 1029/2208 [06:06<07:00,  2.81it/s][A
Epoch 2/5:  47%|████▋     | 1030/2208 [06:07<06:56,  2.83it/s][A
Epoch 2/5:  47%|████▋     | 1031/2208 [06:07<07:03,  2.78it/s][A
Epoch 2/5:  47%|████▋     | 1032/2208 [06:07<07:07,  2.75it/s][A
Epoch 2/5:  47%|████▋     | 1033/2208 [06:08<07:10,  2.73it/s][A
Epoch 2/5:  47%|████▋     | 1034/2208 [06:08<07:12,  2.71it/s][A
Epoch 2/5:  47%|████▋     | 1035/2208 [06:08<07:11,  2.72it/s][A
Epoch 2/5:  47%|████▋     | 1036/2208 [06:09<07:14,  2.70it/s][A
Epoch 2/5:  47%|████▋     | 1037/2208 [06:09<07:06,  2.75it/s][A
Epoch 2/5:  47%|████▋     | 1038/2208 [06:09<06:56,  2.81it/s][A
Epoch 2/5:  47%|████▋     | 1039/2208 [06:10<06:57,  2.80it/s][A
Epoch 2/5:  47%|████▋     | 1040/2208 [06:10<07:09,  2.72it/s][A
Epoch 2/5:  47%|████▋     | 1041/2208 [06:11<07:01,  2.77it/s][A
Epoch 2/5

Batch 1050: Training accuracy = 0.8516, F1 = 0.8365, Precision = 0.8346, Recall = 0.8516



Epoch 2/5:  48%|████▊     | 1052/2208 [06:14<06:50,  2.82it/s][A
Epoch 2/5:  48%|████▊     | 1053/2208 [06:15<06:46,  2.84it/s][A
Epoch 2/5:  48%|████▊     | 1054/2208 [06:15<06:47,  2.83it/s][A
Epoch 2/5:  48%|████▊     | 1055/2208 [06:15<06:43,  2.86it/s][A
Epoch 2/5:  48%|████▊     | 1056/2208 [06:16<06:50,  2.81it/s][A
Epoch 2/5:  48%|████▊     | 1057/2208 [06:16<06:51,  2.80it/s][A
Epoch 2/5:  48%|████▊     | 1058/2208 [06:17<06:44,  2.84it/s][A
Epoch 2/5:  48%|████▊     | 1059/2208 [06:17<06:44,  2.84it/s][A
Epoch 2/5:  48%|████▊     | 1060/2208 [06:17<06:40,  2.87it/s][A
Epoch 2/5:  48%|████▊     | 1061/2208 [06:18<06:37,  2.89it/s][A
Epoch 2/5:  48%|████▊     | 1062/2208 [06:18<06:43,  2.84it/s][A
Epoch 2/5:  48%|████▊     | 1063/2208 [06:18<06:40,  2.86it/s][A
Epoch 2/5:  48%|████▊     | 1064/2208 [06:19<06:36,  2.89it/s][A
Epoch 2/5:  48%|████▊     | 1065/2208 [06:19<06:47,  2.81it/s][A
Epoch 2/5:  48%|████▊     | 1066/2208 [06:19<06:41,  2.84it/s][A
Epoch 2/5

Batch 1075: Training accuracy = 0.8516, F1 = 0.8490, Precision = 0.8633, Recall = 0.8516



Epoch 2/5:  49%|████▉     | 1077/2208 [06:23<06:48,  2.77it/s][A
Epoch 2/5:  49%|████▉     | 1078/2208 [06:24<06:55,  2.72it/s][A
Epoch 2/5:  49%|████▉     | 1079/2208 [06:24<06:51,  2.74it/s][A
Epoch 2/5:  49%|████▉     | 1080/2208 [06:24<06:49,  2.75it/s][A
Epoch 2/5:  49%|████▉     | 1081/2208 [06:25<06:47,  2.77it/s][A
Epoch 2/5:  49%|████▉     | 1082/2208 [06:25<06:58,  2.69it/s][A
Epoch 2/5:  49%|████▉     | 1083/2208 [06:26<06:56,  2.70it/s][A
Epoch 2/5:  49%|████▉     | 1084/2208 [06:26<06:49,  2.75it/s][A
Epoch 2/5:  49%|████▉     | 1085/2208 [06:26<06:43,  2.78it/s][A
Epoch 2/5:  49%|████▉     | 1086/2208 [06:27<06:41,  2.80it/s][A
Epoch 2/5:  49%|████▉     | 1087/2208 [06:27<06:41,  2.80it/s][A
Epoch 2/5:  49%|████▉     | 1088/2208 [06:27<06:44,  2.77it/s][A
Epoch 2/5:  49%|████▉     | 1089/2208 [06:28<06:35,  2.83it/s][A
Epoch 2/5:  49%|████▉     | 1090/2208 [06:28<06:30,  2.86it/s][A
Epoch 2/5:  49%|████▉     | 1091/2208 [06:28<06:27,  2.88it/s][A
Epoch 2/5

Batch 1100: Training accuracy = 0.8594, F1 = 0.8542, Precision = 0.8646, Recall = 0.8594



Epoch 2/5:  50%|████▉     | 1102/2208 [06:32<06:34,  2.80it/s][A
Epoch 2/5:  50%|████▉     | 1103/2208 [06:33<06:33,  2.81it/s][A
Epoch 2/5:  50%|█████     | 1104/2208 [06:33<06:29,  2.84it/s][A
Epoch 2/5:  50%|█████     | 1105/2208 [06:33<06:24,  2.87it/s][A
Epoch 2/5:  50%|█████     | 1106/2208 [06:34<06:30,  2.82it/s][A
Epoch 2/5:  50%|█████     | 1107/2208 [06:34<06:28,  2.83it/s][A
Epoch 2/5:  50%|█████     | 1108/2208 [06:34<06:25,  2.85it/s][A
Epoch 2/5:  50%|█████     | 1109/2208 [06:35<06:24,  2.86it/s][A
Epoch 2/5:  50%|█████     | 1110/2208 [06:35<06:24,  2.85it/s][A
Epoch 2/5:  50%|█████     | 1111/2208 [06:35<06:32,  2.79it/s][A
Epoch 2/5:  50%|█████     | 1112/2208 [06:36<06:28,  2.82it/s][A
Epoch 2/5:  50%|█████     | 1113/2208 [06:36<06:23,  2.85it/s][A
Epoch 2/5:  50%|█████     | 1114/2208 [06:36<06:22,  2.86it/s][A
Epoch 2/5:  50%|█████     | 1115/2208 [06:37<06:24,  2.84it/s][A
Epoch 2/5:  51%|█████     | 1116/2208 [06:37<06:31,  2.79it/s][A
Epoch 2/5

Batch 1125: Training accuracy = 0.8516, F1 = 0.8334, Precision = 0.8353, Recall = 0.8516



Epoch 2/5:  51%|█████     | 1127/2208 [06:41<06:37,  2.72it/s][A
Epoch 2/5:  51%|█████     | 1128/2208 [06:42<06:46,  2.65it/s][A
Epoch 2/5:  51%|█████     | 1129/2208 [06:42<06:39,  2.70it/s][A
Epoch 2/5:  51%|█████     | 1130/2208 [06:42<06:31,  2.75it/s][A
Epoch 2/5:  51%|█████     | 1131/2208 [06:43<06:27,  2.78it/s][A
Epoch 2/5:  51%|█████▏    | 1132/2208 [06:43<06:22,  2.81it/s][A
Epoch 2/5:  51%|█████▏    | 1133/2208 [06:43<06:18,  2.84it/s][A
Epoch 2/5:  51%|█████▏    | 1134/2208 [06:44<06:22,  2.81it/s][A
Epoch 2/5:  51%|█████▏    | 1135/2208 [06:44<06:29,  2.76it/s][A
Epoch 2/5:  51%|█████▏    | 1136/2208 [06:44<06:25,  2.78it/s][A
Epoch 2/5:  51%|█████▏    | 1137/2208 [06:45<06:20,  2.82it/s][A
Epoch 2/5:  52%|█████▏    | 1138/2208 [06:45<06:27,  2.76it/s][A
Epoch 2/5:  52%|█████▏    | 1139/2208 [06:45<06:19,  2.81it/s][A
Epoch 2/5:  52%|█████▏    | 1140/2208 [06:46<06:25,  2.77it/s][A
Epoch 2/5:  52%|█████▏    | 1141/2208 [06:46<06:19,  2.81it/s][A
Epoch 2/5

Batch 1150: Training accuracy = 0.8516, F1 = 0.8503, Precision = 0.8646, Recall = 0.8516



Epoch 2/5:  52%|█████▏    | 1152/2208 [06:50<06:09,  2.86it/s][A
Epoch 2/5:  52%|█████▏    | 1153/2208 [06:50<06:05,  2.89it/s][A
Epoch 2/5:  52%|█████▏    | 1154/2208 [06:51<06:17,  2.79it/s][A
Epoch 2/5:  52%|█████▏    | 1155/2208 [06:51<06:19,  2.77it/s][A
Epoch 2/5:  52%|█████▏    | 1156/2208 [06:51<06:19,  2.77it/s][A
Epoch 2/5:  52%|█████▏    | 1157/2208 [06:52<06:11,  2.83it/s][A
Epoch 2/5:  52%|█████▏    | 1158/2208 [06:52<06:24,  2.73it/s][A
Epoch 2/5:  52%|█████▏    | 1159/2208 [06:53<06:20,  2.75it/s][A
Epoch 2/5:  53%|█████▎    | 1160/2208 [06:53<06:15,  2.79it/s][A
Epoch 2/5:  53%|█████▎    | 1161/2208 [06:53<06:26,  2.71it/s][A
Epoch 2/5:  53%|█████▎    | 1162/2208 [06:54<06:25,  2.71it/s][A
Epoch 2/5:  53%|█████▎    | 1163/2208 [06:54<06:27,  2.70it/s][A
Epoch 2/5:  53%|█████▎    | 1164/2208 [06:54<06:33,  2.66it/s][A
Epoch 2/5:  53%|█████▎    | 1165/2208 [06:55<06:29,  2.67it/s][A
Epoch 2/5:  53%|█████▎    | 1166/2208 [06:55<06:20,  2.74it/s][A
Epoch 2/5

Batch 1175: Training accuracy = 0.8828, F1 = 0.8753, Precision = 0.8917, Recall = 0.8828



Epoch 2/5:  53%|█████▎    | 1177/2208 [06:59<06:01,  2.85it/s][A
Epoch 2/5:  53%|█████▎    | 1178/2208 [06:59<06:01,  2.85it/s][A
Epoch 2/5:  53%|█████▎    | 1179/2208 [07:00<05:58,  2.87it/s][A
Epoch 2/5:  53%|█████▎    | 1180/2208 [07:00<06:10,  2.77it/s][A
Epoch 2/5:  53%|█████▎    | 1181/2208 [07:01<06:06,  2.80it/s][A
Epoch 2/5:  54%|█████▎    | 1182/2208 [07:01<06:02,  2.83it/s][A
Epoch 2/5:  54%|█████▎    | 1183/2208 [07:01<06:01,  2.84it/s][A
Epoch 2/5:  54%|█████▎    | 1184/2208 [07:02<05:58,  2.86it/s][A
Epoch 2/5:  54%|█████▎    | 1185/2208 [07:02<06:03,  2.81it/s][A
Epoch 2/5:  54%|█████▎    | 1186/2208 [07:02<06:03,  2.81it/s][A
Epoch 2/5:  54%|█████▍    | 1187/2208 [07:03<05:59,  2.84it/s][A
Epoch 2/5:  54%|█████▍    | 1188/2208 [07:03<05:54,  2.88it/s][A
Epoch 2/5:  54%|█████▍    | 1189/2208 [07:03<05:52,  2.89it/s][A
Epoch 2/5:  54%|█████▍    | 1190/2208 [07:04<05:53,  2.88it/s][A
Epoch 2/5:  54%|█████▍    | 1191/2208 [07:04<05:59,  2.83it/s][A
Epoch 2/5

Batch 1200: Training accuracy = 0.8203, F1 = 0.8066, Precision = 0.8136, Recall = 0.8203



Epoch 2/5:  54%|█████▍    | 1202/2208 [07:08<05:59,  2.80it/s][A
Epoch 2/5:  54%|█████▍    | 1203/2208 [07:08<05:52,  2.85it/s][A
Epoch 2/5:  55%|█████▍    | 1204/2208 [07:09<05:56,  2.81it/s][A
Epoch 2/5:  55%|█████▍    | 1205/2208 [07:09<05:55,  2.82it/s][A
Epoch 2/5:  55%|█████▍    | 1206/2208 [07:09<05:52,  2.85it/s][A
Epoch 2/5:  55%|█████▍    | 1207/2208 [07:10<05:48,  2.87it/s][A
Epoch 2/5:  55%|█████▍    | 1208/2208 [07:10<05:57,  2.80it/s][A
Epoch 2/5:  55%|█████▍    | 1209/2208 [07:10<05:57,  2.80it/s][A
Epoch 2/5:  55%|█████▍    | 1210/2208 [07:11<05:59,  2.78it/s][A
Epoch 2/5:  55%|█████▍    | 1211/2208 [07:11<06:10,  2.69it/s][A
Epoch 2/5:  55%|█████▍    | 1212/2208 [07:11<05:59,  2.77it/s][A
Epoch 2/5:  55%|█████▍    | 1213/2208 [07:12<05:53,  2.82it/s][A
Epoch 2/5:  55%|█████▍    | 1214/2208 [07:12<05:54,  2.80it/s][A
Epoch 2/5:  55%|█████▌    | 1215/2208 [07:13<06:03,  2.73it/s][A
Epoch 2/5:  55%|█████▌    | 1216/2208 [07:13<05:57,  2.77it/s][A
Epoch 2/5

Batch 1225: Training accuracy = 0.8906, F1 = 0.8862, Precision = 0.8919, Recall = 0.8906



Epoch 2/5:  56%|█████▌    | 1227/2208 [07:17<05:43,  2.86it/s][A
Epoch 2/5:  56%|█████▌    | 1228/2208 [07:17<05:46,  2.83it/s][A
Epoch 2/5:  56%|█████▌    | 1229/2208 [07:17<05:42,  2.85it/s][A
Epoch 2/5:  56%|█████▌    | 1230/2208 [07:18<05:39,  2.88it/s][A
Epoch 2/5:  56%|█████▌    | 1231/2208 [07:18<05:46,  2.82it/s][A
Epoch 2/5:  56%|█████▌    | 1232/2208 [07:19<05:44,  2.83it/s][A
Epoch 2/5:  56%|█████▌    | 1233/2208 [07:19<05:41,  2.86it/s][A
Epoch 2/5:  56%|█████▌    | 1234/2208 [07:19<05:41,  2.85it/s][A
Epoch 2/5:  56%|█████▌    | 1235/2208 [07:20<05:53,  2.75it/s][A
Epoch 2/5:  56%|█████▌    | 1236/2208 [07:20<05:51,  2.76it/s][A
Epoch 2/5:  56%|█████▌    | 1237/2208 [07:20<05:46,  2.80it/s][A
Epoch 2/5:  56%|█████▌    | 1238/2208 [07:21<05:45,  2.81it/s][A
Epoch 2/5:  56%|█████▌    | 1239/2208 [07:21<05:47,  2.79it/s][A
Epoch 2/5:  56%|█████▌    | 1240/2208 [07:21<05:41,  2.83it/s][A
Epoch 2/5:  56%|█████▌    | 1241/2208 [07:22<05:46,  2.79it/s][A
Epoch 2/5

Batch 1250: Training accuracy = 0.8906, F1 = 0.8760, Precision = 0.8750, Recall = 0.8906



Epoch 2/5:  57%|█████▋    | 1252/2208 [07:26<05:37,  2.84it/s][A
Epoch 2/5:  57%|█████▋    | 1253/2208 [07:26<05:36,  2.84it/s][A
Epoch 2/5:  57%|█████▋    | 1254/2208 [07:26<05:33,  2.86it/s][A
Epoch 2/5:  57%|█████▋    | 1255/2208 [07:27<05:30,  2.88it/s][A
Epoch 2/5:  57%|█████▋    | 1256/2208 [07:27<05:38,  2.81it/s][A
Epoch 2/5:  57%|█████▋    | 1257/2208 [07:27<05:33,  2.85it/s][A
Epoch 2/5:  57%|█████▋    | 1258/2208 [07:28<05:30,  2.88it/s][A
Epoch 2/5:  57%|█████▋    | 1259/2208 [07:28<05:44,  2.75it/s][A
Epoch 2/5:  57%|█████▋    | 1260/2208 [07:29<05:37,  2.81it/s][A
Epoch 2/5:  57%|█████▋    | 1261/2208 [07:29<05:43,  2.75it/s][A
Epoch 2/5:  57%|█████▋    | 1262/2208 [07:29<05:47,  2.73it/s][A
Epoch 2/5:  57%|█████▋    | 1263/2208 [07:30<05:43,  2.75it/s][A
Epoch 2/5:  57%|█████▋    | 1264/2208 [07:30<05:44,  2.74it/s][A
Epoch 2/5:  57%|█████▋    | 1265/2208 [07:30<05:39,  2.78it/s][A
Epoch 2/5:  57%|█████▋    | 1266/2208 [07:31<05:44,  2.73it/s][A
Epoch 2/5

Batch 1275: Training accuracy = 0.8594, F1 = 0.8430, Precision = 0.8522, Recall = 0.8594



Epoch 2/5:  58%|█████▊    | 1277/2208 [07:35<05:23,  2.87it/s][A
Epoch 2/5:  58%|█████▊    | 1278/2208 [07:35<05:23,  2.87it/s][A
Epoch 2/5:  58%|█████▊    | 1279/2208 [07:35<05:28,  2.83it/s][A
Epoch 2/5:  58%|█████▊    | 1280/2208 [07:36<05:25,  2.85it/s][A
Epoch 2/5:  58%|█████▊    | 1281/2208 [07:36<05:34,  2.77it/s][A
Epoch 2/5:  58%|█████▊    | 1282/2208 [07:36<05:38,  2.73it/s][A
Epoch 2/5:  58%|█████▊    | 1283/2208 [07:37<05:41,  2.71it/s][A
Epoch 2/5:  58%|█████▊    | 1284/2208 [07:37<05:41,  2.70it/s][A
Epoch 2/5:  58%|█████▊    | 1285/2208 [07:38<05:41,  2.71it/s][A
Epoch 2/5:  58%|█████▊    | 1286/2208 [07:38<05:32,  2.77it/s][A
Epoch 2/5:  58%|█████▊    | 1287/2208 [07:38<05:45,  2.67it/s][A
Epoch 2/5:  58%|█████▊    | 1288/2208 [07:39<05:36,  2.74it/s][A
Epoch 2/5:  58%|█████▊    | 1289/2208 [07:39<05:38,  2.72it/s][A
Epoch 2/5:  58%|█████▊    | 1290/2208 [07:39<05:31,  2.77it/s][A
Epoch 2/5:  58%|█████▊    | 1291/2208 [07:40<05:27,  2.80it/s][A
Epoch 2/5

Batch 1300: Training accuracy = 0.8516, F1 = 0.8307, Precision = 0.8336, Recall = 0.8516



Epoch 2/5:  59%|█████▉    | 1302/2208 [07:44<05:16,  2.86it/s][A
Epoch 2/5:  59%|█████▉    | 1303/2208 [07:44<05:13,  2.88it/s][A
Epoch 2/5:  59%|█████▉    | 1304/2208 [07:44<05:11,  2.90it/s][A
Epoch 2/5:  59%|█████▉    | 1305/2208 [07:45<05:17,  2.85it/s][A
Epoch 2/5:  59%|█████▉    | 1306/2208 [07:45<05:13,  2.87it/s][A
Epoch 2/5:  59%|█████▉    | 1307/2208 [07:45<05:10,  2.90it/s][A
Epoch 2/5:  59%|█████▉    | 1308/2208 [07:46<05:16,  2.85it/s][A
Epoch 2/5:  59%|█████▉    | 1309/2208 [07:46<05:21,  2.79it/s][A
Epoch 2/5:  59%|█████▉    | 1310/2208 [07:46<05:18,  2.82it/s][A
Epoch 2/5:  59%|█████▉    | 1311/2208 [07:47<05:23,  2.77it/s][A
Epoch 2/5:  59%|█████▉    | 1312/2208 [07:47<05:23,  2.77it/s][A
Epoch 2/5:  59%|█████▉    | 1313/2208 [07:47<05:26,  2.74it/s][A
Epoch 2/5:  60%|█████▉    | 1314/2208 [07:48<05:21,  2.78it/s][A
Epoch 2/5:  60%|█████▉    | 1315/2208 [07:48<05:15,  2.83it/s][A
Epoch 2/5:  60%|█████▉    | 1316/2208 [07:48<05:11,  2.87it/s][A
Epoch 2/5

Batch 1325: Training accuracy = 0.9219, F1 = 0.9224, Precision = 0.9336, Recall = 0.9219



Epoch 2/5:  60%|██████    | 1327/2208 [07:52<05:29,  2.67it/s][A
Epoch 2/5:  60%|██████    | 1328/2208 [07:53<05:30,  2.66it/s][A
Epoch 2/5:  60%|██████    | 1329/2208 [07:53<05:23,  2.72it/s][A
Epoch 2/5:  60%|██████    | 1330/2208 [07:54<05:24,  2.71it/s][A
Epoch 2/5:  60%|██████    | 1331/2208 [07:54<05:28,  2.67it/s][A
Epoch 2/5:  60%|██████    | 1332/2208 [07:54<05:20,  2.73it/s][A
Epoch 2/5:  60%|██████    | 1333/2208 [07:55<05:15,  2.77it/s][A
Epoch 2/5:  60%|██████    | 1334/2208 [07:55<05:12,  2.80it/s][A
Epoch 2/5:  60%|██████    | 1335/2208 [07:55<05:10,  2.81it/s][A
Epoch 2/5:  61%|██████    | 1336/2208 [07:56<05:07,  2.83it/s][A
Epoch 2/5:  61%|██████    | 1337/2208 [07:56<05:06,  2.84it/s][A
Epoch 2/5:  61%|██████    | 1338/2208 [07:56<05:06,  2.84it/s][A
Epoch 2/5:  61%|██████    | 1339/2208 [07:57<05:12,  2.78it/s][A
Epoch 2/5:  61%|██████    | 1340/2208 [07:57<05:09,  2.80it/s][A
Epoch 2/5:  61%|██████    | 1341/2208 [07:58<05:21,  2.69it/s][A
Epoch 2/5

Batch 1350: Training accuracy = 0.8281, F1 = 0.8247, Precision = 0.8385, Recall = 0.8281



Epoch 2/5:  61%|██████    | 1352/2208 [08:02<05:12,  2.74it/s][A
Epoch 2/5:  61%|██████▏   | 1353/2208 [08:02<05:05,  2.80it/s][A
Epoch 2/5:  61%|██████▏   | 1354/2208 [08:02<05:08,  2.76it/s][A
Epoch 2/5:  61%|██████▏   | 1355/2208 [08:03<05:03,  2.81it/s][A
Epoch 2/5:  61%|██████▏   | 1356/2208 [08:03<05:00,  2.84it/s][A
Epoch 2/5:  61%|██████▏   | 1357/2208 [08:03<04:56,  2.87it/s][A
Epoch 2/5:  62%|██████▏   | 1358/2208 [08:04<04:54,  2.89it/s][A
Epoch 2/5:  62%|██████▏   | 1359/2208 [08:04<04:53,  2.89it/s][A
Epoch 2/5:  62%|██████▏   | 1360/2208 [08:04<05:00,  2.82it/s][A
Epoch 2/5:  62%|██████▏   | 1361/2208 [08:05<04:58,  2.83it/s][A
Epoch 2/5:  62%|██████▏   | 1362/2208 [08:05<05:01,  2.81it/s][A
Epoch 2/5:  62%|██████▏   | 1363/2208 [08:05<05:05,  2.77it/s][A
Epoch 2/5:  62%|██████▏   | 1364/2208 [08:06<05:00,  2.81it/s][A
Epoch 2/5:  62%|██████▏   | 1365/2208 [08:06<04:58,  2.82it/s][A
Epoch 2/5:  62%|██████▏   | 1366/2208 [08:06<05:01,  2.80it/s][A
Epoch 2/5

Batch 1375: Training accuracy = 0.8516, F1 = 0.8503, Precision = 0.8698, Recall = 0.8516



Epoch 2/5:  62%|██████▏   | 1377/2208 [08:10<04:55,  2.81it/s][A
Epoch 2/5:  62%|██████▏   | 1378/2208 [08:11<04:50,  2.86it/s][A
Epoch 2/5:  62%|██████▏   | 1379/2208 [08:11<04:48,  2.88it/s][A
Epoch 2/5:  62%|██████▎   | 1380/2208 [08:12<04:45,  2.90it/s][A
Epoch 2/5:  63%|██████▎   | 1381/2208 [08:12<04:44,  2.91it/s][A
Epoch 2/5:  63%|██████▎   | 1382/2208 [08:12<04:42,  2.92it/s][A
Epoch 2/5:  63%|██████▎   | 1383/2208 [08:13<04:48,  2.86it/s][A
Epoch 2/5:  63%|██████▎   | 1384/2208 [08:13<04:52,  2.82it/s][A
Epoch 2/5:  63%|██████▎   | 1385/2208 [08:13<04:49,  2.84it/s][A
Epoch 2/5:  63%|██████▎   | 1386/2208 [08:14<04:46,  2.87it/s][A
Epoch 2/5:  63%|██████▎   | 1387/2208 [08:14<04:49,  2.83it/s][A
Epoch 2/5:  63%|██████▎   | 1388/2208 [08:14<04:49,  2.83it/s][A
Epoch 2/5:  63%|██████▎   | 1389/2208 [08:15<04:47,  2.85it/s][A
Epoch 2/5:  63%|██████▎   | 1390/2208 [08:15<04:46,  2.86it/s][A
Epoch 2/5:  63%|██████▎   | 1391/2208 [08:15<04:46,  2.85it/s][A
Epoch 2/5

Batch 1400: Training accuracy = 0.8750, F1 = 0.8776, Precision = 0.9000, Recall = 0.8750



Epoch 2/5:  63%|██████▎   | 1402/2208 [08:19<04:51,  2.76it/s][A
Epoch 2/5:  64%|██████▎   | 1403/2208 [08:20<04:57,  2.71it/s][A
Epoch 2/5:  64%|██████▎   | 1404/2208 [08:20<04:51,  2.75it/s][A
Epoch 2/5:  64%|██████▎   | 1405/2208 [08:20<04:47,  2.79it/s][A
Epoch 2/5:  64%|██████▎   | 1406/2208 [08:21<04:56,  2.71it/s][A
Epoch 2/5:  64%|██████▎   | 1407/2208 [08:21<04:49,  2.76it/s][A
Epoch 2/5:  64%|██████▍   | 1408/2208 [08:21<04:49,  2.77it/s][A
Epoch 2/5:  64%|██████▍   | 1409/2208 [08:22<04:44,  2.81it/s][A
Epoch 2/5:  64%|██████▍   | 1410/2208 [08:22<04:42,  2.83it/s][A
Epoch 2/5:  64%|██████▍   | 1411/2208 [08:23<04:41,  2.83it/s][A
Epoch 2/5:  64%|██████▍   | 1412/2208 [08:23<04:47,  2.77it/s][A
Epoch 2/5:  64%|██████▍   | 1413/2208 [08:23<04:53,  2.71it/s][A
Epoch 2/5:  64%|██████▍   | 1414/2208 [08:24<04:51,  2.73it/s][A
Epoch 2/5:  64%|██████▍   | 1415/2208 [08:24<04:47,  2.76it/s][A
Epoch 2/5:  64%|██████▍   | 1416/2208 [08:24<04:50,  2.73it/s][A
Epoch 2/5

Batch 1425: Training accuracy = 0.7969, F1 = 0.7906, Precision = 0.8047, Recall = 0.7969



Epoch 2/5:  65%|██████▍   | 1427/2208 [08:28<04:38,  2.81it/s][A
Epoch 2/5:  65%|██████▍   | 1428/2208 [08:29<04:40,  2.78it/s][A
Epoch 2/5:  65%|██████▍   | 1429/2208 [08:29<04:45,  2.72it/s][A
Epoch 2/5:  65%|██████▍   | 1430/2208 [08:29<04:49,  2.68it/s][A
Epoch 2/5:  65%|██████▍   | 1431/2208 [08:30<04:41,  2.76it/s][A
Epoch 2/5:  65%|██████▍   | 1432/2208 [08:30<04:36,  2.80it/s][A
Epoch 2/5:  65%|██████▍   | 1433/2208 [08:30<04:37,  2.79it/s][A
Epoch 2/5:  65%|██████▍   | 1434/2208 [08:31<04:33,  2.83it/s][A
Epoch 2/5:  65%|██████▍   | 1435/2208 [08:31<04:30,  2.86it/s][A
Epoch 2/5:  65%|██████▌   | 1436/2208 [08:32<04:30,  2.85it/s][A
Epoch 2/5:  65%|██████▌   | 1437/2208 [08:32<04:28,  2.88it/s][A
Epoch 2/5:  65%|██████▌   | 1438/2208 [08:32<04:25,  2.90it/s][A
Epoch 2/5:  65%|██████▌   | 1439/2208 [08:33<04:25,  2.90it/s][A
Epoch 2/5:  65%|██████▌   | 1440/2208 [08:33<04:23,  2.91it/s][A
Epoch 2/5:  65%|██████▌   | 1441/2208 [08:33<04:24,  2.90it/s][A
Epoch 2/5

Batch 1450: Training accuracy = 0.8906, F1 = 0.8771, Precision = 0.8776, Recall = 0.8906



Epoch 2/5:  66%|██████▌   | 1452/2208 [08:37<04:45,  2.65it/s][A
Epoch 2/5:  66%|██████▌   | 1453/2208 [08:38<04:36,  2.73it/s][A
Epoch 2/5:  66%|██████▌   | 1454/2208 [08:38<04:32,  2.77it/s][A
Epoch 2/5:  66%|██████▌   | 1455/2208 [08:38<04:30,  2.79it/s][A
Epoch 2/5:  66%|██████▌   | 1456/2208 [08:39<04:26,  2.83it/s][A
Epoch 2/5:  66%|██████▌   | 1457/2208 [08:39<04:27,  2.81it/s][A
Epoch 2/5:  66%|██████▌   | 1458/2208 [08:39<04:22,  2.85it/s][A
Epoch 2/5:  66%|██████▌   | 1459/2208 [08:40<04:20,  2.87it/s][A
Epoch 2/5:  66%|██████▌   | 1460/2208 [08:40<04:18,  2.89it/s][A
Epoch 2/5:  66%|██████▌   | 1461/2208 [08:40<04:19,  2.88it/s][A
Epoch 2/5:  66%|██████▌   | 1462/2208 [08:41<04:17,  2.90it/s][A
Epoch 2/5:  66%|██████▋   | 1463/2208 [08:41<04:15,  2.91it/s][A
Epoch 2/5:  66%|██████▋   | 1464/2208 [08:41<04:21,  2.85it/s][A
Epoch 2/5:  66%|██████▋   | 1465/2208 [08:42<04:18,  2.87it/s][A
Epoch 2/5:  66%|██████▋   | 1466/2208 [08:42<04:16,  2.89it/s][A
Epoch 2/5

Batch 1475: Training accuracy = 0.8359, F1 = 0.8333, Precision = 0.8477, Recall = 0.8359



Epoch 2/5:  67%|██████▋   | 1477/2208 [08:46<04:15,  2.86it/s][A
Epoch 2/5:  67%|██████▋   | 1478/2208 [08:46<04:12,  2.89it/s][A
Epoch 2/5:  67%|██████▋   | 1479/2208 [08:47<04:12,  2.89it/s][A
Epoch 2/5:  67%|██████▋   | 1480/2208 [08:47<04:11,  2.89it/s][A
Epoch 2/5:  67%|██████▋   | 1481/2208 [08:47<04:13,  2.87it/s][A
Epoch 2/5:  67%|██████▋   | 1482/2208 [08:48<04:21,  2.77it/s][A
Epoch 2/5:  67%|██████▋   | 1483/2208 [08:48<04:17,  2.81it/s][A
Epoch 2/5:  67%|██████▋   | 1484/2208 [08:48<04:15,  2.83it/s][A
Epoch 2/5:  67%|██████▋   | 1485/2208 [08:49<04:15,  2.83it/s][A
Epoch 2/5:  67%|██████▋   | 1486/2208 [08:49<04:15,  2.82it/s][A
Epoch 2/5:  67%|██████▋   | 1487/2208 [08:50<04:18,  2.79it/s][A
Epoch 2/5:  67%|██████▋   | 1488/2208 [08:50<04:16,  2.80it/s][A
Epoch 2/5:  67%|██████▋   | 1489/2208 [08:50<04:15,  2.81it/s][A
Epoch 2/5:  67%|██████▋   | 1490/2208 [08:51<04:21,  2.74it/s][A
Epoch 2/5:  68%|██████▊   | 1491/2208 [08:51<04:17,  2.79it/s][A
Epoch 2/5

Batch 1500: Training accuracy = 0.8672, F1 = 0.8483, Precision = 0.8435, Recall = 0.8672



Epoch 2/5:  68%|██████▊   | 1502/2208 [08:55<04:14,  2.77it/s][A
Epoch 2/5:  68%|██████▊   | 1503/2208 [08:55<04:10,  2.81it/s][A
Epoch 2/5:  68%|██████▊   | 1504/2208 [08:56<04:09,  2.82it/s][A
Epoch 2/5:  68%|██████▊   | 1505/2208 [08:56<04:13,  2.77it/s][A
Epoch 2/5:  68%|██████▊   | 1506/2208 [08:56<04:14,  2.76it/s][A
Epoch 2/5:  68%|██████▊   | 1507/2208 [08:57<04:08,  2.82it/s][A
Epoch 2/5:  68%|██████▊   | 1508/2208 [08:57<04:04,  2.86it/s][A
Epoch 2/5:  68%|██████▊   | 1509/2208 [08:57<04:08,  2.81it/s][A
Epoch 2/5:  68%|██████▊   | 1510/2208 [08:58<04:04,  2.85it/s][A
Epoch 2/5:  68%|██████▊   | 1511/2208 [08:58<04:02,  2.88it/s][A
Epoch 2/5:  68%|██████▊   | 1512/2208 [08:58<04:00,  2.89it/s][A
Epoch 2/5:  69%|██████▊   | 1513/2208 [08:59<04:07,  2.80it/s][A
Epoch 2/5:  69%|██████▊   | 1514/2208 [08:59<04:09,  2.78it/s][A
Epoch 2/5:  69%|██████▊   | 1515/2208 [09:00<04:11,  2.75it/s][A
Epoch 2/5:  69%|██████▊   | 1516/2208 [09:00<04:12,  2.74it/s][A
Epoch 2/5

Batch 1525: Training accuracy = 0.8516, F1 = 0.8372, Precision = 0.8411, Recall = 0.8516



Epoch 2/5:  69%|██████▉   | 1527/2208 [09:04<04:03,  2.80it/s][A
Epoch 2/5:  69%|██████▉   | 1528/2208 [09:04<04:02,  2.80it/s][A
Epoch 2/5:  69%|██████▉   | 1529/2208 [09:05<03:58,  2.84it/s][A
Epoch 2/5:  69%|██████▉   | 1530/2208 [09:05<03:58,  2.85it/s][A
Epoch 2/5:  69%|██████▉   | 1531/2208 [09:05<03:56,  2.86it/s][A
Epoch 2/5:  69%|██████▉   | 1532/2208 [09:06<03:56,  2.86it/s][A
Epoch 2/5:  69%|██████▉   | 1533/2208 [09:06<03:58,  2.82it/s][A
Epoch 2/5:  69%|██████▉   | 1534/2208 [09:06<03:55,  2.86it/s][A
Epoch 2/5:  70%|██████▉   | 1535/2208 [09:07<04:01,  2.79it/s][A
Epoch 2/5:  70%|██████▉   | 1536/2208 [09:07<04:02,  2.78it/s][A
Epoch 2/5:  70%|██████▉   | 1537/2208 [09:08<03:57,  2.83it/s][A
Epoch 2/5:  70%|██████▉   | 1538/2208 [09:08<03:59,  2.80it/s][A
Epoch 2/5:  70%|██████▉   | 1539/2208 [09:08<04:01,  2.77it/s][A
Epoch 2/5:  70%|██████▉   | 1540/2208 [09:09<03:57,  2.82it/s][A
Epoch 2/5:  70%|██████▉   | 1541/2208 [09:09<03:55,  2.83it/s][A
Epoch 2/5

Batch 1550: Training accuracy = 0.8516, F1 = 0.8354, Precision = 0.8307, Recall = 0.8516



Epoch 2/5:  70%|███████   | 1552/2208 [09:13<03:53,  2.81it/s][A
Epoch 2/5:  70%|███████   | 1553/2208 [09:13<03:50,  2.84it/s][A
Epoch 2/5:  70%|███████   | 1554/2208 [09:14<03:48,  2.86it/s][A
Epoch 2/5:  70%|███████   | 1555/2208 [09:14<03:53,  2.79it/s][A
Epoch 2/5:  70%|███████   | 1556/2208 [09:14<03:49,  2.84it/s][A
Epoch 2/5:  71%|███████   | 1557/2208 [09:15<03:46,  2.87it/s][A
Epoch 2/5:  71%|███████   | 1558/2208 [09:15<03:46,  2.87it/s][A
Epoch 2/5:  71%|███████   | 1559/2208 [09:15<03:44,  2.88it/s][A
Epoch 2/5:  71%|███████   | 1560/2208 [09:16<03:42,  2.91it/s][A
Epoch 2/5:  71%|███████   | 1561/2208 [09:16<03:47,  2.85it/s][A
Epoch 2/5:  71%|███████   | 1562/2208 [09:16<03:45,  2.87it/s][A
Epoch 2/5:  71%|███████   | 1563/2208 [09:17<03:42,  2.89it/s][A
Epoch 2/5:  71%|███████   | 1564/2208 [09:17<03:41,  2.90it/s][A
Epoch 2/5:  71%|███████   | 1565/2208 [09:17<03:40,  2.91it/s][A
Epoch 2/5:  71%|███████   | 1566/2208 [09:18<03:39,  2.93it/s][A
Epoch 2/5

Batch 1575: Training accuracy = 0.8750, F1 = 0.8667, Precision = 0.8698, Recall = 0.8750



Epoch 2/5:  71%|███████▏  | 1577/2208 [09:22<03:53,  2.70it/s][A
Epoch 2/5:  71%|███████▏  | 1578/2208 [09:22<03:48,  2.75it/s][A
Epoch 2/5:  72%|███████▏  | 1579/2208 [09:22<03:48,  2.76it/s][A
Epoch 2/5:  72%|███████▏  | 1580/2208 [09:23<03:50,  2.73it/s][A
Epoch 2/5:  72%|███████▏  | 1581/2208 [09:23<03:46,  2.77it/s][A
Epoch 2/5:  72%|███████▏  | 1582/2208 [09:24<03:43,  2.81it/s][A
Epoch 2/5:  72%|███████▏  | 1583/2208 [09:24<03:39,  2.85it/s][A
Epoch 2/5:  72%|███████▏  | 1584/2208 [09:24<03:38,  2.85it/s][A
Epoch 2/5:  72%|███████▏  | 1585/2208 [09:25<03:38,  2.85it/s][A
Epoch 2/5:  72%|███████▏  | 1586/2208 [09:25<03:37,  2.86it/s][A
Epoch 2/5:  72%|███████▏  | 1587/2208 [09:25<03:36,  2.87it/s][A
Epoch 2/5:  72%|███████▏  | 1588/2208 [09:26<03:34,  2.90it/s][A
Epoch 2/5:  72%|███████▏  | 1589/2208 [09:26<03:40,  2.81it/s][A
Epoch 2/5:  72%|███████▏  | 1590/2208 [09:26<03:40,  2.81it/s][A
Epoch 2/5:  72%|███████▏  | 1591/2208 [09:27<03:37,  2.84it/s][A
Epoch 2/5

Batch 1600: Training accuracy = 0.8359, F1 = 0.8193, Precision = 0.8099, Recall = 0.8359



Epoch 2/5:  73%|███████▎  | 1602/2208 [09:31<03:37,  2.78it/s][A
Epoch 2/5:  73%|███████▎  | 1603/2208 [09:31<03:37,  2.78it/s][A
Epoch 2/5:  73%|███████▎  | 1604/2208 [09:31<03:34,  2.82it/s][A
Epoch 2/5:  73%|███████▎  | 1605/2208 [09:32<03:31,  2.85it/s][A
Epoch 2/5:  73%|███████▎  | 1606/2208 [09:32<03:29,  2.87it/s][A
Epoch 2/5:  73%|███████▎  | 1607/2208 [09:32<03:34,  2.81it/s][A
Epoch 2/5:  73%|███████▎  | 1608/2208 [09:33<03:33,  2.82it/s][A
Epoch 2/5:  73%|███████▎  | 1609/2208 [09:33<03:33,  2.80it/s][A
Epoch 2/5:  73%|███████▎  | 1610/2208 [09:33<03:31,  2.82it/s][A
Epoch 2/5:  73%|███████▎  | 1611/2208 [09:34<03:29,  2.86it/s][A
Epoch 2/5:  73%|███████▎  | 1612/2208 [09:34<03:28,  2.85it/s][A
Epoch 2/5:  73%|███████▎  | 1613/2208 [09:35<03:28,  2.85it/s][A
Epoch 2/5:  73%|███████▎  | 1614/2208 [09:35<03:27,  2.86it/s][A
Epoch 2/5:  73%|███████▎  | 1615/2208 [09:35<03:27,  2.86it/s][A
Epoch 2/5:  73%|███████▎  | 1616/2208 [09:36<03:29,  2.83it/s][A
Epoch 2/5

Batch 1625: Training accuracy = 0.8047, F1 = 0.7889, Precision = 0.8060, Recall = 0.8047



Epoch 2/5:  74%|███████▎  | 1627/2208 [09:40<03:25,  2.82it/s][A
Epoch 2/5:  74%|███████▎  | 1628/2208 [09:40<03:23,  2.85it/s][A
Epoch 2/5:  74%|███████▍  | 1629/2208 [09:40<03:27,  2.79it/s][A
Epoch 2/5:  74%|███████▍  | 1630/2208 [09:41<03:28,  2.77it/s][A
Epoch 2/5:  74%|███████▍  | 1631/2208 [09:41<03:24,  2.82it/s][A
Epoch 2/5:  74%|███████▍  | 1632/2208 [09:41<03:23,  2.83it/s][A
Epoch 2/5:  74%|███████▍  | 1633/2208 [09:42<03:22,  2.83it/s][A
Epoch 2/5:  74%|███████▍  | 1634/2208 [09:42<03:25,  2.79it/s][A
Epoch 2/5:  74%|███████▍  | 1635/2208 [09:42<03:30,  2.72it/s][A
Epoch 2/5:  74%|███████▍  | 1636/2208 [09:43<03:31,  2.71it/s][A
Epoch 2/5:  74%|███████▍  | 1637/2208 [09:43<03:28,  2.74it/s][A
Epoch 2/5:  74%|███████▍  | 1638/2208 [09:43<03:29,  2.72it/s][A
Epoch 2/5:  74%|███████▍  | 1639/2208 [09:44<03:30,  2.71it/s][A
Epoch 2/5:  74%|███████▍  | 1640/2208 [09:44<03:31,  2.69it/s][A
Epoch 2/5:  74%|███████▍  | 1641/2208 [09:45<03:28,  2.72it/s][A
Epoch 2/5

Batch 1650: Training accuracy = 0.8125, F1 = 0.8008, Precision = 0.8118, Recall = 0.8125



Epoch 2/5:  75%|███████▍  | 1652/2208 [09:49<03:22,  2.75it/s][A
Epoch 2/5:  75%|███████▍  | 1653/2208 [09:49<03:18,  2.79it/s][A
Epoch 2/5:  75%|███████▍  | 1654/2208 [09:49<03:19,  2.77it/s][A
Epoch 2/5:  75%|███████▍  | 1655/2208 [09:50<03:15,  2.82it/s][A
Epoch 2/5:  75%|███████▌  | 1656/2208 [09:50<03:19,  2.77it/s][A
Epoch 2/5:  75%|███████▌  | 1657/2208 [09:50<03:15,  2.82it/s][A
Epoch 2/5:  75%|███████▌  | 1658/2208 [09:51<03:12,  2.86it/s][A
Epoch 2/5:  75%|███████▌  | 1659/2208 [09:51<03:16,  2.80it/s][A
Epoch 2/5:  75%|███████▌  | 1660/2208 [09:51<03:17,  2.77it/s][A
Epoch 2/5:  75%|███████▌  | 1661/2208 [09:52<03:18,  2.76it/s][A
Epoch 2/5:  75%|███████▌  | 1662/2208 [09:52<03:23,  2.68it/s][A
Epoch 2/5:  75%|███████▌  | 1663/2208 [09:53<03:23,  2.68it/s][A
Epoch 2/5:  75%|███████▌  | 1664/2208 [09:53<03:17,  2.75it/s][A
Epoch 2/5:  75%|███████▌  | 1665/2208 [09:53<03:17,  2.75it/s][A
Epoch 2/5:  75%|███████▌  | 1666/2208 [09:54<03:13,  2.80it/s][A
Epoch 2/5

Batch 1675: Training accuracy = 0.8672, F1 = 0.8607, Precision = 0.8685, Recall = 0.8672



Epoch 2/5:  76%|███████▌  | 1677/2208 [09:58<03:12,  2.75it/s][A
Epoch 2/5:  76%|███████▌  | 1678/2208 [09:58<03:10,  2.78it/s][A
Epoch 2/5:  76%|███████▌  | 1679/2208 [09:58<03:11,  2.76it/s][A
Epoch 2/5:  76%|███████▌  | 1680/2208 [09:59<03:07,  2.82it/s][A
Epoch 2/5:  76%|███████▌  | 1681/2208 [09:59<03:05,  2.84it/s][A
Epoch 2/5:  76%|███████▌  | 1682/2208 [09:59<03:11,  2.74it/s][A
Epoch 2/5:  76%|███████▌  | 1683/2208 [10:00<03:12,  2.73it/s][A
Epoch 2/5:  76%|███████▋  | 1684/2208 [10:00<03:13,  2.71it/s][A
Epoch 2/5:  76%|███████▋  | 1685/2208 [10:00<03:08,  2.77it/s][A
Epoch 2/5:  76%|███████▋  | 1686/2208 [10:01<03:09,  2.76it/s][A
Epoch 2/5:  76%|███████▋  | 1687/2208 [10:01<03:08,  2.77it/s][A
Epoch 2/5:  76%|███████▋  | 1688/2208 [10:02<03:08,  2.76it/s][A
Epoch 2/5:  76%|███████▋  | 1689/2208 [10:02<03:07,  2.76it/s][A
Epoch 2/5:  77%|███████▋  | 1690/2208 [10:02<03:05,  2.80it/s][A
Epoch 2/5:  77%|███████▋  | 1691/2208 [10:03<03:03,  2.81it/s][A
Epoch 2/5

Batch 1700: Training accuracy = 0.8828, F1 = 0.8735, Precision = 0.8724, Recall = 0.8828



Epoch 2/5:  77%|███████▋  | 1702/2208 [10:07<03:00,  2.81it/s][A
Epoch 2/5:  77%|███████▋  | 1703/2208 [10:07<03:02,  2.77it/s][A
Epoch 2/5:  77%|███████▋  | 1704/2208 [10:07<03:03,  2.75it/s][A
Epoch 2/5:  77%|███████▋  | 1705/2208 [10:08<02:59,  2.80it/s][A
Epoch 2/5:  77%|███████▋  | 1706/2208 [10:08<03:02,  2.75it/s][A
Epoch 2/5:  77%|███████▋  | 1707/2208 [10:08<02:58,  2.81it/s][A
Epoch 2/5:  77%|███████▋  | 1708/2208 [10:09<02:58,  2.80it/s][A
Epoch 2/5:  77%|███████▋  | 1709/2208 [10:09<02:55,  2.84it/s][A
Epoch 2/5:  77%|███████▋  | 1710/2208 [10:10<02:59,  2.78it/s][A
Epoch 2/5:  77%|███████▋  | 1711/2208 [10:10<02:56,  2.81it/s][A
Epoch 2/5:  78%|███████▊  | 1712/2208 [10:10<02:56,  2.80it/s][A
Epoch 2/5:  78%|███████▊  | 1713/2208 [10:11<02:54,  2.84it/s][A
Epoch 2/5:  78%|███████▊  | 1714/2208 [10:11<02:55,  2.82it/s][A
Epoch 2/5:  78%|███████▊  | 1715/2208 [10:11<02:58,  2.77it/s][A
Epoch 2/5:  78%|███████▊  | 1716/2208 [10:12<02:56,  2.79it/s][A
Epoch 2/5

Batch 1725: Training accuracy = 0.8672, F1 = 0.8551, Precision = 0.8555, Recall = 0.8672



Epoch 2/5:  78%|███████▊  | 1727/2208 [10:16<02:49,  2.84it/s][A
Epoch 2/5:  78%|███████▊  | 1728/2208 [10:16<02:47,  2.86it/s][A
Epoch 2/5:  78%|███████▊  | 1729/2208 [10:16<02:46,  2.88it/s][A
Epoch 2/5:  78%|███████▊  | 1730/2208 [10:17<02:51,  2.79it/s][A
Epoch 2/5:  78%|███████▊  | 1731/2208 [10:17<02:48,  2.82it/s][A
Epoch 2/5:  78%|███████▊  | 1732/2208 [10:17<02:47,  2.85it/s][A
Epoch 2/5:  78%|███████▊  | 1733/2208 [10:18<02:48,  2.82it/s][A
Epoch 2/5:  79%|███████▊  | 1734/2208 [10:18<02:50,  2.79it/s][A
Epoch 2/5:  79%|███████▊  | 1735/2208 [10:18<02:49,  2.80it/s][A
Epoch 2/5:  79%|███████▊  | 1736/2208 [10:19<02:50,  2.76it/s][A
Epoch 2/5:  79%|███████▊  | 1737/2208 [10:19<02:48,  2.79it/s][A
Epoch 2/5:  79%|███████▊  | 1738/2208 [10:20<02:47,  2.81it/s][A
Epoch 2/5:  79%|███████▉  | 1739/2208 [10:20<02:48,  2.78it/s][A
Epoch 2/5:  79%|███████▉  | 1740/2208 [10:20<02:47,  2.79it/s][A
Epoch 2/5:  79%|███████▉  | 1741/2208 [10:21<02:46,  2.80it/s][A
Epoch 2/5

Batch 1750: Training accuracy = 0.8750, F1 = 0.8693, Precision = 0.8737, Recall = 0.8750



Epoch 2/5:  79%|███████▉  | 1752/2208 [10:25<02:41,  2.82it/s][A
Epoch 2/5:  79%|███████▉  | 1753/2208 [10:25<02:40,  2.84it/s][A
Epoch 2/5:  79%|███████▉  | 1754/2208 [10:25<02:42,  2.80it/s][A
Epoch 2/5:  79%|███████▉  | 1755/2208 [10:26<02:39,  2.84it/s][A
Epoch 2/5:  80%|███████▉  | 1756/2208 [10:26<02:44,  2.75it/s][A
Epoch 2/5:  80%|███████▉  | 1757/2208 [10:26<02:40,  2.80it/s][A
Epoch 2/5:  80%|███████▉  | 1758/2208 [10:27<02:38,  2.83it/s][A
Epoch 2/5:  80%|███████▉  | 1759/2208 [10:27<02:37,  2.86it/s][A
Epoch 2/5:  80%|███████▉  | 1760/2208 [10:27<02:35,  2.88it/s][A
Epoch 2/5:  80%|███████▉  | 1761/2208 [10:28<02:33,  2.90it/s][A
Epoch 2/5:  80%|███████▉  | 1762/2208 [10:28<02:33,  2.90it/s][A
Epoch 2/5:  80%|███████▉  | 1763/2208 [10:28<02:32,  2.91it/s][A
Epoch 2/5:  80%|███████▉  | 1764/2208 [10:29<02:31,  2.92it/s][A
Epoch 2/5:  80%|███████▉  | 1765/2208 [10:29<02:31,  2.93it/s][A
Epoch 2/5:  80%|███████▉  | 1766/2208 [10:29<02:34,  2.85it/s][A
Epoch 2/5

Batch 1775: Training accuracy = 0.8438, F1 = 0.8451, Precision = 0.8698, Recall = 0.8438



Epoch 2/5:  80%|████████  | 1777/2208 [10:33<02:39,  2.70it/s][A
Epoch 2/5:  81%|████████  | 1778/2208 [10:34<02:39,  2.70it/s][A
Epoch 2/5:  81%|████████  | 1779/2208 [10:34<02:37,  2.73it/s][A
Epoch 2/5:  81%|████████  | 1780/2208 [10:34<02:33,  2.78it/s][A
Epoch 2/5:  81%|████████  | 1781/2208 [10:35<02:34,  2.76it/s][A
Epoch 2/5:  81%|████████  | 1782/2208 [10:35<02:38,  2.68it/s][A
Epoch 2/5:  81%|████████  | 1783/2208 [10:36<02:37,  2.69it/s][A
Epoch 2/5:  81%|████████  | 1784/2208 [10:36<02:37,  2.69it/s][A
Epoch 2/5:  81%|████████  | 1785/2208 [10:36<02:34,  2.74it/s][A
Epoch 2/5:  81%|████████  | 1786/2208 [10:37<02:37,  2.67it/s][A
Epoch 2/5:  81%|████████  | 1787/2208 [10:37<02:37,  2.68it/s][A
Epoch 2/5:  81%|████████  | 1788/2208 [10:37<02:35,  2.69it/s][A
Epoch 2/5:  81%|████████  | 1789/2208 [10:38<02:35,  2.70it/s][A
Epoch 2/5:  81%|████████  | 1790/2208 [10:38<02:37,  2.65it/s][A
Epoch 2/5:  81%|████████  | 1791/2208 [10:39<02:36,  2.66it/s][A
Epoch 2/5

Batch 1800: Training accuracy = 0.8906, F1 = 0.8924, Precision = 0.9167, Recall = 0.8906



Epoch 2/5:  82%|████████▏ | 1802/2208 [10:42<02:26,  2.77it/s][A
Epoch 2/5:  82%|████████▏ | 1803/2208 [10:43<02:26,  2.76it/s][A
Epoch 2/5:  82%|████████▏ | 1804/2208 [10:43<02:27,  2.74it/s][A
Epoch 2/5:  82%|████████▏ | 1805/2208 [10:44<02:24,  2.80it/s][A
Epoch 2/5:  82%|████████▏ | 1806/2208 [10:44<02:21,  2.85it/s][A
Epoch 2/5:  82%|████████▏ | 1807/2208 [10:44<02:20,  2.86it/s][A
Epoch 2/5:  82%|████████▏ | 1808/2208 [10:45<02:24,  2.77it/s][A
Epoch 2/5:  82%|████████▏ | 1809/2208 [10:45<02:21,  2.83it/s][A
Epoch 2/5:  82%|████████▏ | 1810/2208 [10:45<02:20,  2.84it/s][A
Epoch 2/5:  82%|████████▏ | 1811/2208 [10:46<02:19,  2.85it/s][A
Epoch 2/5:  82%|████████▏ | 1812/2208 [10:46<02:18,  2.86it/s][A
Epoch 2/5:  82%|████████▏ | 1813/2208 [10:46<02:19,  2.82it/s][A
Epoch 2/5:  82%|████████▏ | 1814/2208 [10:47<02:17,  2.86it/s][A
Epoch 2/5:  82%|████████▏ | 1815/2208 [10:47<02:20,  2.80it/s][A
Epoch 2/5:  82%|████████▏ | 1816/2208 [10:47<02:22,  2.75it/s][A
Epoch 2/5

Batch 1825: Training accuracy = 0.8906, F1 = 0.8841, Precision = 0.8854, Recall = 0.8906



Epoch 2/5:  83%|████████▎ | 1827/2208 [10:52<02:17,  2.77it/s][A
Epoch 2/5:  83%|████████▎ | 1828/2208 [10:52<02:16,  2.79it/s][A
Epoch 2/5:  83%|████████▎ | 1829/2208 [10:52<02:17,  2.76it/s][A
Epoch 2/5:  83%|████████▎ | 1830/2208 [10:53<02:14,  2.82it/s][A
Epoch 2/5:  83%|████████▎ | 1831/2208 [10:53<02:16,  2.75it/s][A
Epoch 2/5:  83%|████████▎ | 1832/2208 [10:53<02:14,  2.80it/s][A
Epoch 2/5:  83%|████████▎ | 1833/2208 [10:54<02:12,  2.83it/s][A
Epoch 2/5:  83%|████████▎ | 1834/2208 [10:54<02:11,  2.84it/s][A
Epoch 2/5:  83%|████████▎ | 1835/2208 [10:54<02:12,  2.81it/s][A
Epoch 2/5:  83%|████████▎ | 1836/2208 [10:55<02:10,  2.85it/s][A
Epoch 2/5:  83%|████████▎ | 1837/2208 [10:55<02:12,  2.80it/s][A
Epoch 2/5:  83%|████████▎ | 1838/2208 [10:55<02:10,  2.83it/s][A
Epoch 2/5:  83%|████████▎ | 1839/2208 [10:56<02:09,  2.86it/s][A
Epoch 2/5:  83%|████████▎ | 1840/2208 [10:56<02:07,  2.88it/s][A
Epoch 2/5:  83%|████████▎ | 1841/2208 [10:56<02:09,  2.82it/s][A
Epoch 2/5

Batch 1850: Training accuracy = 0.8516, F1 = 0.8250, Precision = 0.8128, Recall = 0.8516



Epoch 2/5:  84%|████████▍ | 1852/2208 [11:00<02:05,  2.83it/s][A
Epoch 2/5:  84%|████████▍ | 1853/2208 [11:01<02:07,  2.80it/s][A
Epoch 2/5:  84%|████████▍ | 1854/2208 [11:01<02:08,  2.75it/s][A
Epoch 2/5:  84%|████████▍ | 1855/2208 [11:01<02:07,  2.77it/s][A
Epoch 2/5:  84%|████████▍ | 1856/2208 [11:02<02:07,  2.77it/s][A
Epoch 2/5:  84%|████████▍ | 1857/2208 [11:02<02:06,  2.78it/s][A
Epoch 2/5:  84%|████████▍ | 1858/2208 [11:03<02:06,  2.76it/s][A
Epoch 2/5:  84%|████████▍ | 1859/2208 [11:03<02:05,  2.79it/s][A
Epoch 2/5:  84%|████████▍ | 1860/2208 [11:03<02:06,  2.76it/s][A
Epoch 2/5:  84%|████████▍ | 1861/2208 [11:04<02:07,  2.73it/s][A
Epoch 2/5:  84%|████████▍ | 1862/2208 [11:04<02:06,  2.74it/s][A
Epoch 2/5:  84%|████████▍ | 1863/2208 [11:04<02:03,  2.80it/s][A
Epoch 2/5:  84%|████████▍ | 1864/2208 [11:05<02:05,  2.74it/s][A
Epoch 2/5:  84%|████████▍ | 1865/2208 [11:05<02:03,  2.77it/s][A
Epoch 2/5:  85%|████████▍ | 1866/2208 [11:05<02:04,  2.76it/s][A
Epoch 2/5

Batch 1875: Training accuracy = 0.8203, F1 = 0.8060, Precision = 0.8014, Recall = 0.8203



Epoch 2/5:  85%|████████▌ | 1877/2208 [11:09<02:01,  2.73it/s][A
Epoch 2/5:  85%|████████▌ | 1878/2208 [11:10<01:58,  2.78it/s][A
Epoch 2/5:  85%|████████▌ | 1879/2208 [11:10<01:59,  2.76it/s][A
Epoch 2/5:  85%|████████▌ | 1880/2208 [11:10<01:59,  2.74it/s][A
Epoch 2/5:  85%|████████▌ | 1881/2208 [11:11<01:57,  2.79it/s][A
Epoch 2/5:  85%|████████▌ | 1882/2208 [11:11<01:57,  2.77it/s][A
Epoch 2/5:  85%|████████▌ | 1883/2208 [11:12<01:56,  2.80it/s][A
Epoch 2/5:  85%|████████▌ | 1884/2208 [11:12<01:55,  2.80it/s][A
Epoch 2/5:  85%|████████▌ | 1885/2208 [11:12<01:55,  2.80it/s][A
Epoch 2/5:  85%|████████▌ | 1886/2208 [11:13<01:56,  2.76it/s][A
Epoch 2/5:  85%|████████▌ | 1887/2208 [11:13<01:55,  2.78it/s][A
Epoch 2/5:  86%|████████▌ | 1888/2208 [11:13<01:54,  2.80it/s][A
Epoch 2/5:  86%|████████▌ | 1889/2208 [11:14<01:55,  2.76it/s][A
Epoch 2/5:  86%|████████▌ | 1890/2208 [11:14<01:55,  2.75it/s][A
Epoch 2/5:  86%|████████▌ | 1891/2208 [11:15<01:59,  2.66it/s][A
Epoch 2/5

Batch 1900: Training accuracy = 0.9062, F1 = 0.8839, Precision = 0.8750, Recall = 0.9062



Epoch 2/5:  86%|████████▌ | 1902/2208 [11:18<01:50,  2.78it/s][A
Epoch 2/5:  86%|████████▌ | 1903/2208 [11:19<01:54,  2.66it/s][A
Epoch 2/5:  86%|████████▌ | 1904/2208 [11:19<01:53,  2.67it/s][A
Epoch 2/5:  86%|████████▋ | 1905/2208 [11:20<01:50,  2.75it/s][A
Epoch 2/5:  86%|████████▋ | 1906/2208 [11:20<01:49,  2.77it/s][A
Epoch 2/5:  86%|████████▋ | 1907/2208 [11:20<01:48,  2.78it/s][A
Epoch 2/5:  86%|████████▋ | 1908/2208 [11:21<01:45,  2.83it/s][A
Epoch 2/5:  86%|████████▋ | 1909/2208 [11:21<01:46,  2.81it/s][A
Epoch 2/5:  87%|████████▋ | 1910/2208 [11:21<01:47,  2.77it/s][A
Epoch 2/5:  87%|████████▋ | 1911/2208 [11:22<01:47,  2.75it/s][A
Epoch 2/5:  87%|████████▋ | 1912/2208 [11:22<01:48,  2.73it/s][A
Epoch 2/5:  87%|████████▋ | 1913/2208 [11:22<01:45,  2.79it/s][A
Epoch 2/5:  87%|████████▋ | 1914/2208 [11:23<01:44,  2.81it/s][A
Epoch 2/5:  87%|████████▋ | 1915/2208 [11:23<01:43,  2.83it/s][A
Epoch 2/5:  87%|████████▋ | 1916/2208 [11:23<01:42,  2.84it/s][A
Epoch 2/5

Batch 1925: Training accuracy = 0.8594, F1 = 0.8370, Precision = 0.8346, Recall = 0.8594



Epoch 2/5:  87%|████████▋ | 1927/2208 [11:27<01:40,  2.81it/s][A
Epoch 2/5:  87%|████████▋ | 1928/2208 [11:28<01:38,  2.85it/s][A
Epoch 2/5:  87%|████████▋ | 1929/2208 [11:28<01:39,  2.81it/s][A
Epoch 2/5:  87%|████████▋ | 1930/2208 [11:28<01:38,  2.81it/s][A
Epoch 2/5:  87%|████████▋ | 1931/2208 [11:29<01:39,  2.78it/s][A
Epoch 2/5:  88%|████████▊ | 1932/2208 [11:29<01:41,  2.73it/s][A
Epoch 2/5:  88%|████████▊ | 1933/2208 [11:29<01:39,  2.77it/s][A
Epoch 2/5:  88%|████████▊ | 1934/2208 [11:30<01:37,  2.82it/s][A
Epoch 2/5:  88%|████████▊ | 1935/2208 [11:30<01:38,  2.76it/s][A
Epoch 2/5:  88%|████████▊ | 1936/2208 [11:30<01:36,  2.81it/s][A
Epoch 2/5:  88%|████████▊ | 1937/2208 [11:31<01:35,  2.84it/s][A
Epoch 2/5:  88%|████████▊ | 1938/2208 [11:31<01:34,  2.87it/s][A
Epoch 2/5:  88%|████████▊ | 1939/2208 [11:32<01:34,  2.84it/s][A
Epoch 2/5:  88%|████████▊ | 1940/2208 [11:32<01:35,  2.80it/s][A
Epoch 2/5:  88%|████████▊ | 1941/2208 [11:32<01:38,  2.72it/s][A
Epoch 2/5

Batch 1950: Training accuracy = 0.8125, F1 = 0.7905, Precision = 0.7922, Recall = 0.8125



Epoch 2/5:  88%|████████▊ | 1952/2208 [11:36<01:33,  2.74it/s][A
Epoch 2/5:  88%|████████▊ | 1953/2208 [11:37<01:32,  2.75it/s][A
Epoch 2/5:  88%|████████▊ | 1954/2208 [11:37<01:30,  2.80it/s][A
Epoch 2/5:  89%|████████▊ | 1955/2208 [11:37<01:28,  2.85it/s][A
Epoch 2/5:  89%|████████▊ | 1956/2208 [11:38<01:27,  2.88it/s][A
Epoch 2/5:  89%|████████▊ | 1957/2208 [11:38<01:29,  2.79it/s][A
Epoch 2/5:  89%|████████▊ | 1958/2208 [11:38<01:28,  2.83it/s][A
Epoch 2/5:  89%|████████▊ | 1959/2208 [11:39<01:27,  2.86it/s][A
Epoch 2/5:  89%|████████▉ | 1960/2208 [11:39<01:27,  2.83it/s][A
Epoch 2/5:  89%|████████▉ | 1961/2208 [11:39<01:27,  2.83it/s][A
Epoch 2/5:  89%|████████▉ | 1962/2208 [11:40<01:28,  2.79it/s][A
Epoch 2/5:  89%|████████▉ | 1963/2208 [11:40<01:26,  2.83it/s][A
Epoch 2/5:  89%|████████▉ | 1964/2208 [11:41<01:26,  2.81it/s][A
Epoch 2/5:  89%|████████▉ | 1965/2208 [11:41<01:25,  2.83it/s][A
Epoch 2/5:  89%|████████▉ | 1966/2208 [11:41<01:27,  2.76it/s][A
Epoch 2/5

Batch 1975: Training accuracy = 0.8516, F1 = 0.8341, Precision = 0.8294, Recall = 0.8516



Epoch 2/5:  90%|████████▉ | 1977/2208 [11:45<01:25,  2.70it/s][A
Epoch 2/5:  90%|████████▉ | 1978/2208 [11:46<01:22,  2.78it/s][A
Epoch 2/5:  90%|████████▉ | 1979/2208 [11:46<01:21,  2.81it/s][A
Epoch 2/5:  90%|████████▉ | 1980/2208 [11:46<01:23,  2.74it/s][A
Epoch 2/5:  90%|████████▉ | 1981/2208 [11:47<01:23,  2.73it/s][A
Epoch 2/5:  90%|████████▉ | 1982/2208 [11:47<01:22,  2.73it/s][A
Epoch 2/5:  90%|████████▉ | 1983/2208 [11:47<01:22,  2.73it/s][A
Epoch 2/5:  90%|████████▉ | 1984/2208 [11:48<01:22,  2.72it/s][A
Epoch 2/5:  90%|████████▉ | 1985/2208 [11:48<01:22,  2.71it/s][A
Epoch 2/5:  90%|████████▉ | 1986/2208 [11:48<01:20,  2.75it/s][A
Epoch 2/5:  90%|████████▉ | 1987/2208 [11:49<01:22,  2.68it/s][A
Epoch 2/5:  90%|█████████ | 1988/2208 [11:49<01:22,  2.66it/s][A
Epoch 2/5:  90%|█████████ | 1989/2208 [11:50<01:21,  2.67it/s][A
Epoch 2/5:  90%|█████████ | 1990/2208 [11:50<01:20,  2.70it/s][A
Epoch 2/5:  90%|█████████ | 1991/2208 [11:50<01:18,  2.76it/s][A
Epoch 2/5

Batch 2000: Training accuracy = 0.8359, F1 = 0.8276, Precision = 0.8385, Recall = 0.8359



Epoch 2/5:  91%|█████████ | 2002/2208 [11:54<01:14,  2.75it/s][A
Epoch 2/5:  91%|█████████ | 2003/2208 [11:55<01:13,  2.81it/s][A
Epoch 2/5:  91%|█████████ | 2004/2208 [11:55<01:13,  2.76it/s][A
Epoch 2/5:  91%|█████████ | 2005/2208 [11:55<01:12,  2.79it/s][A
Epoch 2/5:  91%|█████████ | 2006/2208 [11:56<01:11,  2.83it/s][A
Epoch 2/5:  91%|█████████ | 2007/2208 [11:56<01:13,  2.75it/s][A
Epoch 2/5:  91%|█████████ | 2008/2208 [11:56<01:11,  2.80it/s][A
Epoch 2/5:  91%|█████████ | 2009/2208 [11:57<01:12,  2.76it/s][A
Epoch 2/5:  91%|█████████ | 2010/2208 [11:57<01:11,  2.77it/s][A
Epoch 2/5:  91%|█████████ | 2011/2208 [11:58<01:10,  2.80it/s][A
Epoch 2/5:  91%|█████████ | 2012/2208 [11:58<01:11,  2.74it/s][A
Epoch 2/5:  91%|█████████ | 2013/2208 [11:58<01:10,  2.75it/s][A
Epoch 2/5:  91%|█████████ | 2014/2208 [11:59<01:10,  2.75it/s][A
Epoch 2/5:  91%|█████████▏| 2015/2208 [11:59<01:08,  2.80it/s][A
Epoch 2/5:  91%|█████████▏| 2016/2208 [11:59<01:07,  2.85it/s][A
Epoch 2/5

Batch 2025: Training accuracy = 0.8594, F1 = 0.8549, Precision = 0.8815, Recall = 0.8594



Epoch 2/5:  92%|█████████▏| 2027/2208 [12:03<01:05,  2.77it/s][A
Epoch 2/5:  92%|█████████▏| 2028/2208 [12:04<01:05,  2.75it/s][A
Epoch 2/5:  92%|█████████▏| 2029/2208 [12:04<01:06,  2.71it/s][A
Epoch 2/5:  92%|█████████▏| 2030/2208 [12:04<01:04,  2.77it/s][A
Epoch 2/5:  92%|█████████▏| 2031/2208 [12:05<01:03,  2.77it/s][A
Epoch 2/5:  92%|█████████▏| 2032/2208 [12:05<01:04,  2.73it/s][A
Epoch 2/5:  92%|█████████▏| 2033/2208 [12:05<01:04,  2.70it/s][A
Epoch 2/5:  92%|█████████▏| 2034/2208 [12:06<01:05,  2.67it/s][A
Epoch 2/5:  92%|█████████▏| 2035/2208 [12:06<01:03,  2.73it/s][A
Epoch 2/5:  92%|█████████▏| 2036/2208 [12:07<01:01,  2.79it/s][A
Epoch 2/5:  92%|█████████▏| 2037/2208 [12:07<01:01,  2.76it/s][A
Epoch 2/5:  92%|█████████▏| 2038/2208 [12:07<01:01,  2.75it/s][A
Epoch 2/5:  92%|█████████▏| 2039/2208 [12:08<01:00,  2.80it/s][A
Epoch 2/5:  92%|█████████▏| 2040/2208 [12:08<01:00,  2.78it/s][A
Epoch 2/5:  92%|█████████▏| 2041/2208 [12:08<00:59,  2.79it/s][A
Epoch 2/5

Batch 2050: Training accuracy = 0.8516, F1 = 0.8380, Precision = 0.8477, Recall = 0.8516



Epoch 2/5:  93%|█████████▎| 2052/2208 [12:12<00:56,  2.75it/s][A
Epoch 2/5:  93%|█████████▎| 2053/2208 [12:13<00:56,  2.74it/s][A
Epoch 2/5:  93%|█████████▎| 2054/2208 [12:13<00:56,  2.71it/s][A
Epoch 2/5:  93%|█████████▎| 2055/2208 [12:13<00:55,  2.77it/s][A
Epoch 2/5:  93%|█████████▎| 2056/2208 [12:14<00:56,  2.70it/s][A
Epoch 2/5:  93%|█████████▎| 2057/2208 [12:14<00:56,  2.70it/s][A
Epoch 2/5:  93%|█████████▎| 2058/2208 [12:14<00:55,  2.72it/s][A
Epoch 2/5:  93%|█████████▎| 2059/2208 [12:15<00:53,  2.77it/s][A
Epoch 2/5:  93%|█████████▎| 2060/2208 [12:15<00:53,  2.76it/s][A
Epoch 2/5:  93%|█████████▎| 2061/2208 [12:16<00:52,  2.80it/s][A
Epoch 2/5:  93%|█████████▎| 2062/2208 [12:16<00:51,  2.82it/s][A
Epoch 2/5:  93%|█████████▎| 2063/2208 [12:16<00:51,  2.80it/s][A
Epoch 2/5:  93%|█████████▎| 2064/2208 [12:17<00:52,  2.76it/s][A
Epoch 2/5:  94%|█████████▎| 2065/2208 [12:17<00:51,  2.80it/s][A
Epoch 2/5:  94%|█████████▎| 2066/2208 [12:17<00:52,  2.70it/s][A
Epoch 2/5

Batch 2075: Training accuracy = 0.8516, F1 = 0.8484, Precision = 0.8620, Recall = 0.8516



Epoch 2/5:  94%|█████████▍| 2077/2208 [12:21<00:47,  2.76it/s][A
Epoch 2/5:  94%|█████████▍| 2078/2208 [12:22<00:46,  2.81it/s][A
Epoch 2/5:  94%|█████████▍| 2079/2208 [12:22<00:45,  2.83it/s][A
Epoch 2/5:  94%|█████████▍| 2080/2208 [12:22<00:45,  2.81it/s][A
Epoch 2/5:  94%|█████████▍| 2081/2208 [12:23<00:44,  2.85it/s][A
Epoch 2/5:  94%|█████████▍| 2082/2208 [12:23<00:44,  2.84it/s][A
Epoch 2/5:  94%|█████████▍| 2083/2208 [12:23<00:43,  2.86it/s][A
Epoch 2/5:  94%|█████████▍| 2084/2208 [12:24<00:43,  2.86it/s][A
Epoch 2/5:  94%|█████████▍| 2085/2208 [12:24<00:43,  2.86it/s][A
Epoch 2/5:  94%|█████████▍| 2086/2208 [12:24<00:43,  2.81it/s][A
Epoch 2/5:  95%|█████████▍| 2087/2208 [12:25<00:42,  2.82it/s][A
Epoch 2/5:  95%|█████████▍| 2088/2208 [12:25<00:43,  2.76it/s][A
Epoch 2/5:  95%|█████████▍| 2089/2208 [12:26<00:43,  2.74it/s][A
Epoch 2/5:  95%|█████████▍| 2090/2208 [12:26<00:43,  2.74it/s][A
Epoch 2/5:  95%|█████████▍| 2091/2208 [12:26<00:42,  2.72it/s][A
Epoch 2/5

Batch 2100: Training accuracy = 0.8750, F1 = 0.8698, Precision = 0.8844, Recall = 0.8750



Epoch 2/5:  95%|█████████▌| 2102/2208 [12:30<00:37,  2.81it/s][A
Epoch 2/5:  95%|█████████▌| 2103/2208 [12:31<00:37,  2.84it/s][A
Epoch 2/5:  95%|█████████▌| 2104/2208 [12:31<00:36,  2.86it/s][A
Epoch 2/5:  95%|█████████▌| 2105/2208 [12:31<00:37,  2.72it/s][A
Epoch 2/5:  95%|█████████▌| 2106/2208 [12:32<00:36,  2.77it/s][A
Epoch 2/5:  95%|█████████▌| 2107/2208 [12:32<00:37,  2.70it/s][A
Epoch 2/5:  95%|█████████▌| 2108/2208 [12:32<00:37,  2.69it/s][A
Epoch 2/5:  96%|█████████▌| 2109/2208 [12:33<00:36,  2.74it/s][A
Epoch 2/5:  96%|█████████▌| 2110/2208 [12:33<00:36,  2.72it/s][A
Epoch 2/5:  96%|█████████▌| 2111/2208 [12:33<00:35,  2.70it/s][A
Epoch 2/5:  96%|█████████▌| 2112/2208 [12:34<00:34,  2.75it/s][A
Epoch 2/5:  96%|█████████▌| 2113/2208 [12:34<00:34,  2.73it/s][A
Epoch 2/5:  96%|█████████▌| 2114/2208 [12:35<00:34,  2.73it/s][A
Epoch 2/5:  96%|█████████▌| 2115/2208 [12:35<00:34,  2.69it/s][A
Epoch 2/5:  96%|█████████▌| 2116/2208 [12:35<00:33,  2.72it/s][A
Epoch 2/5

Batch 2125: Training accuracy = 0.8594, F1 = 0.8448, Precision = 0.8411, Recall = 0.8594



Epoch 2/5:  96%|█████████▋| 2127/2208 [12:39<00:28,  2.86it/s][A
Epoch 2/5:  96%|█████████▋| 2128/2208 [12:39<00:27,  2.87it/s][A
Epoch 2/5:  96%|█████████▋| 2129/2208 [12:40<00:27,  2.87it/s][A
Epoch 2/5:  96%|█████████▋| 2130/2208 [12:40<00:27,  2.81it/s][A
Epoch 2/5:  97%|█████████▋| 2131/2208 [12:41<00:27,  2.85it/s][A
Epoch 2/5:  97%|█████████▋| 2132/2208 [12:41<00:26,  2.88it/s][A
Epoch 2/5:  97%|█████████▋| 2133/2208 [12:41<00:26,  2.88it/s][A
Epoch 2/5:  97%|█████████▋| 2134/2208 [12:42<00:26,  2.82it/s][A
Epoch 2/5:  97%|█████████▋| 2135/2208 [12:42<00:25,  2.85it/s][A
Epoch 2/5:  97%|█████████▋| 2136/2208 [12:42<00:25,  2.85it/s][A
Epoch 2/5:  97%|█████████▋| 2137/2208 [12:43<00:24,  2.85it/s][A
Epoch 2/5:  97%|█████████▋| 2138/2208 [12:43<00:25,  2.73it/s][A
Epoch 2/5:  97%|█████████▋| 2139/2208 [12:43<00:24,  2.78it/s][A
Epoch 2/5:  97%|█████████▋| 2140/2208 [12:44<00:24,  2.80it/s][A
Epoch 2/5:  97%|█████████▋| 2141/2208 [12:44<00:23,  2.81it/s][A
Epoch 2/5

Batch 2150: Training accuracy = 0.8828, F1 = 0.8766, Precision = 0.8802, Recall = 0.8828



Epoch 2/5:  97%|█████████▋| 2152/2208 [12:48<00:20,  2.77it/s][A
Epoch 2/5:  98%|█████████▊| 2153/2208 [12:49<00:20,  2.67it/s][A
Epoch 2/5:  98%|█████████▊| 2154/2208 [12:49<00:19,  2.75it/s][A
Epoch 2/5:  98%|█████████▊| 2155/2208 [12:49<00:18,  2.80it/s][A
Epoch 2/5:  98%|█████████▊| 2156/2208 [12:50<00:18,  2.78it/s][A
Epoch 2/5:  98%|█████████▊| 2157/2208 [12:50<00:18,  2.82it/s][A
Epoch 2/5:  98%|█████████▊| 2158/2208 [12:50<00:17,  2.79it/s][A
Epoch 2/5:  98%|█████████▊| 2159/2208 [12:51<00:17,  2.76it/s][A
Epoch 2/5:  98%|█████████▊| 2160/2208 [12:51<00:17,  2.80it/s][A
Epoch 2/5:  98%|█████████▊| 2161/2208 [12:51<00:16,  2.84it/s][A
Epoch 2/5:  98%|█████████▊| 2162/2208 [12:52<00:16,  2.83it/s][A
Epoch 2/5:  98%|█████████▊| 2163/2208 [12:52<00:15,  2.84it/s][A
Epoch 2/5:  98%|█████████▊| 2164/2208 [12:52<00:15,  2.86it/s][A
Epoch 2/5:  98%|█████████▊| 2165/2208 [12:53<00:14,  2.88it/s][A
Epoch 2/5:  98%|█████████▊| 2166/2208 [12:53<00:14,  2.90it/s][A
Epoch 2/5

Batch 2175: Training accuracy = 0.8750, F1 = 0.8742, Precision = 0.8932, Recall = 0.8750



Epoch 2/5:  99%|█████████▊| 2177/2208 [12:57<00:10,  2.84it/s][A
Epoch 2/5:  99%|█████████▊| 2178/2208 [12:57<00:10,  2.86it/s][A
Epoch 2/5:  99%|█████████▊| 2179/2208 [12:58<00:10,  2.89it/s][A
Epoch 2/5:  99%|█████████▊| 2180/2208 [12:58<00:09,  2.84it/s][A
Epoch 2/5:  99%|█████████▉| 2181/2208 [12:58<00:09,  2.77it/s][A
Epoch 2/5:  99%|█████████▉| 2182/2208 [12:59<00:09,  2.74it/s][A
Epoch 2/5:  99%|█████████▉| 2183/2208 [12:59<00:09,  2.66it/s][A
Epoch 2/5:  99%|█████████▉| 2184/2208 [13:00<00:08,  2.73it/s][A
Epoch 2/5:  99%|█████████▉| 2185/2208 [13:00<00:08,  2.77it/s][A
Epoch 2/5:  99%|█████████▉| 2186/2208 [13:00<00:08,  2.75it/s][A
Epoch 2/5:  99%|█████████▉| 2187/2208 [13:01<00:07,  2.79it/s][A
Epoch 2/5:  99%|█████████▉| 2188/2208 [13:01<00:07,  2.81it/s][A
Epoch 2/5:  99%|█████████▉| 2189/2208 [13:01<00:06,  2.83it/s][A
Epoch 2/5:  99%|█████████▉| 2190/2208 [13:02<00:06,  2.80it/s][A
Epoch 2/5:  99%|█████████▉| 2191/2208 [13:02<00:06,  2.76it/s][A
Epoch 2/5

Batch 2200: Training accuracy = 0.8359, F1 = 0.8352, Precision = 0.8542, Recall = 0.8359



Epoch 2/5: 100%|█████████▉| 2202/2208 [13:06<00:02,  2.85it/s][A
Epoch 2/5: 100%|█████████▉| 2203/2208 [13:06<00:01,  2.87it/s][A
Epoch 2/5: 100%|█████████▉| 2204/2208 [13:07<00:01,  2.88it/s][A
Epoch 2/5: 100%|█████████▉| 2205/2208 [13:07<00:01,  2.88it/s][A
Epoch 2/5: 100%|█████████▉| 2206/2208 [13:07<00:00,  2.88it/s][A
Epoch 2/5: 100%|█████████▉| 2207/2208 [13:08<00:00,  2.90it/s][A
Epoch 2/5: 100%|██████████| 2208/2208 [13:08<00:00,  2.91it/s][A
                                                              [A


Epoch 2 training accuracy: 0.84%
Epoch 2 training F1 score: 0.8502
Epoch 2 training precision: 0.8591
Epoch 2 training recall: 0.8448

Starting validation...



Validation:   0%|          | 0/552 [00:00<?, ?it/s][A
Validation:   0%|          | 1/552 [00:01<15:49,  1.72s/it][A
Validation:   1%|          | 3/552 [00:01<04:26,  2.06it/s][A
Validation:   1%|          | 6/552 [00:02<02:04,  4.40it/s][A
Validation:   1%|▏         | 8/552 [00:02<01:29,  6.06it/s][A
Validation:   2%|▏         | 10/552 [00:02<01:15,  7.14it/s][A
Validation:   2%|▏         | 12/552 [00:02<01:00,  8.99it/s][A
Validation:   3%|▎         | 14/552 [00:02<00:58,  9.22it/s][A
Validation:   3%|▎         | 17/552 [00:02<00:50, 10.66it/s][A
Validation:   3%|▎         | 19/552 [00:03<00:50, 10.59it/s][A
Validation:   4%|▍         | 21/552 [00:03<00:46, 11.34it/s][A
Validation:   4%|▍         | 23/552 [00:03<00:47, 11.10it/s][A
Validation:   5%|▍         | 26/552 [00:03<00:40, 13.01it/s][A
Validation:   5%|▌         | 29/552 [00:03<00:36, 14.46it/s][A
Validation:   6%|▌         | 31/552 [00:04<00:48, 10.66it/s][A
Validation:   6%|▌         | 33/552 [00:04<00:43, 12

Validation accuracy: 0.68%
Validation F1 score: 0.7021
Validation precision: 0.8222
Validation recall: 0.6823

Starting epoch 3/5



  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))

Epoch 3/5:   0%|          | 1/2208 [00:02<1:15:48,  2.06s/it][A

Batch 0: Training accuracy = 0.8672, F1 = 0.8607, Precision = 0.8620, Recall = 0.8672



Epoch 3/5:   0%|          | 2/2208 [00:02<38:27,  1.05s/it]  [A
Epoch 3/5:   0%|          | 3/2208 [00:02<26:35,  1.38it/s][A
Epoch 3/5:   0%|          | 4/2208 [00:03<21:30,  1.71it/s][A
Epoch 3/5:   0%|          | 5/2208 [00:03<18:30,  1.98it/s][A
Epoch 3/5:   0%|          | 6/2208 [00:03<16:31,  2.22it/s][A
Epoch 3/5:   0%|          | 7/2208 [00:04<15:21,  2.39it/s][A
Epoch 3/5:   0%|          | 8/2208 [00:04<14:24,  2.55it/s][A
Epoch 3/5:   0%|          | 9/2208 [00:04<14:20,  2.56it/s][A
Epoch 3/5:   0%|          | 10/2208 [00:05<13:44,  2.67it/s][A
Epoch 3/5:   0%|          | 11/2208 [00:05<13:38,  2.68it/s][A
Epoch 3/5:   1%|          | 12/2208 [00:05<13:14,  2.76it/s][A
Epoch 3/5:   1%|          | 13/2208 [00:06<13:11,  2.77it/s][A
Epoch 3/5:   1%|          | 14/2208 [00:06<12:57,  2.82it/s][A
Epoch 3/5:   1%|          | 15/2208 [00:07<13:09,  2.78it/s][A
Epoch 3/5:   1%|          | 16/2208 [00:07<13:01,  2.80it/s][A
Epoch 3/5:   1%|          | 17/2208 [00:07<13

Batch 25: Training accuracy = 0.8828, F1 = 0.8828, Precision = 0.8906, Recall = 0.8828



Epoch 3/5:   1%|          | 27/2208 [00:11<13:23,  2.71it/s][A
Epoch 3/5:   1%|▏         | 28/2208 [00:11<13:08,  2.76it/s][A
Epoch 3/5:   1%|▏         | 29/2208 [00:12<13:00,  2.79it/s][A
Epoch 3/5:   1%|▏         | 30/2208 [00:12<12:59,  2.79it/s][A
Epoch 3/5:   1%|▏         | 31/2208 [00:12<12:56,  2.80it/s][A
Epoch 3/5:   1%|▏         | 32/2208 [00:13<13:17,  2.73it/s][A
Epoch 3/5:   1%|▏         | 33/2208 [00:13<13:10,  2.75it/s][A
Epoch 3/5:   2%|▏         | 34/2208 [00:13<13:19,  2.72it/s][A
Epoch 3/5:   2%|▏         | 35/2208 [00:14<13:18,  2.72it/s][A
Epoch 3/5:   2%|▏         | 36/2208 [00:14<13:01,  2.78it/s][A
Epoch 3/5:   2%|▏         | 37/2208 [00:15<12:56,  2.80it/s][A
Epoch 3/5:   2%|▏         | 38/2208 [00:15<13:00,  2.78it/s][A
Epoch 3/5:   2%|▏         | 39/2208 [00:15<13:08,  2.75it/s][A
Epoch 3/5:   2%|▏         | 40/2208 [00:16<13:13,  2.73it/s][A
Epoch 3/5:   2%|▏         | 41/2208 [00:16<13:12,  2.73it/s][A
Epoch 3/5:   2%|▏         | 42/2208 [00

Batch 50: Training accuracy = 0.8828, F1 = 0.8703, Precision = 0.8691, Recall = 0.8828



Epoch 3/5:   2%|▏         | 52/2208 [00:20<12:30,  2.87it/s][A
Epoch 3/5:   2%|▏         | 53/2208 [00:20<12:57,  2.77it/s][A
Epoch 3/5:   2%|▏         | 54/2208 [00:21<12:46,  2.81it/s][A
Epoch 3/5:   2%|▏         | 55/2208 [00:21<12:35,  2.85it/s][A
Epoch 3/5:   3%|▎         | 56/2208 [00:21<13:02,  2.75it/s][A
Epoch 3/5:   3%|▎         | 57/2208 [00:22<12:48,  2.80it/s][A
Epoch 3/5:   3%|▎         | 58/2208 [00:22<12:40,  2.83it/s][A
Epoch 3/5:   3%|▎         | 59/2208 [00:22<12:36,  2.84it/s][A
Epoch 3/5:   3%|▎         | 60/2208 [00:23<12:48,  2.79it/s][A
Epoch 3/5:   3%|▎         | 61/2208 [00:23<12:59,  2.76it/s][A
Epoch 3/5:   3%|▎         | 62/2208 [00:23<12:51,  2.78it/s][A
Epoch 3/5:   3%|▎         | 63/2208 [00:24<12:38,  2.83it/s][A
Epoch 3/5:   3%|▎         | 64/2208 [00:24<12:37,  2.83it/s][A
Epoch 3/5:   3%|▎         | 65/2208 [00:25<12:27,  2.87it/s][A
Epoch 3/5:   3%|▎         | 66/2208 [00:25<12:23,  2.88it/s][A
Epoch 3/5:   3%|▎         | 67/2208 [00

Batch 75: Training accuracy = 0.8281, F1 = 0.8120, Precision = 0.8130, Recall = 0.8281



Epoch 3/5:   3%|▎         | 77/2208 [00:29<12:44,  2.79it/s][A
Epoch 3/5:   4%|▎         | 78/2208 [00:29<12:30,  2.84it/s][A
Epoch 3/5:   4%|▎         | 79/2208 [00:29<12:44,  2.79it/s][A
Epoch 3/5:   4%|▎         | 80/2208 [00:30<12:47,  2.77it/s][A
Epoch 3/5:   4%|▎         | 81/2208 [00:30<12:40,  2.80it/s][A
Epoch 3/5:   4%|▎         | 82/2208 [00:31<12:33,  2.82it/s][A
Epoch 3/5:   4%|▍         | 83/2208 [00:31<12:25,  2.85it/s][A
Epoch 3/5:   4%|▍         | 84/2208 [00:31<12:30,  2.83it/s][A
Epoch 3/5:   4%|▍         | 85/2208 [00:32<12:25,  2.85it/s][A
Epoch 3/5:   4%|▍         | 86/2208 [00:32<12:17,  2.88it/s][A
Epoch 3/5:   4%|▍         | 87/2208 [00:32<12:14,  2.89it/s][A
Epoch 3/5:   4%|▍         | 88/2208 [00:33<12:29,  2.83it/s][A
Epoch 3/5:   4%|▍         | 89/2208 [00:33<12:31,  2.82it/s][A
Epoch 3/5:   4%|▍         | 90/2208 [00:33<12:24,  2.84it/s][A
Epoch 3/5:   4%|▍         | 91/2208 [00:34<12:23,  2.85it/s][A
Epoch 3/5:   4%|▍         | 92/2208 [00

Batch 100: Training accuracy = 0.8672, F1 = 0.8583, Precision = 0.8607, Recall = 0.8672



Epoch 3/5:   5%|▍         | 102/2208 [00:38<12:21,  2.84it/s][A
Epoch 3/5:   5%|▍         | 103/2208 [00:38<12:19,  2.84it/s][A
Epoch 3/5:   5%|▍         | 104/2208 [00:38<12:14,  2.86it/s][A
Epoch 3/5:   5%|▍         | 105/2208 [00:39<12:18,  2.85it/s][A
Epoch 3/5:   5%|▍         | 106/2208 [00:39<12:10,  2.88it/s][A
Epoch 3/5:   5%|▍         | 107/2208 [00:39<12:17,  2.85it/s][A
Epoch 3/5:   5%|▍         | 108/2208 [00:40<12:20,  2.83it/s][A
Epoch 3/5:   5%|▍         | 109/2208 [00:40<12:36,  2.77it/s][A
Epoch 3/5:   5%|▍         | 110/2208 [00:40<12:36,  2.77it/s][A
Epoch 3/5:   5%|▌         | 111/2208 [00:41<12:28,  2.80it/s][A
Epoch 3/5:   5%|▌         | 112/2208 [00:41<12:15,  2.85it/s][A
Epoch 3/5:   5%|▌         | 113/2208 [00:41<12:14,  2.85it/s][A
Epoch 3/5:   5%|▌         | 114/2208 [00:42<12:29,  2.79it/s][A
Epoch 3/5:   5%|▌         | 115/2208 [00:42<12:38,  2.76it/s][A
Epoch 3/5:   5%|▌         | 116/2208 [00:43<12:38,  2.76it/s][A
Epoch 3/5:   5%|▌       

Batch 125: Training accuracy = 0.8672, F1 = 0.8547, Precision = 0.8561, Recall = 0.8672



Epoch 3/5:   6%|▌         | 127/2208 [00:47<13:01,  2.66it/s][A
Epoch 3/5:   6%|▌         | 128/2208 [00:47<12:53,  2.69it/s][A
Epoch 3/5:   6%|▌         | 129/2208 [00:47<13:01,  2.66it/s][A
Epoch 3/5:   6%|▌         | 130/2208 [00:48<12:51,  2.69it/s][A
Epoch 3/5:   6%|▌         | 131/2208 [00:48<12:58,  2.67it/s][A
Epoch 3/5:   6%|▌         | 132/2208 [00:48<12:52,  2.69it/s][A
Epoch 3/5:   6%|▌         | 133/2208 [00:49<12:59,  2.66it/s][A
Epoch 3/5:   6%|▌         | 134/2208 [00:49<12:36,  2.74it/s][A
Epoch 3/5:   6%|▌         | 135/2208 [00:50<12:31,  2.76it/s][A
Epoch 3/5:   6%|▌         | 136/2208 [00:50<12:16,  2.81it/s][A
Epoch 3/5:   6%|▌         | 137/2208 [00:50<12:12,  2.83it/s][A
Epoch 3/5:   6%|▋         | 138/2208 [00:51<12:06,  2.85it/s][A
Epoch 3/5:   6%|▋         | 139/2208 [00:51<12:06,  2.85it/s][A
Epoch 3/5:   6%|▋         | 140/2208 [00:51<11:57,  2.88it/s][A
Epoch 3/5:   6%|▋         | 141/2208 [00:52<12:23,  2.78it/s][A
Epoch 3/5:   6%|▋       

Batch 150: Training accuracy = 0.8828, F1 = 0.8793, Precision = 0.9089, Recall = 0.8828



Epoch 3/5:   7%|▋         | 152/2208 [00:56<12:11,  2.81it/s][A
Epoch 3/5:   7%|▋         | 153/2208 [00:56<12:11,  2.81it/s][A
Epoch 3/5:   7%|▋         | 154/2208 [00:56<12:16,  2.79it/s][A
Epoch 3/5:   7%|▋         | 155/2208 [00:57<12:14,  2.79it/s][A
Epoch 3/5:   7%|▋         | 156/2208 [00:57<12:05,  2.83it/s][A
Epoch 3/5:   7%|▋         | 157/2208 [00:57<12:00,  2.85it/s][A
Epoch 3/5:   7%|▋         | 158/2208 [00:58<12:01,  2.84it/s][A
Epoch 3/5:   7%|▋         | 159/2208 [00:58<12:09,  2.81it/s][A
Epoch 3/5:   7%|▋         | 160/2208 [00:58<12:06,  2.82it/s][A
Epoch 3/5:   7%|▋         | 161/2208 [00:59<12:02,  2.83it/s][A
Epoch 3/5:   7%|▋         | 162/2208 [00:59<12:14,  2.79it/s][A
Epoch 3/5:   7%|▋         | 163/2208 [01:00<12:36,  2.70it/s][A
Epoch 3/5:   7%|▋         | 164/2208 [01:00<12:34,  2.71it/s][A
Epoch 3/5:   7%|▋         | 165/2208 [01:00<12:33,  2.71it/s][A
Epoch 3/5:   8%|▊         | 166/2208 [01:01<12:20,  2.76it/s][A
Epoch 3/5:   8%|▊       

Batch 175: Training accuracy = 0.8281, F1 = 0.8260, Precision = 0.8434, Recall = 0.8281



Epoch 3/5:   8%|▊         | 177/2208 [01:04<11:49,  2.86it/s][A
Epoch 3/5:   8%|▊         | 178/2208 [01:05<11:48,  2.87it/s][A
Epoch 3/5:   8%|▊         | 179/2208 [01:05<11:40,  2.90it/s][A
Epoch 3/5:   8%|▊         | 180/2208 [01:06<11:40,  2.90it/s][A
Epoch 3/5:   8%|▊         | 181/2208 [01:06<11:52,  2.84it/s][A
Epoch 3/5:   8%|▊         | 182/2208 [01:06<11:45,  2.87it/s][A
Epoch 3/5:   8%|▊         | 183/2208 [01:07<11:59,  2.81it/s][A
Epoch 3/5:   8%|▊         | 184/2208 [01:07<11:49,  2.85it/s][A
Epoch 3/5:   8%|▊         | 185/2208 [01:07<11:42,  2.88it/s][A
Epoch 3/5:   8%|▊         | 186/2208 [01:08<11:39,  2.89it/s][A
Epoch 3/5:   8%|▊         | 187/2208 [01:08<11:33,  2.91it/s][A
Epoch 3/5:   9%|▊         | 188/2208 [01:08<11:33,  2.91it/s][A
Epoch 3/5:   9%|▊         | 189/2208 [01:09<11:31,  2.92it/s][A
Epoch 3/5:   9%|▊         | 190/2208 [01:09<11:31,  2.92it/s][A
Epoch 3/5:   9%|▊         | 191/2208 [01:09<12:01,  2.80it/s][A
Epoch 3/5:   9%|▊       

Batch 200: Training accuracy = 0.8438, F1 = 0.8385, Precision = 0.8438, Recall = 0.8438



Epoch 3/5:   9%|▉         | 202/2208 [01:13<12:15,  2.73it/s][A
Epoch 3/5:   9%|▉         | 203/2208 [01:14<12:29,  2.68it/s][A
Epoch 3/5:   9%|▉         | 204/2208 [01:14<12:31,  2.67it/s][A
Epoch 3/5:   9%|▉         | 205/2208 [01:14<12:08,  2.75it/s][A
Epoch 3/5:   9%|▉         | 206/2208 [01:15<12:12,  2.73it/s][A
Epoch 3/5:   9%|▉         | 207/2208 [01:15<12:06,  2.76it/s][A
Epoch 3/5:   9%|▉         | 208/2208 [01:16<12:14,  2.72it/s][A
Epoch 3/5:   9%|▉         | 209/2208 [01:16<12:01,  2.77it/s][A
Epoch 3/5:  10%|▉         | 210/2208 [01:16<12:07,  2.75it/s][A
Epoch 3/5:  10%|▉         | 211/2208 [01:17<12:11,  2.73it/s][A
Epoch 3/5:  10%|▉         | 212/2208 [01:17<11:56,  2.79it/s][A
Epoch 3/5:  10%|▉         | 213/2208 [01:17<11:44,  2.83it/s][A
Epoch 3/5:  10%|▉         | 214/2208 [01:18<11:38,  2.85it/s][A
Epoch 3/5:  10%|▉         | 215/2208 [01:18<11:31,  2.88it/s][A
Epoch 3/5:  10%|▉         | 216/2208 [01:18<11:29,  2.89it/s][A
Epoch 3/5:  10%|▉       

Batch 225: Training accuracy = 0.8516, F1 = 0.8370, Precision = 0.8320, Recall = 0.8516



Epoch 3/5:  10%|█         | 227/2208 [01:22<11:34,  2.85it/s][A
Epoch 3/5:  10%|█         | 228/2208 [01:23<11:44,  2.81it/s][A
Epoch 3/5:  10%|█         | 229/2208 [01:23<11:49,  2.79it/s][A
Epoch 3/5:  10%|█         | 230/2208 [01:23<11:41,  2.82it/s][A
Epoch 3/5:  10%|█         | 231/2208 [01:24<11:40,  2.82it/s][A
Epoch 3/5:  11%|█         | 232/2208 [01:24<11:33,  2.85it/s][A
Epoch 3/5:  11%|█         | 233/2208 [01:24<11:37,  2.83it/s][A
Epoch 3/5:  11%|█         | 234/2208 [01:25<11:39,  2.82it/s][A
Epoch 3/5:  11%|█         | 235/2208 [01:25<11:38,  2.82it/s][A
Epoch 3/5:  11%|█         | 236/2208 [01:25<11:28,  2.86it/s][A
Epoch 3/5:  11%|█         | 237/2208 [01:26<11:40,  2.81it/s][A
Epoch 3/5:  11%|█         | 238/2208 [01:26<11:44,  2.80it/s][A
Epoch 3/5:  11%|█         | 239/2208 [01:26<11:55,  2.75it/s][A
Epoch 3/5:  11%|█         | 240/2208 [01:27<11:45,  2.79it/s][A
Epoch 3/5:  11%|█         | 241/2208 [01:27<11:36,  2.83it/s][A
Epoch 3/5:  11%|█       

Batch 250: Training accuracy = 0.7891, F1 = 0.7786, Precision = 0.7812, Recall = 0.7891



Epoch 3/5:  11%|█▏        | 252/2208 [01:31<11:45,  2.77it/s][A
Epoch 3/5:  11%|█▏        | 253/2208 [01:32<12:01,  2.71it/s][A
Epoch 3/5:  12%|█▏        | 254/2208 [01:32<12:10,  2.68it/s][A
Epoch 3/5:  12%|█▏        | 255/2208 [01:32<11:54,  2.73it/s][A
Epoch 3/5:  12%|█▏        | 256/2208 [01:33<12:00,  2.71it/s][A
Epoch 3/5:  12%|█▏        | 257/2208 [01:33<12:12,  2.66it/s][A
Epoch 3/5:  12%|█▏        | 258/2208 [01:34<12:16,  2.65it/s][A
Epoch 3/5:  12%|█▏        | 259/2208 [01:34<11:56,  2.72it/s][A
Epoch 3/5:  12%|█▏        | 260/2208 [01:34<12:05,  2.69it/s][A
Epoch 3/5:  12%|█▏        | 261/2208 [01:35<11:47,  2.75it/s][A
Epoch 3/5:  12%|█▏        | 262/2208 [01:35<11:52,  2.73it/s][A
Epoch 3/5:  12%|█▏        | 263/2208 [01:35<11:47,  2.75it/s][A
Epoch 3/5:  12%|█▏        | 264/2208 [01:36<11:45,  2.76it/s][A
Epoch 3/5:  12%|█▏        | 265/2208 [01:36<11:52,  2.73it/s][A
Epoch 3/5:  12%|█▏        | 266/2208 [01:36<11:37,  2.78it/s][A
Epoch 3/5:  12%|█▏      

Batch 275: Training accuracy = 0.8594, F1 = 0.8456, Precision = 0.8418, Recall = 0.8594



Epoch 3/5:  13%|█▎        | 277/2208 [01:40<11:35,  2.78it/s][A
Epoch 3/5:  13%|█▎        | 278/2208 [01:41<11:34,  2.78it/s][A
Epoch 3/5:  13%|█▎        | 279/2208 [01:41<11:33,  2.78it/s][A
Epoch 3/5:  13%|█▎        | 280/2208 [01:41<11:25,  2.81it/s][A
Epoch 3/5:  13%|█▎        | 281/2208 [01:42<11:23,  2.82it/s][A
Epoch 3/5:  13%|█▎        | 282/2208 [01:42<11:16,  2.85it/s][A
Epoch 3/5:  13%|█▎        | 283/2208 [01:42<11:13,  2.86it/s][A
Epoch 3/5:  13%|█▎        | 284/2208 [01:43<11:18,  2.83it/s][A
Epoch 3/5:  13%|█▎        | 285/2208 [01:43<11:24,  2.81it/s][A
Epoch 3/5:  13%|█▎        | 286/2208 [01:44<11:31,  2.78it/s][A
Epoch 3/5:  13%|█▎        | 287/2208 [01:44<11:40,  2.74it/s][A
Epoch 3/5:  13%|█▎        | 288/2208 [01:44<11:34,  2.77it/s][A
Epoch 3/5:  13%|█▎        | 289/2208 [01:45<11:26,  2.79it/s][A
Epoch 3/5:  13%|█▎        | 290/2208 [01:45<11:19,  2.82it/s][A
Epoch 3/5:  13%|█▎        | 291/2208 [01:45<11:27,  2.79it/s][A
Epoch 3/5:  13%|█▎      

Batch 300: Training accuracy = 0.8750, F1 = 0.8646, Precision = 0.8659, Recall = 0.8750



Epoch 3/5:  14%|█▎        | 302/2208 [01:49<11:08,  2.85it/s][A
Epoch 3/5:  14%|█▎        | 303/2208 [01:50<11:19,  2.81it/s][A
Epoch 3/5:  14%|█▍        | 304/2208 [01:50<11:15,  2.82it/s][A
Epoch 3/5:  14%|█▍        | 305/2208 [01:50<11:10,  2.84it/s][A
Epoch 3/5:  14%|█▍        | 306/2208 [01:51<11:14,  2.82it/s][A
Epoch 3/5:  14%|█▍        | 307/2208 [01:51<11:23,  2.78it/s][A
Epoch 3/5:  14%|█▍        | 308/2208 [01:51<11:12,  2.83it/s][A
Epoch 3/5:  14%|█▍        | 309/2208 [01:52<11:06,  2.85it/s][A
Epoch 3/5:  14%|█▍        | 310/2208 [01:52<11:03,  2.86it/s][A
Epoch 3/5:  14%|█▍        | 311/2208 [01:52<11:23,  2.78it/s][A
Epoch 3/5:  14%|█▍        | 312/2208 [01:53<11:14,  2.81it/s][A
Epoch 3/5:  14%|█▍        | 313/2208 [01:53<11:22,  2.78it/s][A
Epoch 3/5:  14%|█▍        | 314/2208 [01:54<11:17,  2.80it/s][A
Epoch 3/5:  14%|█▍        | 315/2208 [01:54<11:21,  2.78it/s][A
Epoch 3/5:  14%|█▍        | 316/2208 [01:54<11:10,  2.82it/s][A
Epoch 3/5:  14%|█▍      

Batch 325: Training accuracy = 0.8438, F1 = 0.8287, Precision = 0.8344, Recall = 0.8438



Epoch 3/5:  15%|█▍        | 327/2208 [01:58<11:21,  2.76it/s][A
Epoch 3/5:  15%|█▍        | 328/2208 [01:59<11:10,  2.80it/s][A
Epoch 3/5:  15%|█▍        | 329/2208 [01:59<11:04,  2.83it/s][A
Epoch 3/5:  15%|█▍        | 330/2208 [01:59<10:59,  2.85it/s][A
Epoch 3/5:  15%|█▍        | 331/2208 [02:00<10:55,  2.86it/s][A
Epoch 3/5:  15%|█▌        | 332/2208 [02:00<11:12,  2.79it/s][A
Epoch 3/5:  15%|█▌        | 333/2208 [02:00<11:09,  2.80it/s][A
Epoch 3/5:  15%|█▌        | 334/2208 [02:01<11:08,  2.80it/s][A
Epoch 3/5:  15%|█▌        | 335/2208 [02:01<10:59,  2.84it/s][A
Epoch 3/5:  15%|█▌        | 336/2208 [02:01<10:56,  2.85it/s][A
Epoch 3/5:  15%|█▌        | 337/2208 [02:02<10:51,  2.87it/s][A
Epoch 3/5:  15%|█▌        | 338/2208 [02:02<10:49,  2.88it/s][A
Epoch 3/5:  15%|█▌        | 339/2208 [02:02<10:58,  2.84it/s][A
Epoch 3/5:  15%|█▌        | 340/2208 [02:03<10:56,  2.85it/s][A
Epoch 3/5:  15%|█▌        | 341/2208 [02:03<10:48,  2.88it/s][A
Epoch 3/5:  15%|█▌      

Batch 350: Training accuracy = 0.8516, F1 = 0.8458, Precision = 0.8555, Recall = 0.8516



Epoch 3/5:  16%|█▌        | 352/2208 [02:07<10:48,  2.86it/s][A
Epoch 3/5:  16%|█▌        | 353/2208 [02:07<10:48,  2.86it/s][A
Epoch 3/5:  16%|█▌        | 354/2208 [02:08<10:47,  2.86it/s][A
Epoch 3/5:  16%|█▌        | 355/2208 [02:08<10:42,  2.88it/s][A
Epoch 3/5:  16%|█▌        | 356/2208 [02:08<10:38,  2.90it/s][A
Epoch 3/5:  16%|█▌        | 357/2208 [02:09<10:40,  2.89it/s][A
Epoch 3/5:  16%|█▌        | 358/2208 [02:09<10:37,  2.90it/s][A
Epoch 3/5:  16%|█▋        | 359/2208 [02:09<10:55,  2.82it/s][A
Epoch 3/5:  16%|█▋        | 360/2208 [02:10<11:02,  2.79it/s][A
Epoch 3/5:  16%|█▋        | 361/2208 [02:10<10:53,  2.83it/s][A
Epoch 3/5:  16%|█▋        | 362/2208 [02:11<11:10,  2.75it/s][A
Epoch 3/5:  16%|█▋        | 363/2208 [02:11<11:23,  2.70it/s][A
Epoch 3/5:  16%|█▋        | 364/2208 [02:11<11:24,  2.69it/s][A
Epoch 3/5:  17%|█▋        | 365/2208 [02:12<11:12,  2.74it/s][A
Epoch 3/5:  17%|█▋        | 366/2208 [02:12<11:06,  2.76it/s][A
Epoch 3/5:  17%|█▋      

Batch 375: Training accuracy = 0.8672, F1 = 0.8488, Precision = 0.8477, Recall = 0.8672



Epoch 3/5:  17%|█▋        | 377/2208 [02:16<10:58,  2.78it/s][A
Epoch 3/5:  17%|█▋        | 378/2208 [02:16<11:20,  2.69it/s][A
Epoch 3/5:  17%|█▋        | 379/2208 [02:17<11:04,  2.75it/s][A
Epoch 3/5:  17%|█▋        | 380/2208 [02:17<10:51,  2.81it/s][A
Epoch 3/5:  17%|█▋        | 381/2208 [02:17<10:41,  2.85it/s][A
Epoch 3/5:  17%|█▋        | 382/2208 [02:18<10:43,  2.84it/s][A
Epoch 3/5:  17%|█▋        | 383/2208 [02:18<10:36,  2.87it/s][A
Epoch 3/5:  17%|█▋        | 384/2208 [02:18<10:34,  2.88it/s][A
Epoch 3/5:  17%|█▋        | 385/2208 [02:19<10:30,  2.89it/s][A
Epoch 3/5:  17%|█▋        | 386/2208 [02:19<10:27,  2.90it/s][A
Epoch 3/5:  18%|█▊        | 387/2208 [02:20<10:40,  2.84it/s][A
Epoch 3/5:  18%|█▊        | 388/2208 [02:20<10:44,  2.82it/s][A
Epoch 3/5:  18%|█▊        | 389/2208 [02:20<10:40,  2.84it/s][A
Epoch 3/5:  18%|█▊        | 390/2208 [02:21<10:34,  2.87it/s][A
Epoch 3/5:  18%|█▊        | 391/2208 [02:21<10:33,  2.87it/s][A
Epoch 3/5:  18%|█▊      

Batch 400: Training accuracy = 0.9297, F1 = 0.9193, Precision = 0.9141, Recall = 0.9297



Epoch 3/5:  18%|█▊        | 402/2208 [02:25<10:51,  2.77it/s][A
Epoch 3/5:  18%|█▊        | 403/2208 [02:25<10:41,  2.81it/s][A
Epoch 3/5:  18%|█▊        | 404/2208 [02:26<10:58,  2.74it/s][A
Epoch 3/5:  18%|█▊        | 405/2208 [02:26<10:48,  2.78it/s][A
Epoch 3/5:  18%|█▊        | 406/2208 [02:26<10:44,  2.80it/s][A
Epoch 3/5:  18%|█▊        | 407/2208 [02:27<11:02,  2.72it/s][A
Epoch 3/5:  18%|█▊        | 408/2208 [02:27<11:05,  2.71it/s][A
Epoch 3/5:  19%|█▊        | 409/2208 [02:27<11:08,  2.69it/s][A
Epoch 3/5:  19%|█▊        | 410/2208 [02:28<11:07,  2.69it/s][A
Epoch 3/5:  19%|█▊        | 411/2208 [02:28<11:20,  2.64it/s][A
Epoch 3/5:  19%|█▊        | 412/2208 [02:29<11:08,  2.69it/s][A
Epoch 3/5:  19%|█▊        | 413/2208 [02:29<10:58,  2.73it/s][A
Epoch 3/5:  19%|█▉        | 414/2208 [02:29<11:02,  2.71it/s][A
Epoch 3/5:  19%|█▉        | 415/2208 [02:30<10:52,  2.75it/s][A
Epoch 3/5:  19%|█▉        | 416/2208 [02:30<10:38,  2.81it/s][A
Epoch 3/5:  19%|█▉      

Batch 425: Training accuracy = 0.8906, F1 = 0.8717, Precision = 0.8743, Recall = 0.8906



Epoch 3/5:  19%|█▉        | 427/2208 [02:34<10:33,  2.81it/s][A
Epoch 3/5:  19%|█▉        | 428/2208 [02:34<10:24,  2.85it/s][A
Epoch 3/5:  19%|█▉        | 429/2208 [02:35<10:23,  2.85it/s][A
Epoch 3/5:  19%|█▉        | 430/2208 [02:35<10:18,  2.88it/s][A
Epoch 3/5:  20%|█▉        | 431/2208 [02:35<10:15,  2.89it/s][A
Epoch 3/5:  20%|█▉        | 432/2208 [02:36<10:18,  2.87it/s][A
Epoch 3/5:  20%|█▉        | 433/2208 [02:36<10:17,  2.88it/s][A
Epoch 3/5:  20%|█▉        | 434/2208 [02:36<10:42,  2.76it/s][A
Epoch 3/5:  20%|█▉        | 435/2208 [02:37<10:50,  2.73it/s][A
Epoch 3/5:  20%|█▉        | 436/2208 [02:37<10:52,  2.71it/s][A
Epoch 3/5:  20%|█▉        | 437/2208 [02:37<10:37,  2.78it/s][A
Epoch 3/5:  20%|█▉        | 438/2208 [02:38<10:25,  2.83it/s][A
Epoch 3/5:  20%|█▉        | 439/2208 [02:38<10:34,  2.79it/s][A
Epoch 3/5:  20%|█▉        | 440/2208 [02:38<10:24,  2.83it/s][A
Epoch 3/5:  20%|█▉        | 441/2208 [02:39<10:18,  2.86it/s][A
Epoch 3/5:  20%|██      

Batch 450: Training accuracy = 0.8516, F1 = 0.8406, Precision = 0.8477, Recall = 0.8516



Epoch 3/5:  20%|██        | 452/2208 [02:43<10:30,  2.78it/s][A
Epoch 3/5:  21%|██        | 453/2208 [02:43<10:27,  2.79it/s][A
Epoch 3/5:  21%|██        | 454/2208 [02:43<10:39,  2.74it/s][A
Epoch 3/5:  21%|██        | 455/2208 [02:44<10:44,  2.72it/s][A
Epoch 3/5:  21%|██        | 456/2208 [02:44<10:52,  2.69it/s][A
Epoch 3/5:  21%|██        | 457/2208 [02:45<10:43,  2.72it/s][A
Epoch 3/5:  21%|██        | 458/2208 [02:45<10:39,  2.74it/s][A
Epoch 3/5:  21%|██        | 459/2208 [02:45<10:41,  2.73it/s][A
Epoch 3/5:  21%|██        | 460/2208 [02:46<10:25,  2.79it/s][A
Epoch 3/5:  21%|██        | 461/2208 [02:46<10:26,  2.79it/s][A
Epoch 3/5:  21%|██        | 462/2208 [02:46<10:38,  2.74it/s][A
Epoch 3/5:  21%|██        | 463/2208 [02:47<10:26,  2.78it/s][A
Epoch 3/5:  21%|██        | 464/2208 [02:47<10:23,  2.80it/s][A
Epoch 3/5:  21%|██        | 465/2208 [02:47<10:19,  2.81it/s][A
Epoch 3/5:  21%|██        | 466/2208 [02:48<10:27,  2.78it/s][A
Epoch 3/5:  21%|██      

Batch 475: Training accuracy = 0.8594, F1 = 0.8401, Precision = 0.8398, Recall = 0.8594



Epoch 3/5:  22%|██▏       | 477/2208 [02:52<10:32,  2.74it/s][A
Epoch 3/5:  22%|██▏       | 478/2208 [02:52<10:18,  2.80it/s][A
Epoch 3/5:  22%|██▏       | 479/2208 [02:52<10:09,  2.84it/s][A
Epoch 3/5:  22%|██▏       | 480/2208 [02:53<10:06,  2.85it/s][A
Epoch 3/5:  22%|██▏       | 481/2208 [02:53<10:04,  2.86it/s][A
Epoch 3/5:  22%|██▏       | 482/2208 [02:54<10:05,  2.85it/s][A
Epoch 3/5:  22%|██▏       | 483/2208 [02:54<10:14,  2.81it/s][A
Epoch 3/5:  22%|██▏       | 484/2208 [02:54<10:05,  2.85it/s][A
Epoch 3/5:  22%|██▏       | 485/2208 [02:55<10:08,  2.83it/s][A
Epoch 3/5:  22%|██▏       | 486/2208 [02:55<10:03,  2.85it/s][A
Epoch 3/5:  22%|██▏       | 487/2208 [02:55<10:23,  2.76it/s][A
Epoch 3/5:  22%|██▏       | 488/2208 [02:56<10:26,  2.74it/s][A
Epoch 3/5:  22%|██▏       | 489/2208 [02:56<10:27,  2.74it/s][A
Epoch 3/5:  22%|██▏       | 490/2208 [02:56<10:28,  2.73it/s][A
Epoch 3/5:  22%|██▏       | 491/2208 [02:57<10:35,  2.70it/s][A
Epoch 3/5:  22%|██▏     

Batch 500: Training accuracy = 0.8125, F1 = 0.7870, Precision = 0.7760, Recall = 0.8125



Epoch 3/5:  23%|██▎       | 502/2208 [03:01<09:57,  2.85it/s][A
Epoch 3/5:  23%|██▎       | 503/2208 [03:01<09:56,  2.86it/s][A
Epoch 3/5:  23%|██▎       | 504/2208 [03:02<10:05,  2.81it/s][A
Epoch 3/5:  23%|██▎       | 505/2208 [03:02<10:01,  2.83it/s][A
Epoch 3/5:  23%|██▎       | 506/2208 [03:02<09:54,  2.86it/s][A
Epoch 3/5:  23%|██▎       | 507/2208 [03:03<09:56,  2.85it/s][A
Epoch 3/5:  23%|██▎       | 508/2208 [03:03<10:06,  2.80it/s][A
Epoch 3/5:  23%|██▎       | 509/2208 [03:03<09:57,  2.84it/s][A
Epoch 3/5:  23%|██▎       | 510/2208 [03:04<10:04,  2.81it/s][A
Epoch 3/5:  23%|██▎       | 511/2208 [03:04<09:56,  2.85it/s][A
Epoch 3/5:  23%|██▎       | 512/2208 [03:04<09:49,  2.88it/s][A
Epoch 3/5:  23%|██▎       | 513/2208 [03:05<09:45,  2.89it/s][A
Epoch 3/5:  23%|██▎       | 514/2208 [03:05<09:46,  2.89it/s][A
Epoch 3/5:  23%|██▎       | 515/2208 [03:05<09:44,  2.90it/s][A
Epoch 3/5:  23%|██▎       | 516/2208 [03:06<09:42,  2.91it/s][A
Epoch 3/5:  23%|██▎     

Batch 525: Training accuracy = 0.8594, F1 = 0.8396, Precision = 0.8405, Recall = 0.8594



Epoch 3/5:  24%|██▍       | 527/2208 [03:10<10:06,  2.77it/s][A
Epoch 3/5:  24%|██▍       | 528/2208 [03:10<09:57,  2.81it/s][A
Epoch 3/5:  24%|██▍       | 529/2208 [03:10<09:54,  2.82it/s][A
Epoch 3/5:  24%|██▍       | 530/2208 [03:11<09:59,  2.80it/s][A
Epoch 3/5:  24%|██▍       | 531/2208 [03:11<09:58,  2.80it/s][A
Epoch 3/5:  24%|██▍       | 532/2208 [03:11<10:02,  2.78it/s][A
Epoch 3/5:  24%|██▍       | 533/2208 [03:12<10:08,  2.75it/s][A
Epoch 3/5:  24%|██▍       | 534/2208 [03:12<10:12,  2.73it/s][A
Epoch 3/5:  24%|██▍       | 535/2208 [03:13<10:07,  2.75it/s][A
Epoch 3/5:  24%|██▍       | 536/2208 [03:13<10:22,  2.69it/s][A
Epoch 3/5:  24%|██▍       | 537/2208 [03:13<10:23,  2.68it/s][A
Epoch 3/5:  24%|██▍       | 538/2208 [03:14<10:17,  2.70it/s][A
Epoch 3/5:  24%|██▍       | 539/2208 [03:14<10:04,  2.76it/s][A
Epoch 3/5:  24%|██▍       | 540/2208 [03:14<09:58,  2.79it/s][A
Epoch 3/5:  25%|██▍       | 541/2208 [03:15<09:54,  2.80it/s][A
Epoch 3/5:  25%|██▍     

Batch 550: Training accuracy = 0.8203, F1 = 0.8099, Precision = 0.8318, Recall = 0.8203



Epoch 3/5:  25%|██▌       | 552/2208 [03:19<10:02,  2.75it/s][A
Epoch 3/5:  25%|██▌       | 553/2208 [03:19<09:50,  2.80it/s][A
Epoch 3/5:  25%|██▌       | 554/2208 [03:19<09:41,  2.84it/s][A
Epoch 3/5:  25%|██▌       | 555/2208 [03:20<09:37,  2.86it/s][A
Epoch 3/5:  25%|██▌       | 556/2208 [03:20<09:33,  2.88it/s][A
Epoch 3/5:  25%|██▌       | 557/2208 [03:20<09:41,  2.84it/s][A
Epoch 3/5:  25%|██▌       | 558/2208 [03:21<09:38,  2.85it/s][A
Epoch 3/5:  25%|██▌       | 559/2208 [03:21<09:43,  2.83it/s][A
Epoch 3/5:  25%|██▌       | 560/2208 [03:21<09:35,  2.87it/s][A
Epoch 3/5:  25%|██▌       | 561/2208 [03:22<09:55,  2.77it/s][A
Epoch 3/5:  25%|██▌       | 562/2208 [03:22<09:54,  2.77it/s][A
Epoch 3/5:  25%|██▌       | 563/2208 [03:22<09:57,  2.75it/s][A
Epoch 3/5:  26%|██▌       | 564/2208 [03:23<10:08,  2.70it/s][A
Epoch 3/5:  26%|██▌       | 565/2208 [03:23<10:03,  2.72it/s][A
Epoch 3/5:  26%|██▌       | 566/2208 [03:24<10:04,  2.71it/s][A
Epoch 3/5:  26%|██▌     

Batch 575: Training accuracy = 0.8359, F1 = 0.8344, Precision = 0.8500, Recall = 0.8359



Epoch 3/5:  26%|██▌       | 577/2208 [03:28<10:12,  2.66it/s][A
Epoch 3/5:  26%|██▌       | 578/2208 [03:28<10:04,  2.70it/s][A
Epoch 3/5:  26%|██▌       | 579/2208 [03:28<10:04,  2.69it/s][A
Epoch 3/5:  26%|██▋       | 580/2208 [03:29<10:02,  2.70it/s][A
Epoch 3/5:  26%|██▋       | 581/2208 [03:29<09:56,  2.73it/s][A
Epoch 3/5:  26%|██▋       | 582/2208 [03:29<09:57,  2.72it/s][A
Epoch 3/5:  26%|██▋       | 583/2208 [03:30<09:56,  2.72it/s][A
Epoch 3/5:  26%|██▋       | 584/2208 [03:30<10:05,  2.68it/s][A
Epoch 3/5:  26%|██▋       | 585/2208 [03:31<09:49,  2.75it/s][A
Epoch 3/5:  27%|██▋       | 586/2208 [03:31<09:40,  2.80it/s][A
Epoch 3/5:  27%|██▋       | 587/2208 [03:31<09:37,  2.81it/s][A
Epoch 3/5:  27%|██▋       | 588/2208 [03:32<09:32,  2.83it/s][A
Epoch 3/5:  27%|██▋       | 589/2208 [03:32<09:40,  2.79it/s][A
Epoch 3/5:  27%|██▋       | 590/2208 [03:32<09:41,  2.78it/s][A
Epoch 3/5:  27%|██▋       | 591/2208 [03:33<09:45,  2.76it/s][A
Epoch 3/5:  27%|██▋     

Batch 600: Training accuracy = 0.7969, F1 = 0.7852, Precision = 0.7897, Recall = 0.7969



Epoch 3/5:  27%|██▋       | 602/2208 [03:37<09:24,  2.85it/s][A
Epoch 3/5:  27%|██▋       | 603/2208 [03:37<09:20,  2.86it/s][A
Epoch 3/5:  27%|██▋       | 604/2208 [03:37<09:33,  2.80it/s][A
Epoch 3/5:  27%|██▋       | 605/2208 [03:38<09:42,  2.75it/s][A
Epoch 3/5:  27%|██▋       | 606/2208 [03:38<09:44,  2.74it/s][A
Epoch 3/5:  27%|██▋       | 607/2208 [03:38<09:36,  2.78it/s][A
Epoch 3/5:  28%|██▊       | 608/2208 [03:39<09:30,  2.80it/s][A
Epoch 3/5:  28%|██▊       | 609/2208 [03:39<09:38,  2.77it/s][A
Epoch 3/5:  28%|██▊       | 610/2208 [03:39<09:28,  2.81it/s][A
Epoch 3/5:  28%|██▊       | 611/2208 [03:40<09:27,  2.81it/s][A
Epoch 3/5:  28%|██▊       | 612/2208 [03:40<09:26,  2.82it/s][A
Epoch 3/5:  28%|██▊       | 613/2208 [03:40<09:21,  2.84it/s][A
Epoch 3/5:  28%|██▊       | 614/2208 [03:41<09:34,  2.77it/s][A
Epoch 3/5:  28%|██▊       | 615/2208 [03:41<09:40,  2.74it/s][A
Epoch 3/5:  28%|██▊       | 616/2208 [03:42<09:47,  2.71it/s][A
Epoch 3/5:  28%|██▊     

Batch 625: Training accuracy = 0.8438, F1 = 0.8248, Precision = 0.8161, Recall = 0.8438



Epoch 3/5:  28%|██▊       | 627/2208 [03:46<09:30,  2.77it/s][A
Epoch 3/5:  28%|██▊       | 628/2208 [03:46<09:25,  2.79it/s][A
Epoch 3/5:  28%|██▊       | 629/2208 [03:46<09:16,  2.84it/s][A
Epoch 3/5:  29%|██▊       | 630/2208 [03:47<09:12,  2.85it/s][A
Epoch 3/5:  29%|██▊       | 631/2208 [03:47<09:08,  2.88it/s][A
Epoch 3/5:  29%|██▊       | 632/2208 [03:47<09:13,  2.85it/s][A
Epoch 3/5:  29%|██▊       | 633/2208 [03:48<09:18,  2.82it/s][A
Epoch 3/5:  29%|██▊       | 634/2208 [03:48<09:26,  2.78it/s][A
Epoch 3/5:  29%|██▉       | 635/2208 [03:48<09:26,  2.78it/s][A
Epoch 3/5:  29%|██▉       | 636/2208 [03:49<09:22,  2.79it/s][A
Epoch 3/5:  29%|██▉       | 637/2208 [03:49<09:29,  2.76it/s][A
Epoch 3/5:  29%|██▉       | 638/2208 [03:49<09:22,  2.79it/s][A
Epoch 3/5:  29%|██▉       | 639/2208 [03:50<09:17,  2.81it/s][A
Epoch 3/5:  29%|██▉       | 640/2208 [03:50<09:13,  2.83it/s][A
Epoch 3/5:  29%|██▉       | 641/2208 [03:51<09:09,  2.85it/s][A
Epoch 3/5:  29%|██▉     

Batch 650: Training accuracy = 0.8594, F1 = 0.8594, Precision = 0.8776, Recall = 0.8594



Epoch 3/5:  30%|██▉       | 652/2208 [03:55<09:45,  2.66it/s][A
Epoch 3/5:  30%|██▉       | 653/2208 [03:55<09:36,  2.70it/s][A
Epoch 3/5:  30%|██▉       | 654/2208 [03:55<09:30,  2.72it/s][A
Epoch 3/5:  30%|██▉       | 655/2208 [03:56<09:27,  2.74it/s][A
Epoch 3/5:  30%|██▉       | 656/2208 [03:56<09:31,  2.71it/s][A
Epoch 3/5:  30%|██▉       | 657/2208 [03:56<09:34,  2.70it/s][A
Epoch 3/5:  30%|██▉       | 658/2208 [03:57<09:36,  2.69it/s][A
Epoch 3/5:  30%|██▉       | 659/2208 [03:57<09:31,  2.71it/s][A
Epoch 3/5:  30%|██▉       | 660/2208 [03:57<09:42,  2.66it/s][A
Epoch 3/5:  30%|██▉       | 661/2208 [03:58<09:39,  2.67it/s][A
Epoch 3/5:  30%|██▉       | 662/2208 [03:58<09:22,  2.75it/s][A
Epoch 3/5:  30%|███       | 663/2208 [03:59<09:11,  2.80it/s][A
Epoch 3/5:  30%|███       | 664/2208 [03:59<09:03,  2.84it/s][A
Epoch 3/5:  30%|███       | 665/2208 [03:59<09:04,  2.83it/s][A
Epoch 3/5:  30%|███       | 666/2208 [04:00<09:08,  2.81it/s][A
Epoch 3/5:  30%|███     

Batch 675: Training accuracy = 0.8281, F1 = 0.8099, Precision = 0.8073, Recall = 0.8281



Epoch 3/5:  31%|███       | 677/2208 [04:04<09:14,  2.76it/s][A
Epoch 3/5:  31%|███       | 678/2208 [04:04<09:12,  2.77it/s][A
Epoch 3/5:  31%|███       | 679/2208 [04:04<09:18,  2.74it/s][A
Epoch 3/5:  31%|███       | 680/2208 [04:05<09:10,  2.78it/s][A
Epoch 3/5:  31%|███       | 681/2208 [04:05<09:03,  2.81it/s][A
Epoch 3/5:  31%|███       | 682/2208 [04:05<09:12,  2.76it/s][A
Epoch 3/5:  31%|███       | 683/2208 [04:06<09:17,  2.74it/s][A
Epoch 3/5:  31%|███       | 684/2208 [04:06<09:10,  2.77it/s][A
Epoch 3/5:  31%|███       | 685/2208 [04:06<09:04,  2.80it/s][A
Epoch 3/5:  31%|███       | 686/2208 [04:07<09:24,  2.70it/s][A
Epoch 3/5:  31%|███       | 687/2208 [04:07<09:09,  2.77it/s][A
Epoch 3/5:  31%|███       | 688/2208 [04:08<08:59,  2.82it/s][A
Epoch 3/5:  31%|███       | 689/2208 [04:08<08:53,  2.85it/s][A
Epoch 3/5:  31%|███▏      | 690/2208 [04:08<08:48,  2.87it/s][A
Epoch 3/5:  31%|███▏      | 691/2208 [04:09<08:56,  2.83it/s][A
Epoch 3/5:  31%|███▏    

Batch 700: Training accuracy = 0.8359, F1 = 0.8255, Precision = 0.8307, Recall = 0.8359



Epoch 3/5:  32%|███▏      | 702/2208 [04:13<09:11,  2.73it/s][A
Epoch 3/5:  32%|███▏      | 703/2208 [04:13<09:01,  2.78it/s][A
Epoch 3/5:  32%|███▏      | 704/2208 [04:13<09:08,  2.74it/s][A
Epoch 3/5:  32%|███▏      | 705/2208 [04:14<08:59,  2.79it/s][A
Epoch 3/5:  32%|███▏      | 706/2208 [04:14<08:52,  2.82it/s][A
Epoch 3/5:  32%|███▏      | 707/2208 [04:14<08:48,  2.84it/s][A
Epoch 3/5:  32%|███▏      | 708/2208 [04:15<08:52,  2.82it/s][A
Epoch 3/5:  32%|███▏      | 709/2208 [04:15<08:49,  2.83it/s][A
Epoch 3/5:  32%|███▏      | 710/2208 [04:15<08:53,  2.81it/s][A
Epoch 3/5:  32%|███▏      | 711/2208 [04:16<08:44,  2.85it/s][A
Epoch 3/5:  32%|███▏      | 712/2208 [04:16<09:01,  2.76it/s][A
Epoch 3/5:  32%|███▏      | 713/2208 [04:17<08:52,  2.81it/s][A
Epoch 3/5:  32%|███▏      | 714/2208 [04:17<08:44,  2.85it/s][A
Epoch 3/5:  32%|███▏      | 715/2208 [04:17<08:39,  2.88it/s][A
Epoch 3/5:  32%|███▏      | 716/2208 [04:18<08:53,  2.80it/s][A
Epoch 3/5:  32%|███▏    

Batch 725: Training accuracy = 0.9062, F1 = 0.8974, Precision = 0.8997, Recall = 0.9062



Epoch 3/5:  33%|███▎      | 727/2208 [04:22<08:45,  2.82it/s][A
Epoch 3/5:  33%|███▎      | 728/2208 [04:22<08:38,  2.86it/s][A
Epoch 3/5:  33%|███▎      | 729/2208 [04:22<08:39,  2.85it/s][A
Epoch 3/5:  33%|███▎      | 730/2208 [04:23<08:38,  2.85it/s][A
Epoch 3/5:  33%|███▎      | 731/2208 [04:23<08:44,  2.82it/s][A
Epoch 3/5:  33%|███▎      | 732/2208 [04:23<08:45,  2.81it/s][A
Epoch 3/5:  33%|███▎      | 733/2208 [04:24<09:05,  2.70it/s][A
Epoch 3/5:  33%|███▎      | 734/2208 [04:24<09:04,  2.71it/s][A
Epoch 3/5:  33%|███▎      | 735/2208 [04:24<09:04,  2.71it/s][A
Epoch 3/5:  33%|███▎      | 736/2208 [04:25<09:06,  2.69it/s][A
Epoch 3/5:  33%|███▎      | 737/2208 [04:25<08:57,  2.74it/s][A
Epoch 3/5:  33%|███▎      | 738/2208 [04:26<09:01,  2.72it/s][A
Epoch 3/5:  33%|███▎      | 739/2208 [04:26<08:54,  2.75it/s][A
Epoch 3/5:  34%|███▎      | 740/2208 [04:26<08:55,  2.74it/s][A
Epoch 3/5:  34%|███▎      | 741/2208 [04:27<08:57,  2.73it/s][A
Epoch 3/5:  34%|███▎    

Batch 750: Training accuracy = 0.8125, F1 = 0.7954, Precision = 0.8038, Recall = 0.8125



Epoch 3/5:  34%|███▍      | 752/2208 [04:31<08:48,  2.75it/s][A
Epoch 3/5:  34%|███▍      | 753/2208 [04:31<08:50,  2.74it/s][A
Epoch 3/5:  34%|███▍      | 754/2208 [04:31<08:51,  2.74it/s][A
Epoch 3/5:  34%|███▍      | 755/2208 [04:32<08:43,  2.77it/s][A
Epoch 3/5:  34%|███▍      | 756/2208 [04:32<08:46,  2.76it/s][A
Epoch 3/5:  34%|███▍      | 757/2208 [04:32<08:41,  2.78it/s][A
Epoch 3/5:  34%|███▍      | 758/2208 [04:33<08:31,  2.83it/s][A
Epoch 3/5:  34%|███▍      | 759/2208 [04:33<08:27,  2.85it/s][A
Epoch 3/5:  34%|███▍      | 760/2208 [04:33<08:23,  2.87it/s][A
Epoch 3/5:  34%|███▍      | 761/2208 [04:34<08:33,  2.82it/s][A
Epoch 3/5:  35%|███▍      | 762/2208 [04:34<08:34,  2.81it/s][A
Epoch 3/5:  35%|███▍      | 763/2208 [04:35<08:27,  2.85it/s][A
Epoch 3/5:  35%|███▍      | 764/2208 [04:35<08:24,  2.86it/s][A
Epoch 3/5:  35%|███▍      | 765/2208 [04:35<08:19,  2.89it/s][A
Epoch 3/5:  35%|███▍      | 766/2208 [04:36<08:26,  2.85it/s][A
Epoch 3/5:  35%|███▍    

Batch 775: Training accuracy = 0.8516, F1 = 0.8326, Precision = 0.8288, Recall = 0.8516



Epoch 3/5:  35%|███▌      | 777/2208 [04:40<08:34,  2.78it/s][A
Epoch 3/5:  35%|███▌      | 778/2208 [04:40<08:30,  2.80it/s][A
Epoch 3/5:  35%|███▌      | 779/2208 [04:40<08:31,  2.79it/s][A
Epoch 3/5:  35%|███▌      | 780/2208 [04:41<08:26,  2.82it/s][A
Epoch 3/5:  35%|███▌      | 781/2208 [04:41<08:36,  2.76it/s][A
Epoch 3/5:  35%|███▌      | 782/2208 [04:41<09:01,  2.64it/s][A
Epoch 3/5:  35%|███▌      | 783/2208 [04:42<09:02,  2.63it/s][A
Epoch 3/5:  36%|███▌      | 784/2208 [04:42<08:44,  2.72it/s][A
Epoch 3/5:  36%|███▌      | 785/2208 [04:43<08:56,  2.65it/s][A
Epoch 3/5:  36%|███▌      | 786/2208 [04:43<08:40,  2.73it/s][A
Epoch 3/5:  36%|███▌      | 787/2208 [04:43<08:29,  2.79it/s][A
Epoch 3/5:  36%|███▌      | 788/2208 [04:44<08:22,  2.83it/s][A
Epoch 3/5:  36%|███▌      | 789/2208 [04:44<08:31,  2.77it/s][A
Epoch 3/5:  36%|███▌      | 790/2208 [04:44<08:24,  2.81it/s][A
Epoch 3/5:  36%|███▌      | 791/2208 [04:45<08:18,  2.84it/s][A
Epoch 3/5:  36%|███▌    

Batch 800: Training accuracy = 0.9141, F1 = 0.8959, Precision = 0.8874, Recall = 0.9141



Epoch 3/5:  36%|███▋      | 802/2208 [04:48<08:02,  2.91it/s][A
Epoch 3/5:  36%|███▋      | 803/2208 [04:49<08:01,  2.92it/s][A
Epoch 3/5:  36%|███▋      | 804/2208 [04:49<08:18,  2.82it/s][A
Epoch 3/5:  36%|███▋      | 805/2208 [04:49<08:13,  2.84it/s][A
Epoch 3/5:  37%|███▋      | 806/2208 [04:50<08:08,  2.87it/s][A
Epoch 3/5:  37%|███▋      | 807/2208 [04:50<08:07,  2.88it/s][A
Epoch 3/5:  37%|███▋      | 808/2208 [04:51<08:14,  2.83it/s][A
Epoch 3/5:  37%|███▋      | 809/2208 [04:51<08:24,  2.77it/s][A
Epoch 3/5:  37%|███▋      | 810/2208 [04:51<08:30,  2.74it/s][A
Epoch 3/5:  37%|███▋      | 811/2208 [04:52<08:33,  2.72it/s][A
Epoch 3/5:  37%|███▋      | 812/2208 [04:52<08:26,  2.76it/s][A
Epoch 3/5:  37%|███▋      | 813/2208 [04:52<08:24,  2.76it/s][A
Epoch 3/5:  37%|███▋      | 814/2208 [04:53<08:30,  2.73it/s][A
Epoch 3/5:  37%|███▋      | 815/2208 [04:53<08:23,  2.77it/s][A
Epoch 3/5:  37%|███▋      | 816/2208 [04:53<08:18,  2.79it/s][A
Epoch 3/5:  37%|███▋    

Batch 825: Training accuracy = 0.8359, F1 = 0.8240, Precision = 0.8297, Recall = 0.8359



Epoch 3/5:  37%|███▋      | 827/2208 [04:57<08:18,  2.77it/s][A
Epoch 3/5:  38%|███▊      | 828/2208 [04:58<08:11,  2.81it/s][A
Epoch 3/5:  38%|███▊      | 829/2208 [04:58<08:08,  2.82it/s][A
Epoch 3/5:  38%|███▊      | 830/2208 [04:58<08:03,  2.85it/s][A
Epoch 3/5:  38%|███▊      | 831/2208 [04:59<07:59,  2.87it/s][A
Epoch 3/5:  38%|███▊      | 832/2208 [04:59<07:56,  2.89it/s][A
Epoch 3/5:  38%|███▊      | 833/2208 [04:59<07:57,  2.88it/s][A
Epoch 3/5:  38%|███▊      | 834/2208 [05:00<08:05,  2.83it/s][A
Epoch 3/5:  38%|███▊      | 835/2208 [05:00<07:59,  2.86it/s][A
Epoch 3/5:  38%|███▊      | 836/2208 [05:00<07:54,  2.89it/s][A
Epoch 3/5:  38%|███▊      | 837/2208 [05:01<07:52,  2.90it/s][A
Epoch 3/5:  38%|███▊      | 838/2208 [05:01<07:54,  2.89it/s][A
Epoch 3/5:  38%|███▊      | 839/2208 [05:02<07:54,  2.88it/s][A
Epoch 3/5:  38%|███▊      | 840/2208 [05:02<08:11,  2.78it/s][A
Epoch 3/5:  38%|███▊      | 841/2208 [05:02<08:15,  2.76it/s][A
Epoch 3/5:  38%|███▊    

Batch 850: Training accuracy = 0.8047, F1 = 0.8130, Precision = 0.8320, Recall = 0.8047



Epoch 3/5:  39%|███▊      | 852/2208 [05:06<08:05,  2.79it/s][A
Epoch 3/5:  39%|███▊      | 853/2208 [05:07<08:03,  2.80it/s][A
Epoch 3/5:  39%|███▊      | 854/2208 [05:07<08:00,  2.82it/s][A
Epoch 3/5:  39%|███▊      | 855/2208 [05:07<07:53,  2.86it/s][A
Epoch 3/5:  39%|███▉      | 856/2208 [05:08<08:13,  2.74it/s][A
Epoch 3/5:  39%|███▉      | 857/2208 [05:08<08:09,  2.76it/s][A
Epoch 3/5:  39%|███▉      | 858/2208 [05:08<08:17,  2.71it/s][A
Epoch 3/5:  39%|███▉      | 859/2208 [05:09<08:22,  2.69it/s][A
Epoch 3/5:  39%|███▉      | 860/2208 [05:09<08:14,  2.73it/s][A
Epoch 3/5:  39%|███▉      | 861/2208 [05:10<08:15,  2.72it/s][A
Epoch 3/5:  39%|███▉      | 862/2208 [05:10<08:08,  2.76it/s][A
Epoch 3/5:  39%|███▉      | 863/2208 [05:10<07:58,  2.81it/s][A
Epoch 3/5:  39%|███▉      | 864/2208 [05:11<08:03,  2.78it/s][A
Epoch 3/5:  39%|███▉      | 865/2208 [05:11<07:57,  2.81it/s][A
Epoch 3/5:  39%|███▉      | 866/2208 [05:11<08:04,  2.77it/s][A
Epoch 3/5:  39%|███▉    

Batch 875: Training accuracy = 0.8281, F1 = 0.8130, Precision = 0.8164, Recall = 0.8281



Epoch 3/5:  40%|███▉      | 877/2208 [05:15<07:39,  2.90it/s][A
Epoch 3/5:  40%|███▉      | 878/2208 [05:16<07:37,  2.91it/s][A
Epoch 3/5:  40%|███▉      | 879/2208 [05:16<07:47,  2.84it/s][A
Epoch 3/5:  40%|███▉      | 880/2208 [05:16<07:41,  2.88it/s][A
Epoch 3/5:  40%|███▉      | 881/2208 [05:17<07:45,  2.85it/s][A
Epoch 3/5:  40%|███▉      | 882/2208 [05:17<07:51,  2.81it/s][A
Epoch 3/5:  40%|███▉      | 883/2208 [05:17<07:43,  2.86it/s][A
Epoch 3/5:  40%|████      | 884/2208 [05:18<07:54,  2.79it/s][A
Epoch 3/5:  40%|████      | 885/2208 [05:18<08:01,  2.75it/s][A
Epoch 3/5:  40%|████      | 886/2208 [05:18<08:03,  2.73it/s][A
Epoch 3/5:  40%|████      | 887/2208 [05:19<07:59,  2.76it/s][A
Epoch 3/5:  40%|████      | 888/2208 [05:19<08:10,  2.69it/s][A
Epoch 3/5:  40%|████      | 889/2208 [05:20<08:02,  2.73it/s][A
Epoch 3/5:  40%|████      | 890/2208 [05:20<08:12,  2.67it/s][A
Epoch 3/5:  40%|████      | 891/2208 [05:20<08:08,  2.70it/s][A
Epoch 3/5:  40%|████    

Batch 900: Training accuracy = 0.8516, F1 = 0.8432, Precision = 0.8557, Recall = 0.8516



Epoch 3/5:  41%|████      | 902/2208 [05:24<07:48,  2.79it/s][A
Epoch 3/5:  41%|████      | 903/2208 [05:25<07:58,  2.73it/s][A
Epoch 3/5:  41%|████      | 904/2208 [05:25<07:50,  2.77it/s][A
Epoch 3/5:  41%|████      | 905/2208 [05:25<07:44,  2.81it/s][A
Epoch 3/5:  41%|████      | 906/2208 [05:26<07:37,  2.85it/s][A
Epoch 3/5:  41%|████      | 907/2208 [05:26<07:43,  2.81it/s][A
Epoch 3/5:  41%|████      | 908/2208 [05:26<07:47,  2.78it/s][A
Epoch 3/5:  41%|████      | 909/2208 [05:27<07:47,  2.78it/s][A
Epoch 3/5:  41%|████      | 910/2208 [05:27<07:52,  2.75it/s][A
Epoch 3/5:  41%|████▏     | 911/2208 [05:28<07:47,  2.78it/s][A
Epoch 3/5:  41%|████▏     | 912/2208 [05:28<07:39,  2.82it/s][A
Epoch 3/5:  41%|████▏     | 913/2208 [05:28<07:33,  2.86it/s][A
Epoch 3/5:  41%|████▏     | 914/2208 [05:29<07:32,  2.86it/s][A
Epoch 3/5:  41%|████▏     | 915/2208 [05:29<07:31,  2.86it/s][A
Epoch 3/5:  41%|████▏     | 916/2208 [05:29<07:31,  2.86it/s][A
Epoch 3/5:  42%|████▏   

Batch 925: Training accuracy = 0.8828, F1 = 0.8724, Precision = 0.8750, Recall = 0.8828



Epoch 3/5:  42%|████▏     | 927/2208 [05:33<07:30,  2.84it/s][A
Epoch 3/5:  42%|████▏     | 928/2208 [05:33<07:26,  2.86it/s][A
Epoch 3/5:  42%|████▏     | 929/2208 [05:34<07:23,  2.89it/s][A
Epoch 3/5:  42%|████▏     | 930/2208 [05:34<07:31,  2.83it/s][A
Epoch 3/5:  42%|████▏     | 931/2208 [05:35<07:39,  2.78it/s][A
Epoch 3/5:  42%|████▏     | 932/2208 [05:35<07:44,  2.74it/s][A
Epoch 3/5:  42%|████▏     | 933/2208 [05:35<07:49,  2.72it/s][A
Epoch 3/5:  42%|████▏     | 934/2208 [05:36<07:48,  2.72it/s][A
Epoch 3/5:  42%|████▏     | 935/2208 [05:36<07:37,  2.79it/s][A
Epoch 3/5:  42%|████▏     | 936/2208 [05:36<07:39,  2.77it/s][A
Epoch 3/5:  42%|████▏     | 937/2208 [05:37<07:41,  2.75it/s][A
Epoch 3/5:  42%|████▏     | 938/2208 [05:37<07:43,  2.74it/s][A
Epoch 3/5:  43%|████▎     | 939/2208 [05:37<07:35,  2.78it/s][A
Epoch 3/5:  43%|████▎     | 940/2208 [05:38<07:31,  2.81it/s][A
Epoch 3/5:  43%|████▎     | 941/2208 [05:38<07:42,  2.74it/s][A
Epoch 3/5:  43%|████▎   

Batch 950: Training accuracy = 0.8125, F1 = 0.8049, Precision = 0.8203, Recall = 0.8125



Epoch 3/5:  43%|████▎     | 952/2208 [05:42<07:26,  2.81it/s][A
Epoch 3/5:  43%|████▎     | 953/2208 [05:42<07:20,  2.85it/s][A
Epoch 3/5:  43%|████▎     | 954/2208 [05:43<07:19,  2.85it/s][A
Epoch 3/5:  43%|████▎     | 955/2208 [05:43<07:18,  2.86it/s][A
Epoch 3/5:  43%|████▎     | 956/2208 [05:44<07:15,  2.87it/s][A
Epoch 3/5:  43%|████▎     | 957/2208 [05:44<07:16,  2.86it/s][A
Epoch 3/5:  43%|████▎     | 958/2208 [05:44<07:24,  2.81it/s][A
Epoch 3/5:  43%|████▎     | 959/2208 [05:45<07:24,  2.81it/s][A
Epoch 3/5:  43%|████▎     | 960/2208 [05:45<07:30,  2.77it/s][A
Epoch 3/5:  44%|████▎     | 961/2208 [05:45<07:20,  2.83it/s][A
Epoch 3/5:  44%|████▎     | 962/2208 [05:46<07:18,  2.84it/s][A
Epoch 3/5:  44%|████▎     | 963/2208 [05:46<07:22,  2.82it/s][A
Epoch 3/5:  44%|████▎     | 964/2208 [05:46<07:29,  2.77it/s][A
Epoch 3/5:  44%|████▎     | 965/2208 [05:47<07:20,  2.82it/s][A
Epoch 3/5:  44%|████▍     | 966/2208 [05:47<07:24,  2.79it/s][A
Epoch 3/5:  44%|████▍   

Batch 975: Training accuracy = 0.8672, F1 = 0.8559, Precision = 0.8633, Recall = 0.8672



Epoch 3/5:  44%|████▍     | 977/2208 [05:51<07:07,  2.88it/s][A
Epoch 3/5:  44%|████▍     | 978/2208 [05:51<07:09,  2.86it/s][A
Epoch 3/5:  44%|████▍     | 979/2208 [05:52<07:15,  2.82it/s][A
Epoch 3/5:  44%|████▍     | 980/2208 [05:52<07:23,  2.77it/s][A
Epoch 3/5:  44%|████▍     | 981/2208 [05:52<07:18,  2.80it/s][A
Epoch 3/5:  44%|████▍     | 982/2208 [05:53<07:23,  2.76it/s][A
Epoch 3/5:  45%|████▍     | 983/2208 [05:53<07:25,  2.75it/s][A
Epoch 3/5:  45%|████▍     | 984/2208 [05:54<07:21,  2.77it/s][A
Epoch 3/5:  45%|████▍     | 985/2208 [05:54<07:21,  2.77it/s][A
Epoch 3/5:  45%|████▍     | 986/2208 [05:54<07:14,  2.82it/s][A
Epoch 3/5:  45%|████▍     | 987/2208 [05:55<07:19,  2.78it/s][A
Epoch 3/5:  45%|████▍     | 988/2208 [05:55<07:31,  2.70it/s][A
Epoch 3/5:  45%|████▍     | 989/2208 [05:55<07:35,  2.67it/s][A
Epoch 3/5:  45%|████▍     | 990/2208 [05:56<07:33,  2.69it/s][A
Epoch 3/5:  45%|████▍     | 991/2208 [05:56<07:33,  2.69it/s][A
Epoch 3/5:  45%|████▍   

Batch 1000: Training accuracy = 0.8516, F1 = 0.8427, Precision = 0.8620, Recall = 0.8516



Epoch 3/5:  45%|████▌     | 1002/2208 [06:00<07:17,  2.75it/s][A
Epoch 3/5:  45%|████▌     | 1003/2208 [06:00<07:08,  2.81it/s][A
Epoch 3/5:  45%|████▌     | 1004/2208 [06:01<07:09,  2.80it/s][A
Epoch 3/5:  46%|████▌     | 1005/2208 [06:01<07:16,  2.75it/s][A
Epoch 3/5:  46%|████▌     | 1006/2208 [06:01<07:14,  2.77it/s][A
Epoch 3/5:  46%|████▌     | 1007/2208 [06:02<07:20,  2.73it/s][A
Epoch 3/5:  46%|████▌     | 1008/2208 [06:02<07:12,  2.77it/s][A
Epoch 3/5:  46%|████▌     | 1009/2208 [06:03<07:06,  2.81it/s][A
Epoch 3/5:  46%|████▌     | 1010/2208 [06:03<07:00,  2.85it/s][A
Epoch 3/5:  46%|████▌     | 1011/2208 [06:03<06:59,  2.85it/s][A
Epoch 3/5:  46%|████▌     | 1012/2208 [06:04<06:56,  2.87it/s][A
Epoch 3/5:  46%|████▌     | 1013/2208 [06:04<07:01,  2.83it/s][A
Epoch 3/5:  46%|████▌     | 1014/2208 [06:04<06:56,  2.87it/s][A
Epoch 3/5:  46%|████▌     | 1015/2208 [06:05<06:55,  2.87it/s][A
Epoch 3/5:  46%|████▌     | 1016/2208 [06:05<07:01,  2.83it/s][A
Epoch 3/5

Batch 1025: Training accuracy = 0.8594, F1 = 0.8479, Precision = 0.8490, Recall = 0.8594



Epoch 3/5:  47%|████▋     | 1027/2208 [06:09<07:02,  2.80it/s][A
Epoch 3/5:  47%|████▋     | 1028/2208 [06:09<07:00,  2.81it/s][A
Epoch 3/5:  47%|████▋     | 1029/2208 [06:10<07:06,  2.76it/s][A
Epoch 3/5:  47%|████▋     | 1030/2208 [06:10<07:00,  2.80it/s][A
Epoch 3/5:  47%|████▋     | 1031/2208 [06:10<06:56,  2.83it/s][A
Epoch 3/5:  47%|████▋     | 1032/2208 [06:11<06:56,  2.83it/s][A
Epoch 3/5:  47%|████▋     | 1033/2208 [06:11<07:01,  2.79it/s][A
Epoch 3/5:  47%|████▋     | 1034/2208 [06:11<07:07,  2.75it/s][A
Epoch 3/5:  47%|████▋     | 1035/2208 [06:12<06:57,  2.81it/s][A
Epoch 3/5:  47%|████▋     | 1036/2208 [06:12<06:52,  2.84it/s][A
Epoch 3/5:  47%|████▋     | 1037/2208 [06:12<06:48,  2.87it/s][A
Epoch 3/5:  47%|████▋     | 1038/2208 [06:13<06:55,  2.82it/s][A
Epoch 3/5:  47%|████▋     | 1039/2208 [06:13<06:52,  2.83it/s][A
Epoch 3/5:  47%|████▋     | 1040/2208 [06:14<06:57,  2.80it/s][A
Epoch 3/5:  47%|████▋     | 1041/2208 [06:14<06:51,  2.83it/s][A
Epoch 3/5

Batch 1050: Training accuracy = 0.8516, F1 = 0.8429, Precision = 0.8486, Recall = 0.8516



Epoch 3/5:  48%|████▊     | 1052/2208 [06:18<06:49,  2.83it/s][A
Epoch 3/5:  48%|████▊     | 1053/2208 [06:18<06:43,  2.86it/s][A
Epoch 3/5:  48%|████▊     | 1054/2208 [06:19<06:41,  2.88it/s][A
Epoch 3/5:  48%|████▊     | 1055/2208 [06:19<06:38,  2.90it/s][A
Epoch 3/5:  48%|████▊     | 1056/2208 [06:19<06:44,  2.85it/s][A
Epoch 3/5:  48%|████▊     | 1057/2208 [06:20<06:41,  2.86it/s][A
Epoch 3/5:  48%|████▊     | 1058/2208 [06:20<06:50,  2.80it/s][A
Epoch 3/5:  48%|████▊     | 1059/2208 [06:20<06:55,  2.76it/s][A
Epoch 3/5:  48%|████▊     | 1060/2208 [06:21<07:03,  2.71it/s][A
Epoch 3/5:  48%|████▊     | 1061/2208 [06:21<07:03,  2.71it/s][A
Epoch 3/5:  48%|████▊     | 1062/2208 [06:22<07:03,  2.71it/s][A
Epoch 3/5:  48%|████▊     | 1063/2208 [06:22<07:02,  2.71it/s][A
Epoch 3/5:  48%|████▊     | 1064/2208 [06:22<07:02,  2.71it/s][A
Epoch 3/5:  48%|████▊     | 1065/2208 [06:23<06:59,  2.72it/s][A
Epoch 3/5:  48%|████▊     | 1066/2208 [06:23<06:52,  2.77it/s][A
Epoch 3/5

Batch 1075: Training accuracy = 0.8594, F1 = 0.8578, Precision = 0.8685, Recall = 0.8594



Epoch 3/5:  49%|████▉     | 1077/2208 [06:27<06:45,  2.79it/s][A
Epoch 3/5:  49%|████▉     | 1078/2208 [06:27<06:39,  2.83it/s][A
Epoch 3/5:  49%|████▉     | 1079/2208 [06:28<06:44,  2.79it/s][A
Epoch 3/5:  49%|████▉     | 1080/2208 [06:28<06:43,  2.80it/s][A
Epoch 3/5:  49%|████▉     | 1081/2208 [06:28<06:38,  2.83it/s][A
Epoch 3/5:  49%|████▉     | 1082/2208 [06:29<06:37,  2.84it/s][A
Epoch 3/5:  49%|████▉     | 1083/2208 [06:29<06:45,  2.78it/s][A
Epoch 3/5:  49%|████▉     | 1084/2208 [06:29<06:41,  2.80it/s][A
Epoch 3/5:  49%|████▉     | 1085/2208 [06:30<06:35,  2.84it/s][A
Epoch 3/5:  49%|████▉     | 1086/2208 [06:30<06:32,  2.86it/s][A
Epoch 3/5:  49%|████▉     | 1087/2208 [06:30<06:31,  2.86it/s][A
Epoch 3/5:  49%|████▉     | 1088/2208 [06:31<06:29,  2.87it/s][A
Epoch 3/5:  49%|████▉     | 1089/2208 [06:31<06:37,  2.82it/s][A
Epoch 3/5:  49%|████▉     | 1090/2208 [06:31<06:39,  2.80it/s][A
Epoch 3/5:  49%|████▉     | 1091/2208 [06:32<06:33,  2.84it/s][A
Epoch 3/5

Batch 1100: Training accuracy = 0.8594, F1 = 0.8552, Precision = 0.8646, Recall = 0.8594



Epoch 3/5:  50%|████▉     | 1102/2208 [06:36<06:35,  2.80it/s][A
Epoch 3/5:  50%|████▉     | 1103/2208 [06:36<06:31,  2.82it/s][A
Epoch 3/5:  50%|█████     | 1104/2208 [06:36<06:43,  2.73it/s][A
Epoch 3/5:  50%|█████     | 1105/2208 [06:37<06:47,  2.71it/s][A
Epoch 3/5:  50%|█████     | 1106/2208 [06:37<06:53,  2.66it/s][A
Epoch 3/5:  50%|█████     | 1107/2208 [06:38<06:44,  2.72it/s][A
Epoch 3/5:  50%|█████     | 1108/2208 [06:38<06:34,  2.79it/s][A
Epoch 3/5:  50%|█████     | 1109/2208 [06:38<06:34,  2.79it/s][A
Epoch 3/5:  50%|█████     | 1110/2208 [06:39<06:42,  2.72it/s][A
Epoch 3/5:  50%|█████     | 1111/2208 [06:39<06:33,  2.79it/s][A
Epoch 3/5:  50%|█████     | 1112/2208 [06:39<06:32,  2.80it/s][A
Epoch 3/5:  50%|█████     | 1113/2208 [06:40<06:32,  2.79it/s][A
Epoch 3/5:  50%|█████     | 1114/2208 [06:40<06:38,  2.74it/s][A
Epoch 3/5:  50%|█████     | 1115/2208 [06:40<06:43,  2.71it/s][A
Epoch 3/5:  51%|█████     | 1116/2208 [06:41<06:48,  2.67it/s][A
Epoch 3/5

Batch 1125: Training accuracy = 0.8828, F1 = 0.8745, Precision = 0.8887, Recall = 0.8828



Epoch 3/5:  51%|█████     | 1127/2208 [06:45<06:24,  2.81it/s][A
Epoch 3/5:  51%|█████     | 1128/2208 [06:45<06:19,  2.85it/s][A
Epoch 3/5:  51%|█████     | 1129/2208 [06:45<06:31,  2.76it/s][A
Epoch 3/5:  51%|█████     | 1130/2208 [06:46<06:31,  2.75it/s][A
Epoch 3/5:  51%|█████     | 1131/2208 [06:46<06:23,  2.81it/s][A
Epoch 3/5:  51%|█████▏    | 1132/2208 [06:47<06:17,  2.85it/s][A
Epoch 3/5:  51%|█████▏    | 1133/2208 [06:47<06:13,  2.88it/s][A
Epoch 3/5:  51%|█████▏    | 1134/2208 [06:47<06:22,  2.81it/s][A
Epoch 3/5:  51%|█████▏    | 1135/2208 [06:48<06:33,  2.73it/s][A
Epoch 3/5:  51%|█████▏    | 1136/2208 [06:48<06:26,  2.77it/s][A
Epoch 3/5:  51%|█████▏    | 1137/2208 [06:48<06:30,  2.74it/s][A
Epoch 3/5:  52%|█████▏    | 1138/2208 [06:49<06:36,  2.70it/s][A
Epoch 3/5:  52%|█████▏    | 1139/2208 [06:49<06:31,  2.73it/s][A
Epoch 3/5:  52%|█████▏    | 1140/2208 [06:49<06:23,  2.78it/s][A
Epoch 3/5:  52%|█████▏    | 1141/2208 [06:50<06:19,  2.81it/s][A
Epoch 3/5

Batch 1150: Training accuracy = 0.8594, F1 = 0.8451, Precision = 0.8490, Recall = 0.8594



Epoch 3/5:  52%|█████▏    | 1152/2208 [06:54<06:15,  2.81it/s][A
Epoch 3/5:  52%|█████▏    | 1153/2208 [06:54<06:22,  2.76it/s][A
Epoch 3/5:  52%|█████▏    | 1154/2208 [06:55<06:23,  2.75it/s][A
Epoch 3/5:  52%|█████▏    | 1155/2208 [06:55<06:18,  2.78it/s][A
Epoch 3/5:  52%|█████▏    | 1156/2208 [06:55<06:24,  2.74it/s][A
Epoch 3/5:  52%|█████▏    | 1157/2208 [06:56<06:16,  2.79it/s][A
Epoch 3/5:  52%|█████▏    | 1158/2208 [06:56<06:11,  2.82it/s][A
Epoch 3/5:  52%|█████▏    | 1159/2208 [06:56<06:18,  2.77it/s][A
Epoch 3/5:  53%|█████▎    | 1160/2208 [06:57<06:12,  2.82it/s][A
Epoch 3/5:  53%|█████▎    | 1161/2208 [06:57<06:15,  2.79it/s][A
Epoch 3/5:  53%|█████▎    | 1162/2208 [06:57<06:09,  2.83it/s][A
Epoch 3/5:  53%|█████▎    | 1163/2208 [06:58<06:16,  2.77it/s][A
Epoch 3/5:  53%|█████▎    | 1164/2208 [06:58<06:12,  2.80it/s][A
Epoch 3/5:  53%|█████▎    | 1165/2208 [06:59<06:16,  2.77it/s][A
Epoch 3/5:  53%|█████▎    | 1166/2208 [06:59<06:17,  2.76it/s][A
Epoch 3/5

Batch 1175: Training accuracy = 0.8516, F1 = 0.8385, Precision = 0.8424, Recall = 0.8516



Epoch 3/5:  53%|█████▎    | 1177/2208 [07:03<05:57,  2.89it/s][A
Epoch 3/5:  53%|█████▎    | 1178/2208 [07:03<05:58,  2.87it/s][A
Epoch 3/5:  53%|█████▎    | 1179/2208 [07:03<05:56,  2.89it/s][A
Epoch 3/5:  53%|█████▎    | 1180/2208 [07:04<06:09,  2.78it/s][A
Epoch 3/5:  53%|█████▎    | 1181/2208 [07:04<06:05,  2.81it/s][A
Epoch 3/5:  54%|█████▎    | 1182/2208 [07:05<05:59,  2.85it/s][A
Epoch 3/5:  54%|█████▎    | 1183/2208 [07:05<05:59,  2.85it/s][A
Epoch 3/5:  54%|█████▎    | 1184/2208 [07:05<05:56,  2.87it/s][A
Epoch 3/5:  54%|█████▎    | 1185/2208 [07:06<06:00,  2.84it/s][A
Epoch 3/5:  54%|█████▎    | 1186/2208 [07:06<06:03,  2.81it/s][A
Epoch 3/5:  54%|█████▍    | 1187/2208 [07:06<06:09,  2.77it/s][A
Epoch 3/5:  54%|█████▍    | 1188/2208 [07:07<06:01,  2.82it/s][A
Epoch 3/5:  54%|█████▍    | 1189/2208 [07:07<06:07,  2.77it/s][A
Epoch 3/5:  54%|█████▍    | 1190/2208 [07:07<06:05,  2.78it/s][A
Epoch 3/5:  54%|█████▍    | 1191/2208 [07:08<06:09,  2.76it/s][A
Epoch 3/5

Batch 1200: Training accuracy = 0.8047, F1 = 0.7989, Precision = 0.8158, Recall = 0.8047



Epoch 3/5:  54%|█████▍    | 1202/2208 [07:12<05:58,  2.81it/s][A
Epoch 3/5:  54%|█████▍    | 1203/2208 [07:12<06:08,  2.73it/s][A
Epoch 3/5:  55%|█████▍    | 1204/2208 [07:12<06:09,  2.71it/s][A
Epoch 3/5:  55%|█████▍    | 1205/2208 [07:13<06:09,  2.72it/s][A
Epoch 3/5:  55%|█████▍    | 1206/2208 [07:13<06:00,  2.78it/s][A
Epoch 3/5:  55%|█████▍    | 1207/2208 [07:13<05:54,  2.82it/s][A
Epoch 3/5:  55%|█████▍    | 1208/2208 [07:14<05:50,  2.85it/s][A
Epoch 3/5:  55%|█████▍    | 1209/2208 [07:14<05:47,  2.88it/s][A
Epoch 3/5:  55%|█████▍    | 1210/2208 [07:14<05:48,  2.87it/s][A
Epoch 3/5:  55%|█████▍    | 1211/2208 [07:15<05:46,  2.88it/s][A
Epoch 3/5:  55%|█████▍    | 1212/2208 [07:15<05:49,  2.85it/s][A
Epoch 3/5:  55%|█████▍    | 1213/2208 [07:16<05:54,  2.81it/s][A
Epoch 3/5:  55%|█████▍    | 1214/2208 [07:16<05:49,  2.85it/s][A
Epoch 3/5:  55%|█████▌    | 1215/2208 [07:16<05:47,  2.86it/s][A
Epoch 3/5:  55%|█████▌    | 1216/2208 [07:17<05:44,  2.88it/s][A
Epoch 3/5

Batch 1225: Training accuracy = 0.8828, F1 = 0.8802, Precision = 0.8906, Recall = 0.8828



Epoch 3/5:  56%|█████▌    | 1227/2208 [07:21<05:58,  2.74it/s][A
Epoch 3/5:  56%|█████▌    | 1228/2208 [07:21<05:59,  2.72it/s][A
Epoch 3/5:  56%|█████▌    | 1229/2208 [07:21<05:57,  2.74it/s][A
Epoch 3/5:  56%|█████▌    | 1230/2208 [07:22<06:02,  2.70it/s][A
Epoch 3/5:  56%|█████▌    | 1231/2208 [07:22<05:53,  2.76it/s][A
Epoch 3/5:  56%|█████▌    | 1232/2208 [07:22<05:55,  2.75it/s][A
Epoch 3/5:  56%|█████▌    | 1233/2208 [07:23<05:58,  2.72it/s][A
Epoch 3/5:  56%|█████▌    | 1234/2208 [07:23<05:56,  2.73it/s][A
Epoch 3/5:  56%|█████▌    | 1235/2208 [07:23<05:58,  2.71it/s][A
Epoch 3/5:  56%|█████▌    | 1236/2208 [07:24<06:06,  2.66it/s][A
Epoch 3/5:  56%|█████▌    | 1237/2208 [07:24<05:55,  2.73it/s][A
Epoch 3/5:  56%|█████▌    | 1238/2208 [07:25<05:51,  2.76it/s][A
Epoch 3/5:  56%|█████▌    | 1239/2208 [07:25<05:48,  2.78it/s][A
Epoch 3/5:  56%|█████▌    | 1240/2208 [07:25<05:50,  2.76it/s][A
Epoch 3/5:  56%|█████▌    | 1241/2208 [07:26<05:46,  2.79it/s][A
Epoch 3/5

Batch 1250: Training accuracy = 0.8984, F1 = 0.8966, Precision = 0.9036, Recall = 0.8984



Epoch 3/5:  57%|█████▋    | 1252/2208 [07:30<05:38,  2.83it/s][A
Epoch 3/5:  57%|█████▋    | 1253/2208 [07:30<05:43,  2.78it/s][A
Epoch 3/5:  57%|█████▋    | 1254/2208 [07:30<05:43,  2.78it/s][A
Epoch 3/5:  57%|█████▋    | 1255/2208 [07:31<05:46,  2.75it/s][A
Epoch 3/5:  57%|█████▋    | 1256/2208 [07:31<05:38,  2.81it/s][A
Epoch 3/5:  57%|█████▋    | 1257/2208 [07:31<05:43,  2.77it/s][A
Epoch 3/5:  57%|█████▋    | 1258/2208 [07:32<05:39,  2.80it/s][A
Epoch 3/5:  57%|█████▋    | 1259/2208 [07:32<05:39,  2.80it/s][A
Epoch 3/5:  57%|█████▋    | 1260/2208 [07:32<05:36,  2.82it/s][A
Epoch 3/5:  57%|█████▋    | 1261/2208 [07:33<05:32,  2.85it/s][A
Epoch 3/5:  57%|█████▋    | 1262/2208 [07:33<05:38,  2.80it/s][A
Epoch 3/5:  57%|█████▋    | 1263/2208 [07:34<05:39,  2.78it/s][A
Epoch 3/5:  57%|█████▋    | 1264/2208 [07:34<05:38,  2.79it/s][A
Epoch 3/5:  57%|█████▋    | 1265/2208 [07:34<05:38,  2.79it/s][A
Epoch 3/5:  57%|█████▋    | 1266/2208 [07:35<05:37,  2.79it/s][A
Epoch 3/5

Batch 1275: Training accuracy = 0.8906, F1 = 0.8849, Precision = 0.8893, Recall = 0.8906



Epoch 3/5:  58%|█████▊    | 1277/2208 [07:39<05:51,  2.64it/s][A
Epoch 3/5:  58%|█████▊    | 1278/2208 [07:39<05:45,  2.69it/s][A
Epoch 3/5:  58%|█████▊    | 1279/2208 [07:39<05:36,  2.76it/s][A
Epoch 3/5:  58%|█████▊    | 1280/2208 [07:40<05:33,  2.79it/s][A
Epoch 3/5:  58%|█████▊    | 1281/2208 [07:40<05:28,  2.82it/s][A
Epoch 3/5:  58%|█████▊    | 1282/2208 [07:40<05:23,  2.86it/s][A
Epoch 3/5:  58%|█████▊    | 1283/2208 [07:41<05:28,  2.82it/s][A
Epoch 3/5:  58%|█████▊    | 1284/2208 [07:41<05:24,  2.85it/s][A
Epoch 3/5:  58%|█████▊    | 1285/2208 [07:41<05:29,  2.80it/s][A
Epoch 3/5:  58%|█████▊    | 1286/2208 [07:42<05:23,  2.85it/s][A
Epoch 3/5:  58%|█████▊    | 1287/2208 [07:42<05:24,  2.84it/s][A
Epoch 3/5:  58%|█████▊    | 1288/2208 [07:42<05:20,  2.87it/s][A
Epoch 3/5:  58%|█████▊    | 1289/2208 [07:43<05:24,  2.83it/s][A
Epoch 3/5:  58%|█████▊    | 1290/2208 [07:43<05:27,  2.81it/s][A
Epoch 3/5:  58%|█████▊    | 1291/2208 [07:44<05:23,  2.83it/s][A
Epoch 3/5

Batch 1300: Training accuracy = 0.8594, F1 = 0.8560, Precision = 0.8757, Recall = 0.8594



Epoch 3/5:  59%|█████▉    | 1302/2208 [07:47<05:24,  2.80it/s][A
Epoch 3/5:  59%|█████▉    | 1303/2208 [07:48<05:18,  2.84it/s][A
Epoch 3/5:  59%|█████▉    | 1304/2208 [07:48<05:17,  2.85it/s][A
Epoch 3/5:  59%|█████▉    | 1305/2208 [07:48<05:14,  2.87it/s][A
Epoch 3/5:  59%|█████▉    | 1306/2208 [07:49<05:16,  2.85it/s][A
Epoch 3/5:  59%|█████▉    | 1307/2208 [07:49<05:16,  2.85it/s][A
Epoch 3/5:  59%|█████▉    | 1308/2208 [07:50<05:13,  2.87it/s][A
Epoch 3/5:  59%|█████▉    | 1309/2208 [07:50<05:15,  2.85it/s][A
Epoch 3/5:  59%|█████▉    | 1310/2208 [07:50<05:16,  2.84it/s][A
Epoch 3/5:  59%|█████▉    | 1311/2208 [07:51<05:15,  2.84it/s][A
Epoch 3/5:  59%|█████▉    | 1312/2208 [07:51<05:22,  2.78it/s][A
Epoch 3/5:  59%|█████▉    | 1313/2208 [07:51<05:18,  2.81it/s][A
Epoch 3/5:  60%|█████▉    | 1314/2208 [07:52<05:21,  2.78it/s][A
Epoch 3/5:  60%|█████▉    | 1315/2208 [07:52<05:24,  2.76it/s][A
Epoch 3/5:  60%|█████▉    | 1316/2208 [07:52<05:26,  2.73it/s][A
Epoch 3/5

Batch 1325: Training accuracy = 0.9297, F1 = 0.9206, Precision = 0.9232, Recall = 0.9297



Epoch 3/5:  60%|██████    | 1327/2208 [07:56<05:27,  2.69it/s][A
Epoch 3/5:  60%|██████    | 1328/2208 [07:57<05:21,  2.74it/s][A
Epoch 3/5:  60%|██████    | 1329/2208 [07:57<05:24,  2.71it/s][A
Epoch 3/5:  60%|██████    | 1330/2208 [07:58<05:31,  2.65it/s][A
Epoch 3/5:  60%|██████    | 1331/2208 [07:58<05:22,  2.72it/s][A
Epoch 3/5:  60%|██████    | 1332/2208 [07:58<05:22,  2.72it/s][A
Epoch 3/5:  60%|██████    | 1333/2208 [07:59<05:20,  2.73it/s][A
Epoch 3/5:  60%|██████    | 1334/2208 [07:59<05:23,  2.70it/s][A
Epoch 3/5:  60%|██████    | 1335/2208 [07:59<05:15,  2.77it/s][A
Epoch 3/5:  61%|██████    | 1336/2208 [08:00<05:11,  2.80it/s][A
Epoch 3/5:  61%|██████    | 1337/2208 [08:00<05:07,  2.83it/s][A
Epoch 3/5:  61%|██████    | 1338/2208 [08:00<05:03,  2.87it/s][A
Epoch 3/5:  61%|██████    | 1339/2208 [08:01<05:03,  2.87it/s][A
Epoch 3/5:  61%|██████    | 1340/2208 [08:01<05:02,  2.87it/s][A
Epoch 3/5:  61%|██████    | 1341/2208 [08:01<05:01,  2.87it/s][A
Epoch 3/5

Batch 1350: Training accuracy = 0.8438, F1 = 0.8332, Precision = 0.8416, Recall = 0.8438



Epoch 3/5:  61%|██████    | 1352/2208 [08:05<05:12,  2.74it/s][A
Epoch 3/5:  61%|██████▏   | 1353/2208 [08:06<05:05,  2.80it/s][A
Epoch 3/5:  61%|██████▏   | 1354/2208 [08:06<05:00,  2.84it/s][A
Epoch 3/5:  61%|██████▏   | 1355/2208 [08:06<05:04,  2.80it/s][A
Epoch 3/5:  61%|██████▏   | 1356/2208 [08:07<05:09,  2.76it/s][A
Epoch 3/5:  61%|██████▏   | 1357/2208 [08:07<05:05,  2.78it/s][A
Epoch 3/5:  62%|██████▏   | 1358/2208 [08:08<05:11,  2.73it/s][A
Epoch 3/5:  62%|██████▏   | 1359/2208 [08:08<05:06,  2.77it/s][A
Epoch 3/5:  62%|██████▏   | 1360/2208 [08:08<05:12,  2.71it/s][A
Epoch 3/5:  62%|██████▏   | 1361/2208 [08:09<05:05,  2.78it/s][A
Epoch 3/5:  62%|██████▏   | 1362/2208 [08:09<05:00,  2.82it/s][A
Epoch 3/5:  62%|██████▏   | 1363/2208 [08:09<04:57,  2.84it/s][A
Epoch 3/5:  62%|██████▏   | 1364/2208 [08:10<05:03,  2.78it/s][A
Epoch 3/5:  62%|██████▏   | 1365/2208 [08:10<05:05,  2.76it/s][A
Epoch 3/5:  62%|██████▏   | 1366/2208 [08:10<05:02,  2.78it/s][A
Epoch 3/5

Batch 1375: Training accuracy = 0.8516, F1 = 0.8406, Precision = 0.8542, Recall = 0.8516



Epoch 3/5:  62%|██████▏   | 1377/2208 [08:14<04:53,  2.83it/s][A
Epoch 3/5:  62%|██████▏   | 1378/2208 [08:15<04:50,  2.86it/s][A
Epoch 3/5:  62%|██████▏   | 1379/2208 [08:15<04:56,  2.79it/s][A
Epoch 3/5:  62%|██████▎   | 1380/2208 [08:15<05:00,  2.76it/s][A
Epoch 3/5:  63%|██████▎   | 1381/2208 [08:16<04:54,  2.81it/s][A
Epoch 3/5:  63%|██████▎   | 1382/2208 [08:16<04:50,  2.84it/s][A
Epoch 3/5:  63%|██████▎   | 1383/2208 [08:16<04:46,  2.88it/s][A
Epoch 3/5:  63%|██████▎   | 1384/2208 [08:17<04:52,  2.81it/s][A
Epoch 3/5:  63%|██████▎   | 1385/2208 [08:17<04:51,  2.82it/s][A
Epoch 3/5:  63%|██████▎   | 1386/2208 [08:18<04:53,  2.80it/s][A
Epoch 3/5:  63%|██████▎   | 1387/2208 [08:18<04:53,  2.80it/s][A
Epoch 3/5:  63%|██████▎   | 1388/2208 [08:18<04:53,  2.80it/s][A
Epoch 3/5:  63%|██████▎   | 1389/2208 [08:19<04:57,  2.75it/s][A
Epoch 3/5:  63%|██████▎   | 1390/2208 [08:19<05:00,  2.73it/s][A
Epoch 3/5:  63%|██████▎   | 1391/2208 [08:19<05:05,  2.68it/s][A
Epoch 3/5

Batch 1400: Training accuracy = 0.8906, F1 = 0.8927, Precision = 0.9049, Recall = 0.8906



Epoch 3/5:  63%|██████▎   | 1402/2208 [08:23<04:50,  2.78it/s][A
Epoch 3/5:  64%|██████▎   | 1403/2208 [08:24<04:45,  2.82it/s][A
Epoch 3/5:  64%|██████▎   | 1404/2208 [08:24<04:50,  2.77it/s][A
Epoch 3/5:  64%|██████▎   | 1405/2208 [08:25<04:54,  2.72it/s][A
Epoch 3/5:  64%|██████▎   | 1406/2208 [08:25<05:01,  2.66it/s][A
Epoch 3/5:  64%|██████▎   | 1407/2208 [08:25<04:53,  2.73it/s][A
Epoch 3/5:  64%|██████▍   | 1408/2208 [08:26<04:58,  2.68it/s][A
Epoch 3/5:  64%|██████▍   | 1409/2208 [08:26<04:50,  2.75it/s][A
Epoch 3/5:  64%|██████▍   | 1410/2208 [08:26<04:45,  2.79it/s][A
Epoch 3/5:  64%|██████▍   | 1411/2208 [08:27<04:48,  2.76it/s][A
Epoch 3/5:  64%|██████▍   | 1412/2208 [08:27<04:43,  2.81it/s][A
Epoch 3/5:  64%|██████▍   | 1413/2208 [08:27<04:41,  2.82it/s][A
Epoch 3/5:  64%|██████▍   | 1414/2208 [08:28<04:47,  2.77it/s][A
Epoch 3/5:  64%|██████▍   | 1415/2208 [08:28<04:44,  2.78it/s][A
Epoch 3/5:  64%|██████▍   | 1416/2208 [08:29<04:43,  2.79it/s][A
Epoch 3/5

Batch 1425: Training accuracy = 0.8438, F1 = 0.8263, Precision = 0.8158, Recall = 0.8438



Epoch 3/5:  65%|██████▍   | 1427/2208 [08:32<04:44,  2.74it/s][A
Epoch 3/5:  65%|██████▍   | 1428/2208 [08:33<04:37,  2.81it/s][A
Epoch 3/5:  65%|██████▍   | 1429/2208 [08:33<04:32,  2.86it/s][A
Epoch 3/5:  65%|██████▍   | 1430/2208 [08:34<04:39,  2.78it/s][A
Epoch 3/5:  65%|██████▍   | 1431/2208 [08:34<04:46,  2.72it/s][A
Epoch 3/5:  65%|██████▍   | 1432/2208 [08:34<04:40,  2.76it/s][A
Epoch 3/5:  65%|██████▍   | 1433/2208 [08:35<04:42,  2.74it/s][A
Epoch 3/5:  65%|██████▍   | 1434/2208 [08:35<04:39,  2.77it/s][A
Epoch 3/5:  65%|██████▍   | 1435/2208 [08:35<04:36,  2.79it/s][A
Epoch 3/5:  65%|██████▌   | 1436/2208 [08:36<04:35,  2.80it/s][A
Epoch 3/5:  65%|██████▌   | 1437/2208 [08:36<04:34,  2.81it/s][A
Epoch 3/5:  65%|██████▌   | 1438/2208 [08:36<04:33,  2.81it/s][A
Epoch 3/5:  65%|██████▌   | 1439/2208 [08:37<04:38,  2.76it/s][A
Epoch 3/5:  65%|██████▌   | 1440/2208 [08:37<04:34,  2.80it/s][A
Epoch 3/5:  65%|██████▌   | 1441/2208 [08:37<04:31,  2.82it/s][A
Epoch 3/5

Batch 1450: Training accuracy = 0.8203, F1 = 0.7992, Precision = 0.7971, Recall = 0.8203



Epoch 3/5:  66%|██████▌   | 1452/2208 [08:41<04:31,  2.79it/s][A
Epoch 3/5:  66%|██████▌   | 1453/2208 [08:42<04:37,  2.72it/s][A
Epoch 3/5:  66%|██████▌   | 1454/2208 [08:42<04:31,  2.78it/s][A
Epoch 3/5:  66%|██████▌   | 1455/2208 [08:43<04:28,  2.81it/s][A
Epoch 3/5:  66%|██████▌   | 1456/2208 [08:43<04:31,  2.77it/s][A
Epoch 3/5:  66%|██████▌   | 1457/2208 [08:43<04:28,  2.79it/s][A
Epoch 3/5:  66%|██████▌   | 1458/2208 [08:44<04:30,  2.77it/s][A
Epoch 3/5:  66%|██████▌   | 1459/2208 [08:44<04:29,  2.78it/s][A
Epoch 3/5:  66%|██████▌   | 1460/2208 [08:44<04:26,  2.81it/s][A
Epoch 3/5:  66%|██████▌   | 1461/2208 [08:45<04:29,  2.78it/s][A
Epoch 3/5:  66%|██████▌   | 1462/2208 [08:45<04:25,  2.81it/s][A
Epoch 3/5:  66%|██████▋   | 1463/2208 [08:45<04:24,  2.82it/s][A
Epoch 3/5:  66%|██████▋   | 1464/2208 [08:46<04:26,  2.80it/s][A
Epoch 3/5:  66%|██████▋   | 1465/2208 [08:46<04:24,  2.81it/s][A
Epoch 3/5:  66%|██████▋   | 1466/2208 [08:46<04:29,  2.76it/s][A
Epoch 3/5

Batch 1475: Training accuracy = 0.8047, F1 = 0.7982, Precision = 0.8216, Recall = 0.8047



Epoch 3/5:  67%|██████▋   | 1477/2208 [08:50<04:19,  2.81it/s][A
Epoch 3/5:  67%|██████▋   | 1478/2208 [08:51<04:24,  2.76it/s][A
Epoch 3/5:  67%|██████▋   | 1479/2208 [08:51<04:25,  2.75it/s][A
Epoch 3/5:  67%|██████▋   | 1480/2208 [08:52<04:26,  2.73it/s][A
Epoch 3/5:  67%|██████▋   | 1481/2208 [08:52<04:27,  2.71it/s][A
Epoch 3/5:  67%|██████▋   | 1482/2208 [08:52<04:37,  2.62it/s][A
Epoch 3/5:  67%|██████▋   | 1483/2208 [08:53<04:38,  2.61it/s][A
Epoch 3/5:  67%|██████▋   | 1484/2208 [08:53<04:29,  2.69it/s][A
Epoch 3/5:  67%|██████▋   | 1485/2208 [08:53<04:26,  2.71it/s][A
Epoch 3/5:  67%|██████▋   | 1486/2208 [08:54<04:25,  2.72it/s][A
Epoch 3/5:  67%|██████▋   | 1487/2208 [08:54<04:25,  2.71it/s][A
Epoch 3/5:  67%|██████▋   | 1488/2208 [08:55<04:23,  2.74it/s][A
Epoch 3/5:  67%|██████▋   | 1489/2208 [08:55<04:20,  2.76it/s][A
Epoch 3/5:  67%|██████▋   | 1490/2208 [08:55<04:20,  2.75it/s][A
Epoch 3/5:  68%|██████▊   | 1491/2208 [08:56<04:20,  2.75it/s][A
Epoch 3/5

Batch 1500: Training accuracy = 0.9141, F1 = 0.9083, Precision = 0.9076, Recall = 0.9141



Epoch 3/5:  68%|██████▊   | 1502/2208 [09:00<04:13,  2.78it/s][A
Epoch 3/5:  68%|██████▊   | 1503/2208 [09:00<04:18,  2.73it/s][A
Epoch 3/5:  68%|██████▊   | 1504/2208 [09:00<04:18,  2.72it/s][A
Epoch 3/5:  68%|██████▊   | 1505/2208 [09:01<04:14,  2.76it/s][A
Epoch 3/5:  68%|██████▊   | 1506/2208 [09:01<04:10,  2.80it/s][A
Epoch 3/5:  68%|██████▊   | 1507/2208 [09:01<04:07,  2.83it/s][A
Epoch 3/5:  68%|██████▊   | 1508/2208 [09:02<04:13,  2.76it/s][A
Epoch 3/5:  68%|██████▊   | 1509/2208 [09:02<04:09,  2.80it/s][A
Epoch 3/5:  68%|██████▊   | 1510/2208 [09:02<04:05,  2.84it/s][A
Epoch 3/5:  68%|██████▊   | 1511/2208 [09:03<04:06,  2.83it/s][A
Epoch 3/5:  68%|██████▊   | 1512/2208 [09:03<04:04,  2.85it/s][A
Epoch 3/5:  69%|██████▊   | 1513/2208 [09:03<04:01,  2.88it/s][A
Epoch 3/5:  69%|██████▊   | 1514/2208 [09:04<04:02,  2.86it/s][A
Epoch 3/5:  69%|██████▊   | 1515/2208 [09:04<04:08,  2.79it/s][A
Epoch 3/5:  69%|██████▊   | 1516/2208 [09:05<04:05,  2.82it/s][A
Epoch 3/5

Batch 1525: Training accuracy = 0.8750, F1 = 0.8602, Precision = 0.8633, Recall = 0.8750



Epoch 3/5:  69%|██████▉   | 1527/2208 [09:09<04:02,  2.81it/s][A
Epoch 3/5:  69%|██████▉   | 1528/2208 [09:09<03:58,  2.85it/s][A
Epoch 3/5:  69%|██████▉   | 1529/2208 [09:09<03:55,  2.88it/s][A
Epoch 3/5:  69%|██████▉   | 1530/2208 [09:10<03:56,  2.87it/s][A
Epoch 3/5:  69%|██████▉   | 1531/2208 [09:10<04:01,  2.80it/s][A
Epoch 3/5:  69%|██████▉   | 1532/2208 [09:10<03:58,  2.83it/s][A
Epoch 3/5:  69%|██████▉   | 1533/2208 [09:11<03:58,  2.83it/s][A
Epoch 3/5:  69%|██████▉   | 1534/2208 [09:11<03:57,  2.84it/s][A
Epoch 3/5:  70%|██████▉   | 1535/2208 [09:11<04:01,  2.79it/s][A
Epoch 3/5:  70%|██████▉   | 1536/2208 [09:12<04:04,  2.75it/s][A
Epoch 3/5:  70%|██████▉   | 1537/2208 [09:12<04:01,  2.78it/s][A
Epoch 3/5:  70%|██████▉   | 1538/2208 [09:12<03:59,  2.80it/s][A
Epoch 3/5:  70%|██████▉   | 1539/2208 [09:13<03:57,  2.82it/s][A
Epoch 3/5:  70%|██████▉   | 1540/2208 [09:13<04:00,  2.77it/s][A
Epoch 3/5:  70%|██████▉   | 1541/2208 [09:14<03:59,  2.78it/s][A
Epoch 3/5

Batch 1550: Training accuracy = 0.9141, F1 = 0.9031, Precision = 0.9010, Recall = 0.9141



Epoch 3/5:  70%|███████   | 1552/2208 [09:18<03:56,  2.78it/s][A
Epoch 3/5:  70%|███████   | 1553/2208 [09:18<03:53,  2.81it/s][A
Epoch 3/5:  70%|███████   | 1554/2208 [09:18<03:50,  2.84it/s][A
Epoch 3/5:  70%|███████   | 1555/2208 [09:19<03:48,  2.86it/s][A
Epoch 3/5:  70%|███████   | 1556/2208 [09:19<03:51,  2.81it/s][A
Epoch 3/5:  71%|███████   | 1557/2208 [09:19<03:48,  2.84it/s][A
Epoch 3/5:  71%|███████   | 1558/2208 [09:20<03:52,  2.79it/s][A
Epoch 3/5:  71%|███████   | 1559/2208 [09:20<03:52,  2.80it/s][A
Epoch 3/5:  71%|███████   | 1560/2208 [09:20<03:49,  2.82it/s][A
Epoch 3/5:  71%|███████   | 1561/2208 [09:21<03:53,  2.77it/s][A
Epoch 3/5:  71%|███████   | 1562/2208 [09:21<03:55,  2.74it/s][A
Epoch 3/5:  71%|███████   | 1563/2208 [09:21<03:57,  2.71it/s][A
Epoch 3/5:  71%|███████   | 1564/2208 [09:22<04:00,  2.67it/s][A
Epoch 3/5:  71%|███████   | 1565/2208 [09:22<03:56,  2.72it/s][A
Epoch 3/5:  71%|███████   | 1566/2208 [09:23<03:53,  2.75it/s][A
Epoch 3/5

Batch 1575: Training accuracy = 0.8984, F1 = 0.8919, Precision = 0.8971, Recall = 0.8984



Epoch 3/5:  71%|███████▏  | 1577/2208 [09:26<03:41,  2.85it/s][A
Epoch 3/5:  71%|███████▏  | 1578/2208 [09:27<03:39,  2.88it/s][A
Epoch 3/5:  72%|███████▏  | 1579/2208 [09:27<03:37,  2.89it/s][A
Epoch 3/5:  72%|███████▏  | 1580/2208 [09:27<03:37,  2.89it/s][A
Epoch 3/5:  72%|███████▏  | 1581/2208 [09:28<03:37,  2.88it/s][A
Epoch 3/5:  72%|███████▏  | 1582/2208 [09:28<03:36,  2.90it/s][A
Epoch 3/5:  72%|███████▏  | 1583/2208 [09:29<03:37,  2.88it/s][A
Epoch 3/5:  72%|███████▏  | 1584/2208 [09:29<03:36,  2.88it/s][A
Epoch 3/5:  72%|███████▏  | 1585/2208 [09:29<03:43,  2.79it/s][A
Epoch 3/5:  72%|███████▏  | 1586/2208 [09:30<03:40,  2.82it/s][A
Epoch 3/5:  72%|███████▏  | 1587/2208 [09:30<03:46,  2.74it/s][A
Epoch 3/5:  72%|███████▏  | 1588/2208 [09:30<03:42,  2.79it/s][A
Epoch 3/5:  72%|███████▏  | 1589/2208 [09:31<03:47,  2.72it/s][A
Epoch 3/5:  72%|███████▏  | 1590/2208 [09:31<03:47,  2.72it/s][A
Epoch 3/5:  72%|███████▏  | 1591/2208 [09:31<03:41,  2.78it/s][A
Epoch 3/5

Batch 1600: Training accuracy = 0.8438, F1 = 0.8305, Precision = 0.8333, Recall = 0.8438



Epoch 3/5:  73%|███████▎  | 1602/2208 [09:35<03:40,  2.75it/s][A
Epoch 3/5:  73%|███████▎  | 1603/2208 [09:36<03:38,  2.76it/s][A
Epoch 3/5:  73%|███████▎  | 1604/2208 [09:36<03:42,  2.71it/s][A
Epoch 3/5:  73%|███████▎  | 1605/2208 [09:36<03:40,  2.73it/s][A
Epoch 3/5:  73%|███████▎  | 1606/2208 [09:37<03:43,  2.70it/s][A
Epoch 3/5:  73%|███████▎  | 1607/2208 [09:37<03:39,  2.74it/s][A
Epoch 3/5:  73%|███████▎  | 1608/2208 [09:38<03:38,  2.75it/s][A
Epoch 3/5:  73%|███████▎  | 1609/2208 [09:38<03:37,  2.75it/s][A
Epoch 3/5:  73%|███████▎  | 1610/2208 [09:38<03:33,  2.80it/s][A
Epoch 3/5:  73%|███████▎  | 1611/2208 [09:39<03:31,  2.83it/s][A
Epoch 3/5:  73%|███████▎  | 1612/2208 [09:39<03:29,  2.84it/s][A
Epoch 3/5:  73%|███████▎  | 1613/2208 [09:39<03:28,  2.86it/s][A
Epoch 3/5:  73%|███████▎  | 1614/2208 [09:40<03:27,  2.87it/s][A
Epoch 3/5:  73%|███████▎  | 1615/2208 [09:40<03:25,  2.88it/s][A
Epoch 3/5:  73%|███████▎  | 1616/2208 [09:40<03:25,  2.88it/s][A
Epoch 3/5

Batch 1625: Training accuracy = 0.8750, F1 = 0.8565, Precision = 0.8542, Recall = 0.8750



Epoch 3/5:  74%|███████▎  | 1627/2208 [09:44<03:24,  2.84it/s][A
Epoch 3/5:  74%|███████▎  | 1628/2208 [09:45<03:24,  2.84it/s][A
Epoch 3/5:  74%|███████▍  | 1629/2208 [09:45<03:22,  2.86it/s][A
Epoch 3/5:  74%|███████▍  | 1630/2208 [09:45<03:22,  2.86it/s][A
Epoch 3/5:  74%|███████▍  | 1631/2208 [09:46<03:22,  2.85it/s][A
Epoch 3/5:  74%|███████▍  | 1632/2208 [09:46<03:24,  2.82it/s][A
Epoch 3/5:  74%|███████▍  | 1633/2208 [09:46<03:24,  2.81it/s][A
Epoch 3/5:  74%|███████▍  | 1634/2208 [09:47<03:27,  2.77it/s][A
Epoch 3/5:  74%|███████▍  | 1635/2208 [09:47<03:27,  2.76it/s][A
Epoch 3/5:  74%|███████▍  | 1636/2208 [09:47<03:26,  2.77it/s][A
Epoch 3/5:  74%|███████▍  | 1637/2208 [09:48<03:27,  2.75it/s][A
Epoch 3/5:  74%|███████▍  | 1638/2208 [09:48<03:27,  2.75it/s][A
Epoch 3/5:  74%|███████▍  | 1639/2208 [09:49<03:32,  2.68it/s][A
Epoch 3/5:  74%|███████▍  | 1640/2208 [09:49<03:27,  2.74it/s][A
Epoch 3/5:  74%|███████▍  | 1641/2208 [09:49<03:25,  2.76it/s][A
Epoch 3/5

Batch 1650: Training accuracy = 0.8203, F1 = 0.8047, Precision = 0.8112, Recall = 0.8203



Epoch 3/5:  75%|███████▍  | 1652/2208 [09:53<03:20,  2.77it/s][A
Epoch 3/5:  75%|███████▍  | 1653/2208 [09:54<03:20,  2.77it/s][A
Epoch 3/5:  75%|███████▍  | 1654/2208 [09:54<03:18,  2.80it/s][A
Epoch 3/5:  75%|███████▍  | 1655/2208 [09:54<03:16,  2.82it/s][A
Epoch 3/5:  75%|███████▌  | 1656/2208 [09:55<03:15,  2.82it/s][A
Epoch 3/5:  75%|███████▌  | 1657/2208 [09:55<03:13,  2.85it/s][A
Epoch 3/5:  75%|███████▌  | 1658/2208 [09:55<03:17,  2.79it/s][A
Epoch 3/5:  75%|███████▌  | 1659/2208 [09:56<03:19,  2.76it/s][A
Epoch 3/5:  75%|███████▌  | 1660/2208 [09:56<03:21,  2.72it/s][A
Epoch 3/5:  75%|███████▌  | 1661/2208 [09:56<03:19,  2.75it/s][A
Epoch 3/5:  75%|███████▌  | 1662/2208 [09:57<03:18,  2.75it/s][A
Epoch 3/5:  75%|███████▌  | 1663/2208 [09:57<03:15,  2.78it/s][A
Epoch 3/5:  75%|███████▌  | 1664/2208 [09:58<03:14,  2.80it/s][A
Epoch 3/5:  75%|███████▌  | 1665/2208 [09:58<03:10,  2.84it/s][A
Epoch 3/5:  75%|███████▌  | 1666/2208 [09:58<03:08,  2.88it/s][A
Epoch 3/5

Batch 1675: Training accuracy = 0.8984, F1 = 0.8964, Precision = 0.8984, Recall = 0.8984



Epoch 3/5:  76%|███████▌  | 1677/2208 [10:02<03:16,  2.71it/s][A
Epoch 3/5:  76%|███████▌  | 1678/2208 [10:03<03:14,  2.72it/s][A
Epoch 3/5:  76%|███████▌  | 1679/2208 [10:03<03:16,  2.69it/s][A
Epoch 3/5:  76%|███████▌  | 1680/2208 [10:03<03:12,  2.74it/s][A
Epoch 3/5:  76%|███████▌  | 1681/2208 [10:04<03:09,  2.78it/s][A
Epoch 3/5:  76%|███████▌  | 1682/2208 [10:04<03:07,  2.81it/s][A
Epoch 3/5:  76%|███████▌  | 1683/2208 [10:04<03:08,  2.79it/s][A
Epoch 3/5:  76%|███████▋  | 1684/2208 [10:05<03:13,  2.71it/s][A
Epoch 3/5:  76%|███████▋  | 1685/2208 [10:05<03:13,  2.70it/s][A
Epoch 3/5:  76%|███████▋  | 1686/2208 [10:06<03:14,  2.68it/s][A
Epoch 3/5:  76%|███████▋  | 1687/2208 [10:06<03:12,  2.70it/s][A
Epoch 3/5:  76%|███████▋  | 1688/2208 [10:06<03:18,  2.62it/s][A
Epoch 3/5:  76%|███████▋  | 1689/2208 [10:07<03:13,  2.68it/s][A
Epoch 3/5:  77%|███████▋  | 1690/2208 [10:07<03:15,  2.65it/s][A
Epoch 3/5:  77%|███████▋  | 1691/2208 [10:07<03:13,  2.67it/s][A
Epoch 3/5

Batch 1700: Training accuracy = 0.8906, F1 = 0.8839, Precision = 0.8854, Recall = 0.8906



Epoch 3/5:  77%|███████▋  | 1702/2208 [10:11<02:58,  2.84it/s][A
Epoch 3/5:  77%|███████▋  | 1703/2208 [10:12<03:02,  2.77it/s][A
Epoch 3/5:  77%|███████▋  | 1704/2208 [10:12<02:59,  2.81it/s][A
Epoch 3/5:  77%|███████▋  | 1705/2208 [10:12<02:56,  2.85it/s][A
Epoch 3/5:  77%|███████▋  | 1706/2208 [10:13<02:56,  2.84it/s][A
Epoch 3/5:  77%|███████▋  | 1707/2208 [10:13<02:54,  2.86it/s][A
Epoch 3/5:  77%|███████▋  | 1708/2208 [10:13<02:54,  2.86it/s][A
Epoch 3/5:  77%|███████▋  | 1709/2208 [10:14<02:55,  2.84it/s][A
Epoch 3/5:  77%|███████▋  | 1710/2208 [10:14<02:54,  2.85it/s][A
Epoch 3/5:  77%|███████▋  | 1711/2208 [10:14<02:56,  2.82it/s][A
Epoch 3/5:  78%|███████▊  | 1712/2208 [10:15<02:58,  2.77it/s][A
Epoch 3/5:  78%|███████▊  | 1713/2208 [10:15<03:01,  2.73it/s][A
Epoch 3/5:  78%|███████▊  | 1714/2208 [10:16<02:57,  2.78it/s][A
Epoch 3/5:  78%|███████▊  | 1715/2208 [10:16<02:55,  2.81it/s][A
Epoch 3/5:  78%|███████▊  | 1716/2208 [10:16<02:56,  2.80it/s][A
Epoch 3/5

Batch 1725: Training accuracy = 0.8516, F1 = 0.8333, Precision = 0.8336, Recall = 0.8516



Epoch 3/5:  78%|███████▊  | 1727/2208 [10:20<02:53,  2.77it/s][A
Epoch 3/5:  78%|███████▊  | 1728/2208 [10:21<02:54,  2.74it/s][A
Epoch 3/5:  78%|███████▊  | 1729/2208 [10:21<03:00,  2.65it/s][A
Epoch 3/5:  78%|███████▊  | 1730/2208 [10:21<02:56,  2.70it/s][A
Epoch 3/5:  78%|███████▊  | 1731/2208 [10:22<02:53,  2.75it/s][A
Epoch 3/5:  78%|███████▊  | 1732/2208 [10:22<02:50,  2.80it/s][A
Epoch 3/5:  78%|███████▊  | 1733/2208 [10:23<02:54,  2.72it/s][A
Epoch 3/5:  79%|███████▊  | 1734/2208 [10:23<02:51,  2.76it/s][A
Epoch 3/5:  79%|███████▊  | 1735/2208 [10:23<02:53,  2.73it/s][A
Epoch 3/5:  79%|███████▊  | 1736/2208 [10:24<02:48,  2.80it/s][A
Epoch 3/5:  79%|███████▊  | 1737/2208 [10:24<02:46,  2.83it/s][A
Epoch 3/5:  79%|███████▊  | 1738/2208 [10:24<02:45,  2.84it/s][A
Epoch 3/5:  79%|███████▉  | 1739/2208 [10:25<02:45,  2.83it/s][A
Epoch 3/5:  79%|███████▉  | 1740/2208 [10:25<02:43,  2.86it/s][A
Epoch 3/5:  79%|███████▉  | 1741/2208 [10:25<02:41,  2.88it/s][A
Epoch 3/5

Batch 1750: Training accuracy = 0.8906, F1 = 0.8735, Precision = 0.8747, Recall = 0.8906



Epoch 3/5:  79%|███████▉  | 1752/2208 [10:29<02:41,  2.82it/s][A
Epoch 3/5:  79%|███████▉  | 1753/2208 [10:30<02:40,  2.83it/s][A
Epoch 3/5:  79%|███████▉  | 1754/2208 [10:30<02:38,  2.86it/s][A
Epoch 3/5:  79%|███████▉  | 1755/2208 [10:30<02:41,  2.81it/s][A
Epoch 3/5:  80%|███████▉  | 1756/2208 [10:31<02:39,  2.84it/s][A
Epoch 3/5:  80%|███████▉  | 1757/2208 [10:31<02:41,  2.79it/s][A
Epoch 3/5:  80%|███████▉  | 1758/2208 [10:31<02:40,  2.81it/s][A
Epoch 3/5:  80%|███████▉  | 1759/2208 [10:32<02:41,  2.77it/s][A
Epoch 3/5:  80%|███████▉  | 1760/2208 [10:32<02:40,  2.78it/s][A
Epoch 3/5:  80%|███████▉  | 1761/2208 [10:33<02:39,  2.81it/s][A
Epoch 3/5:  80%|███████▉  | 1762/2208 [10:33<02:40,  2.78it/s][A
Epoch 3/5:  80%|███████▉  | 1763/2208 [10:33<02:41,  2.76it/s][A
Epoch 3/5:  80%|███████▉  | 1764/2208 [10:34<02:40,  2.76it/s][A
Epoch 3/5:  80%|███████▉  | 1765/2208 [10:34<02:44,  2.69it/s][A
Epoch 3/5:  80%|███████▉  | 1766/2208 [10:34<02:42,  2.72it/s][A
Epoch 3/5

Batch 1775: Training accuracy = 0.8750, F1 = 0.8755, Precision = 0.8965, Recall = 0.8750



Epoch 3/5:  80%|████████  | 1777/2208 [10:38<02:36,  2.76it/s][A
Epoch 3/5:  81%|████████  | 1778/2208 [10:39<02:33,  2.80it/s][A
Epoch 3/5:  81%|████████  | 1779/2208 [10:39<02:32,  2.82it/s][A
Epoch 3/5:  81%|████████  | 1780/2208 [10:39<02:30,  2.84it/s][A
Epoch 3/5:  81%|████████  | 1781/2208 [10:40<02:30,  2.84it/s][A
Epoch 3/5:  81%|████████  | 1782/2208 [10:40<02:31,  2.81it/s][A
Epoch 3/5:  81%|████████  | 1783/2208 [10:40<02:29,  2.83it/s][A
Epoch 3/5:  81%|████████  | 1784/2208 [10:41<02:30,  2.82it/s][A
Epoch 3/5:  81%|████████  | 1785/2208 [10:41<02:34,  2.74it/s][A
Epoch 3/5:  81%|████████  | 1786/2208 [10:42<02:34,  2.74it/s][A
Epoch 3/5:  81%|████████  | 1787/2208 [10:42<02:30,  2.79it/s][A
Epoch 3/5:  81%|████████  | 1788/2208 [10:42<02:28,  2.83it/s][A
Epoch 3/5:  81%|████████  | 1789/2208 [10:43<02:31,  2.77it/s][A
Epoch 3/5:  81%|████████  | 1790/2208 [10:43<02:31,  2.77it/s][A
Epoch 3/5:  81%|████████  | 1791/2208 [10:43<02:28,  2.81it/s][A
Epoch 3/5

Batch 1800: Training accuracy = 0.8984, F1 = 0.9016, Precision = 0.9258, Recall = 0.8984



Epoch 3/5:  82%|████████▏ | 1802/2208 [10:47<02:28,  2.74it/s][A
Epoch 3/5:  82%|████████▏ | 1803/2208 [10:48<02:24,  2.79it/s][A
Epoch 3/5:  82%|████████▏ | 1804/2208 [10:48<02:24,  2.79it/s][A
Epoch 3/5:  82%|████████▏ | 1805/2208 [10:48<02:25,  2.78it/s][A
Epoch 3/5:  82%|████████▏ | 1806/2208 [10:49<02:27,  2.72it/s][A
Epoch 3/5:  82%|████████▏ | 1807/2208 [10:49<02:26,  2.73it/s][A
Epoch 3/5:  82%|████████▏ | 1808/2208 [10:50<02:27,  2.72it/s][A
Epoch 3/5:  82%|████████▏ | 1809/2208 [10:50<02:30,  2.66it/s][A
Epoch 3/5:  82%|████████▏ | 1810/2208 [10:50<02:27,  2.69it/s][A
Epoch 3/5:  82%|████████▏ | 1811/2208 [10:51<02:27,  2.69it/s][A
Epoch 3/5:  82%|████████▏ | 1812/2208 [10:51<02:24,  2.74it/s][A
Epoch 3/5:  82%|████████▏ | 1813/2208 [10:51<02:22,  2.77it/s][A
Epoch 3/5:  82%|████████▏ | 1814/2208 [10:52<02:20,  2.81it/s][A
Epoch 3/5:  82%|████████▏ | 1815/2208 [10:52<02:19,  2.81it/s][A
Epoch 3/5:  82%|████████▏ | 1816/2208 [10:52<02:17,  2.85it/s][A
Epoch 3/5

Batch 1825: Training accuracy = 0.8828, F1 = 0.8763, Precision = 0.8815, Recall = 0.8828



Epoch 3/5:  83%|████████▎ | 1827/2208 [10:56<02:14,  2.83it/s][A
Epoch 3/5:  83%|████████▎ | 1828/2208 [10:57<02:13,  2.85it/s][A
Epoch 3/5:  83%|████████▎ | 1829/2208 [10:57<02:11,  2.89it/s][A
Epoch 3/5:  83%|████████▎ | 1830/2208 [10:57<02:09,  2.91it/s][A
Epoch 3/5:  83%|████████▎ | 1831/2208 [10:58<02:10,  2.89it/s][A
Epoch 3/5:  83%|████████▎ | 1832/2208 [10:58<02:09,  2.90it/s][A
Epoch 3/5:  83%|████████▎ | 1833/2208 [10:58<02:11,  2.84it/s][A
Epoch 3/5:  83%|████████▎ | 1834/2208 [10:59<02:11,  2.84it/s][A
Epoch 3/5:  83%|████████▎ | 1835/2208 [10:59<02:13,  2.80it/s][A
Epoch 3/5:  83%|████████▎ | 1836/2208 [10:59<02:12,  2.82it/s][A
Epoch 3/5:  83%|████████▎ | 1837/2208 [11:00<02:11,  2.83it/s][A
Epoch 3/5:  83%|████████▎ | 1838/2208 [11:00<02:09,  2.86it/s][A
Epoch 3/5:  83%|████████▎ | 1839/2208 [11:00<02:08,  2.87it/s][A
Epoch 3/5:  83%|████████▎ | 1840/2208 [11:01<02:11,  2.81it/s][A
Epoch 3/5:  83%|████████▎ | 1841/2208 [11:01<02:09,  2.82it/s][A
Epoch 3/5

Batch 1850: Training accuracy = 0.8672, F1 = 0.8516, Precision = 0.8477, Recall = 0.8672



Epoch 3/5:  84%|████████▍ | 1852/2208 [11:05<02:09,  2.76it/s][A
Epoch 3/5:  84%|████████▍ | 1853/2208 [11:06<02:09,  2.74it/s][A
Epoch 3/5:  84%|████████▍ | 1854/2208 [11:06<02:10,  2.72it/s][A
Epoch 3/5:  84%|████████▍ | 1855/2208 [11:06<02:07,  2.77it/s][A
Epoch 3/5:  84%|████████▍ | 1856/2208 [11:07<02:07,  2.76it/s][A
Epoch 3/5:  84%|████████▍ | 1857/2208 [11:07<02:07,  2.75it/s][A
Epoch 3/5:  84%|████████▍ | 1858/2208 [11:07<02:04,  2.80it/s][A
Epoch 3/5:  84%|████████▍ | 1859/2208 [11:08<02:07,  2.75it/s][A
Epoch 3/5:  84%|████████▍ | 1860/2208 [11:08<02:09,  2.69it/s][A
Epoch 3/5:  84%|████████▍ | 1861/2208 [11:08<02:08,  2.69it/s][A
Epoch 3/5:  84%|████████▍ | 1862/2208 [11:09<02:09,  2.66it/s][A
Epoch 3/5:  84%|████████▍ | 1863/2208 [11:09<02:05,  2.75it/s][A
Epoch 3/5:  84%|████████▍ | 1864/2208 [11:10<02:06,  2.73it/s][A
Epoch 3/5:  84%|████████▍ | 1865/2208 [11:10<02:03,  2.79it/s][A
Epoch 3/5:  85%|████████▍ | 1866/2208 [11:10<02:05,  2.73it/s][A
Epoch 3/5

Batch 1875: Training accuracy = 0.8281, F1 = 0.8065, Precision = 0.7972, Recall = 0.8281



Epoch 3/5:  85%|████████▌ | 1877/2208 [11:14<02:04,  2.66it/s][A
Epoch 3/5:  85%|████████▌ | 1878/2208 [11:15<02:00,  2.73it/s][A
Epoch 3/5:  85%|████████▌ | 1879/2208 [11:15<02:02,  2.68it/s][A
Epoch 3/5:  85%|████████▌ | 1880/2208 [11:15<02:00,  2.73it/s][A
Epoch 3/5:  85%|████████▌ | 1881/2208 [11:16<01:58,  2.77it/s][A
Epoch 3/5:  85%|████████▌ | 1882/2208 [11:16<01:58,  2.75it/s][A
Epoch 3/5:  85%|████████▌ | 1883/2208 [11:16<01:56,  2.80it/s][A
Epoch 3/5:  85%|████████▌ | 1884/2208 [11:17<01:55,  2.80it/s][A
Epoch 3/5:  85%|████████▌ | 1885/2208 [11:17<01:54,  2.83it/s][A
Epoch 3/5:  85%|████████▌ | 1886/2208 [11:18<01:56,  2.77it/s][A
Epoch 3/5:  85%|████████▌ | 1887/2208 [11:18<01:54,  2.81it/s][A
Epoch 3/5:  86%|████████▌ | 1888/2208 [11:18<01:53,  2.82it/s][A
Epoch 3/5:  86%|████████▌ | 1889/2208 [11:19<01:55,  2.75it/s][A
Epoch 3/5:  86%|████████▌ | 1890/2208 [11:19<01:53,  2.80it/s][A
Epoch 3/5:  86%|████████▌ | 1891/2208 [11:19<01:57,  2.69it/s][A
Epoch 3/5

Batch 1900: Training accuracy = 0.8984, F1 = 0.8862, Precision = 0.8880, Recall = 0.8984



Epoch 3/5:  86%|████████▌ | 1902/2208 [11:23<01:50,  2.77it/s][A
Epoch 3/5:  86%|████████▌ | 1903/2208 [11:24<01:51,  2.73it/s][A
Epoch 3/5:  86%|████████▌ | 1904/2208 [11:24<01:49,  2.78it/s][A
Epoch 3/5:  86%|████████▋ | 1905/2208 [11:24<01:47,  2.82it/s][A
Epoch 3/5:  86%|████████▋ | 1906/2208 [11:25<01:49,  2.77it/s][A
Epoch 3/5:  86%|████████▋ | 1907/2208 [11:25<01:49,  2.75it/s][A
Epoch 3/5:  86%|████████▋ | 1908/2208 [11:25<01:47,  2.79it/s][A
Epoch 3/5:  86%|████████▋ | 1909/2208 [11:26<01:47,  2.78it/s][A
Epoch 3/5:  87%|████████▋ | 1910/2208 [11:26<01:45,  2.81it/s][A
Epoch 3/5:  87%|████████▋ | 1911/2208 [11:27<01:48,  2.75it/s][A
Epoch 3/5:  87%|████████▋ | 1912/2208 [11:27<01:48,  2.73it/s][A
Epoch 3/5:  87%|████████▋ | 1913/2208 [11:27<01:48,  2.73it/s][A
Epoch 3/5:  87%|████████▋ | 1914/2208 [11:28<01:46,  2.76it/s][A
Epoch 3/5:  87%|████████▋ | 1915/2208 [11:28<01:45,  2.77it/s][A
Epoch 3/5:  87%|████████▋ | 1916/2208 [11:28<01:43,  2.82it/s][A
Epoch 3/5

Batch 1925: Training accuracy = 0.8281, F1 = 0.8115, Precision = 0.8154, Recall = 0.8281



Epoch 3/5:  87%|████████▋ | 1927/2208 [11:32<01:42,  2.74it/s][A
Epoch 3/5:  87%|████████▋ | 1928/2208 [11:33<01:44,  2.69it/s][A
Epoch 3/5:  87%|████████▋ | 1929/2208 [11:33<01:41,  2.75it/s][A
Epoch 3/5:  87%|████████▋ | 1930/2208 [11:33<01:43,  2.69it/s][A
Epoch 3/5:  87%|████████▋ | 1931/2208 [11:34<01:42,  2.70it/s][A
Epoch 3/5:  88%|████████▊ | 1932/2208 [11:34<01:42,  2.69it/s][A
Epoch 3/5:  88%|████████▊ | 1933/2208 [11:35<01:39,  2.75it/s][A
Epoch 3/5:  88%|████████▊ | 1934/2208 [11:35<01:42,  2.68it/s][A
Epoch 3/5:  88%|████████▊ | 1935/2208 [11:35<01:39,  2.74it/s][A
Epoch 3/5:  88%|████████▊ | 1936/2208 [11:36<01:39,  2.72it/s][A
Epoch 3/5:  88%|████████▊ | 1937/2208 [11:36<01:40,  2.71it/s][A
Epoch 3/5:  88%|████████▊ | 1938/2208 [11:36<01:39,  2.72it/s][A
Epoch 3/5:  88%|████████▊ | 1939/2208 [11:37<01:36,  2.79it/s][A
Epoch 3/5:  88%|████████▊ | 1940/2208 [11:37<01:34,  2.83it/s][A
Epoch 3/5:  88%|████████▊ | 1941/2208 [11:37<01:35,  2.79it/s][A
Epoch 3/5

Batch 1950: Training accuracy = 0.8047, F1 = 0.7956, Precision = 0.8079, Recall = 0.8047



Epoch 3/5:  88%|████████▊ | 1952/2208 [11:41<01:30,  2.82it/s][A
Epoch 3/5:  88%|████████▊ | 1953/2208 [11:42<01:30,  2.83it/s][A
Epoch 3/5:  88%|████████▊ | 1954/2208 [11:42<01:30,  2.79it/s][A
Epoch 3/5:  89%|████████▊ | 1955/2208 [11:42<01:29,  2.84it/s][A
Epoch 3/5:  89%|████████▊ | 1956/2208 [11:43<01:30,  2.79it/s][A
Epoch 3/5:  89%|████████▊ | 1957/2208 [11:43<01:30,  2.77it/s][A
Epoch 3/5:  89%|████████▊ | 1958/2208 [11:43<01:28,  2.81it/s][A
Epoch 3/5:  89%|████████▊ | 1959/2208 [11:44<01:29,  2.78it/s][A
Epoch 3/5:  89%|████████▉ | 1960/2208 [11:44<01:27,  2.84it/s][A
Epoch 3/5:  89%|████████▉ | 1961/2208 [11:44<01:26,  2.86it/s][A
Epoch 3/5:  89%|████████▉ | 1962/2208 [11:45<01:26,  2.84it/s][A
Epoch 3/5:  89%|████████▉ | 1963/2208 [11:45<01:26,  2.83it/s][A
Epoch 3/5:  89%|████████▉ | 1964/2208 [11:46<01:25,  2.85it/s][A
Epoch 3/5:  89%|████████▉ | 1965/2208 [11:46<01:24,  2.88it/s][A
Epoch 3/5:  89%|████████▉ | 1966/2208 [11:46<01:24,  2.87it/s][A
Epoch 3/5

Batch 1975: Training accuracy = 0.8594, F1 = 0.8458, Precision = 0.8424, Recall = 0.8594



Epoch 3/5:  90%|████████▉ | 1977/2208 [11:50<01:21,  2.82it/s][A
Epoch 3/5:  90%|████████▉ | 1978/2208 [11:50<01:20,  2.86it/s][A
Epoch 3/5:  90%|████████▉ | 1979/2208 [11:51<01:20,  2.83it/s][A
Epoch 3/5:  90%|████████▉ | 1980/2208 [11:51<01:19,  2.87it/s][A
Epoch 3/5:  90%|████████▉ | 1981/2208 [11:52<01:18,  2.88it/s][A
Epoch 3/5:  90%|████████▉ | 1982/2208 [11:52<01:17,  2.90it/s][A
Epoch 3/5:  90%|████████▉ | 1983/2208 [11:52<01:17,  2.91it/s][A
Epoch 3/5:  90%|████████▉ | 1984/2208 [11:53<01:17,  2.89it/s][A
Epoch 3/5:  90%|████████▉ | 1985/2208 [11:53<01:17,  2.88it/s][A
Epoch 3/5:  90%|████████▉ | 1986/2208 [11:53<01:16,  2.90it/s][A
Epoch 3/5:  90%|████████▉ | 1987/2208 [11:54<01:18,  2.83it/s][A
Epoch 3/5:  90%|█████████ | 1988/2208 [11:54<01:17,  2.84it/s][A
Epoch 3/5:  90%|█████████ | 1989/2208 [11:54<01:18,  2.80it/s][A
Epoch 3/5:  90%|█████████ | 1990/2208 [11:55<01:19,  2.75it/s][A
Epoch 3/5:  90%|█████████ | 1991/2208 [11:55<01:19,  2.72it/s][A
Epoch 3/5

Batch 2000: Training accuracy = 0.8438, F1 = 0.8286, Precision = 0.8281, Recall = 0.8438



Epoch 3/5:  91%|█████████ | 2002/2208 [11:59<01:12,  2.84it/s][A
Epoch 3/5:  91%|█████████ | 2003/2208 [11:59<01:11,  2.86it/s][A
Epoch 3/5:  91%|█████████ | 2004/2208 [12:00<01:11,  2.87it/s][A
Epoch 3/5:  91%|█████████ | 2005/2208 [12:00<01:12,  2.81it/s][A
Epoch 3/5:  91%|█████████ | 2006/2208 [12:00<01:12,  2.78it/s][A
Epoch 3/5:  91%|█████████ | 2007/2208 [12:01<01:11,  2.81it/s][A
Epoch 3/5:  91%|█████████ | 2008/2208 [12:01<01:11,  2.78it/s][A
Epoch 3/5:  91%|█████████ | 2009/2208 [12:02<01:11,  2.79it/s][A
Epoch 3/5:  91%|█████████ | 2010/2208 [12:02<01:10,  2.79it/s][A
Epoch 3/5:  91%|█████████ | 2011/2208 [12:02<01:13,  2.69it/s][A
Epoch 3/5:  91%|█████████ | 2012/2208 [12:03<01:13,  2.65it/s][A
Epoch 3/5:  91%|█████████ | 2013/2208 [12:03<01:12,  2.68it/s][A
Epoch 3/5:  91%|█████████ | 2014/2208 [12:03<01:10,  2.75it/s][A
Epoch 3/5:  91%|█████████▏| 2015/2208 [12:04<01:10,  2.74it/s][A
Epoch 3/5:  91%|█████████▏| 2016/2208 [12:04<01:08,  2.81it/s][A
Epoch 3/5

Batch 2025: Training accuracy = 0.8281, F1 = 0.8159, Precision = 0.8255, Recall = 0.8281



Epoch 3/5:  92%|█████████▏| 2027/2208 [12:08<01:05,  2.75it/s][A
Epoch 3/5:  92%|█████████▏| 2028/2208 [12:08<01:04,  2.79it/s][A
Epoch 3/5:  92%|█████████▏| 2029/2208 [12:09<01:03,  2.80it/s][A
Epoch 3/5:  92%|█████████▏| 2030/2208 [12:09<01:03,  2.79it/s][A
Epoch 3/5:  92%|█████████▏| 2031/2208 [12:10<01:04,  2.76it/s][A
Epoch 3/5:  92%|█████████▏| 2032/2208 [12:10<01:02,  2.81it/s][A
Epoch 3/5:  92%|█████████▏| 2033/2208 [12:10<01:02,  2.78it/s][A
Epoch 3/5:  92%|█████████▏| 2034/2208 [12:11<01:01,  2.83it/s][A
Epoch 3/5:  92%|█████████▏| 2035/2208 [12:11<01:00,  2.86it/s][A
Epoch 3/5:  92%|█████████▏| 2036/2208 [12:11<00:59,  2.87it/s][A
Epoch 3/5:  92%|█████████▏| 2037/2208 [12:12<01:00,  2.83it/s][A
Epoch 3/5:  92%|█████████▏| 2038/2208 [12:12<00:59,  2.86it/s][A
Epoch 3/5:  92%|█████████▏| 2039/2208 [12:12<00:59,  2.86it/s][A
Epoch 3/5:  92%|█████████▏| 2040/2208 [12:13<00:59,  2.83it/s][A
Epoch 3/5:  92%|█████████▏| 2041/2208 [12:13<01:00,  2.75it/s][A
Epoch 3/5

Batch 2050: Training accuracy = 0.8203, F1 = 0.8097, Precision = 0.8227, Recall = 0.8203



Epoch 3/5:  93%|█████████▎| 2052/2208 [12:17<00:56,  2.76it/s][A
Epoch 3/5:  93%|█████████▎| 2053/2208 [12:17<00:55,  2.80it/s][A
Epoch 3/5:  93%|█████████▎| 2054/2208 [12:18<00:57,  2.68it/s][A
Epoch 3/5:  93%|█████████▎| 2055/2208 [12:18<00:56,  2.69it/s][A
Epoch 3/5:  93%|█████████▎| 2056/2208 [12:19<00:55,  2.73it/s][A
Epoch 3/5:  93%|█████████▎| 2057/2208 [12:19<00:56,  2.65it/s][A
Epoch 3/5:  93%|█████████▎| 2058/2208 [12:19<00:55,  2.70it/s][A
Epoch 3/5:  93%|█████████▎| 2059/2208 [12:20<00:53,  2.77it/s][A
Epoch 3/5:  93%|█████████▎| 2060/2208 [12:20<00:54,  2.70it/s][A
Epoch 3/5:  93%|█████████▎| 2061/2208 [12:20<00:54,  2.72it/s][A
Epoch 3/5:  93%|█████████▎| 2062/2208 [12:21<00:53,  2.71it/s][A
Epoch 3/5:  93%|█████████▎| 2063/2208 [12:21<00:53,  2.71it/s][A
Epoch 3/5:  93%|█████████▎| 2064/2208 [12:22<00:51,  2.77it/s][A
Epoch 3/5:  94%|█████████▎| 2065/2208 [12:22<00:50,  2.81it/s][A
Epoch 3/5:  94%|█████████▎| 2066/2208 [12:22<00:49,  2.85it/s][A
Epoch 3/5

Batch 2075: Training accuracy = 0.8906, F1 = 0.8797, Precision = 0.8854, Recall = 0.8906



Epoch 3/5:  94%|█████████▍| 2077/2208 [12:26<00:47,  2.76it/s][A
Epoch 3/5:  94%|█████████▍| 2078/2208 [12:26<00:46,  2.81it/s][A
Epoch 3/5:  94%|█████████▍| 2079/2208 [12:27<00:46,  2.77it/s][A
Epoch 3/5:  94%|█████████▍| 2080/2208 [12:27<00:45,  2.79it/s][A
Epoch 3/5:  94%|█████████▍| 2081/2208 [12:28<00:45,  2.78it/s][A
Epoch 3/5:  94%|█████████▍| 2082/2208 [12:28<00:44,  2.81it/s][A
Epoch 3/5:  94%|█████████▍| 2083/2208 [12:28<00:45,  2.77it/s][A
Epoch 3/5:  94%|█████████▍| 2084/2208 [12:29<00:44,  2.76it/s][A
Epoch 3/5:  94%|█████████▍| 2085/2208 [12:29<00:44,  2.79it/s][A
Epoch 3/5:  94%|█████████▍| 2086/2208 [12:29<00:43,  2.81it/s][A
Epoch 3/5:  95%|█████████▍| 2087/2208 [12:30<00:43,  2.80it/s][A
Epoch 3/5:  95%|█████████▍| 2088/2208 [12:30<00:42,  2.83it/s][A
Epoch 3/5:  95%|█████████▍| 2089/2208 [12:30<00:42,  2.82it/s][A
Epoch 3/5:  95%|█████████▍| 2090/2208 [12:31<00:42,  2.78it/s][A
Epoch 3/5:  95%|█████████▍| 2091/2208 [12:31<00:41,  2.79it/s][A
Epoch 3/5

Batch 2100: Training accuracy = 0.8750, F1 = 0.8659, Precision = 0.8763, Recall = 0.8750



Epoch 3/5:  95%|█████████▌| 2102/2208 [12:35<00:38,  2.79it/s][A
Epoch 3/5:  95%|█████████▌| 2103/2208 [12:35<00:38,  2.72it/s][A
Epoch 3/5:  95%|█████████▌| 2104/2208 [12:36<00:37,  2.77it/s][A
Epoch 3/5:  95%|█████████▌| 2105/2208 [12:36<00:36,  2.80it/s][A
Epoch 3/5:  95%|█████████▌| 2106/2208 [12:36<00:36,  2.80it/s][A
Epoch 3/5:  95%|█████████▌| 2107/2208 [12:37<00:35,  2.85it/s][A
Epoch 3/5:  95%|█████████▌| 2108/2208 [12:37<00:35,  2.84it/s][A
Epoch 3/5:  96%|█████████▌| 2109/2208 [12:37<00:35,  2.82it/s][A
Epoch 3/5:  96%|█████████▌| 2110/2208 [12:38<00:35,  2.79it/s][A
Epoch 3/5:  96%|█████████▌| 2111/2208 [12:38<00:35,  2.71it/s][A
Epoch 3/5:  96%|█████████▌| 2112/2208 [12:39<00:35,  2.69it/s][A
Epoch 3/5:  96%|█████████▌| 2113/2208 [12:39<00:34,  2.73it/s][A
Epoch 3/5:  96%|█████████▌| 2114/2208 [12:39<00:34,  2.73it/s][A
Epoch 3/5:  96%|█████████▌| 2115/2208 [12:40<00:33,  2.74it/s][A
Epoch 3/5:  96%|█████████▌| 2116/2208 [12:40<00:33,  2.78it/s][A
Epoch 3/5

Batch 2125: Training accuracy = 0.8672, F1 = 0.8565, Precision = 0.8711, Recall = 0.8672



Epoch 3/5:  96%|█████████▋| 2127/2208 [12:44<00:28,  2.80it/s][A
Epoch 3/5:  96%|█████████▋| 2128/2208 [12:44<00:28,  2.78it/s][A
Epoch 3/5:  96%|█████████▋| 2129/2208 [12:45<00:28,  2.77it/s][A
Epoch 3/5:  96%|█████████▋| 2130/2208 [12:45<00:28,  2.73it/s][A
Epoch 3/5:  97%|█████████▋| 2131/2208 [12:45<00:27,  2.77it/s][A
Epoch 3/5:  97%|█████████▋| 2132/2208 [12:46<00:27,  2.75it/s][A
Epoch 3/5:  97%|█████████▋| 2133/2208 [12:46<00:26,  2.78it/s][A
Epoch 3/5:  97%|█████████▋| 2134/2208 [12:47<00:27,  2.73it/s][A
Epoch 3/5:  97%|█████████▋| 2135/2208 [12:47<00:26,  2.75it/s][A
Epoch 3/5:  97%|█████████▋| 2136/2208 [12:47<00:26,  2.71it/s][A
Epoch 3/5:  97%|█████████▋| 2137/2208 [12:48<00:26,  2.64it/s][A
Epoch 3/5:  97%|█████████▋| 2138/2208 [12:48<00:26,  2.63it/s][A
Epoch 3/5:  97%|█████████▋| 2139/2208 [12:48<00:25,  2.69it/s][A
Epoch 3/5:  97%|█████████▋| 2140/2208 [12:49<00:25,  2.64it/s][A
Epoch 3/5:  97%|█████████▋| 2141/2208 [12:49<00:24,  2.69it/s][A
Epoch 3/5

Batch 2150: Training accuracy = 0.8906, F1 = 0.8841, Precision = 0.8854, Recall = 0.8906



Epoch 3/5:  97%|█████████▋| 2152/2208 [12:53<00:20,  2.79it/s][A
Epoch 3/5:  98%|█████████▊| 2153/2208 [12:53<00:19,  2.83it/s][A
Epoch 3/5:  98%|█████████▊| 2154/2208 [12:54<00:18,  2.87it/s][A
Epoch 3/5:  98%|█████████▊| 2155/2208 [12:54<00:18,  2.89it/s][A
Epoch 3/5:  98%|█████████▊| 2156/2208 [12:55<00:18,  2.88it/s][A
Epoch 3/5:  98%|█████████▊| 2157/2208 [12:55<00:18,  2.82it/s][A
Epoch 3/5:  98%|█████████▊| 2158/2208 [12:55<00:18,  2.77it/s][A
Epoch 3/5:  98%|█████████▊| 2159/2208 [12:56<00:17,  2.75it/s][A
Epoch 3/5:  98%|█████████▊| 2160/2208 [12:56<00:17,  2.80it/s][A
Epoch 3/5:  98%|█████████▊| 2161/2208 [12:56<00:17,  2.75it/s][A
Epoch 3/5:  98%|█████████▊| 2162/2208 [12:57<00:16,  2.80it/s][A
Epoch 3/5:  98%|█████████▊| 2163/2208 [12:57<00:16,  2.80it/s][A
Epoch 3/5:  98%|█████████▊| 2164/2208 [12:57<00:15,  2.84it/s][A
Epoch 3/5:  98%|█████████▊| 2165/2208 [12:58<00:15,  2.84it/s][A
Epoch 3/5:  98%|█████████▊| 2166/2208 [12:58<00:15,  2.76it/s][A
Epoch 3/5

Batch 2175: Training accuracy = 0.8516, F1 = 0.8427, Precision = 0.8490, Recall = 0.8516



Epoch 3/5:  99%|█████████▊| 2177/2208 [13:02<00:11,  2.73it/s][A
Epoch 3/5:  99%|█████████▊| 2178/2208 [13:03<00:10,  2.78it/s][A
Epoch 3/5:  99%|█████████▊| 2179/2208 [13:03<00:10,  2.80it/s][A
Epoch 3/5:  99%|█████████▊| 2180/2208 [13:03<00:09,  2.84it/s][A
Epoch 3/5:  99%|█████████▉| 2181/2208 [13:04<00:09,  2.86it/s][A
Epoch 3/5:  99%|█████████▉| 2182/2208 [13:04<00:09,  2.86it/s][A
Epoch 3/5:  99%|█████████▉| 2183/2208 [13:04<00:08,  2.87it/s][A
Epoch 3/5:  99%|█████████▉| 2184/2208 [13:05<00:08,  2.88it/s][A
Epoch 3/5:  99%|█████████▉| 2185/2208 [13:05<00:07,  2.90it/s][A
Epoch 3/5:  99%|█████████▉| 2186/2208 [13:05<00:07,  2.92it/s][A
Epoch 3/5:  99%|█████████▉| 2187/2208 [13:06<00:07,  2.85it/s][A
Epoch 3/5:  99%|█████████▉| 2188/2208 [13:06<00:07,  2.82it/s][A
Epoch 3/5:  99%|█████████▉| 2189/2208 [13:06<00:06,  2.79it/s][A
Epoch 3/5:  99%|█████████▉| 2190/2208 [13:07<00:06,  2.82it/s][A
Epoch 3/5:  99%|█████████▉| 2191/2208 [13:07<00:06,  2.80it/s][A
Epoch 3/5

Batch 2200: Training accuracy = 0.8516, F1 = 0.8315, Precision = 0.8444, Recall = 0.8516



Epoch 3/5: 100%|█████████▉| 2202/2208 [13:11<00:02,  2.79it/s][A
Epoch 3/5: 100%|█████████▉| 2203/2208 [13:11<00:01,  2.85it/s][A
Epoch 3/5: 100%|█████████▉| 2204/2208 [13:12<00:01,  2.89it/s][A
Epoch 3/5: 100%|█████████▉| 2205/2208 [13:12<00:01,  2.91it/s][A
Epoch 3/5: 100%|█████████▉| 2206/2208 [13:12<00:00,  2.91it/s][A
Epoch 3/5: 100%|█████████▉| 2207/2208 [13:13<00:00,  2.92it/s][A
Epoch 3/5: 100%|██████████| 2208/2208 [13:13<00:00,  2.90it/s][A
                                                              [A


Epoch 3 training accuracy: 0.86%
Epoch 3 training F1 score: 0.8656
Epoch 3 training precision: 0.8749
Epoch 3 training recall: 0.8601

Starting validation...



Validation:   0%|          | 0/552 [00:00<?, ?it/s][A
Validation:   0%|          | 1/552 [00:01<15:38,  1.70s/it][A
Validation:   1%|          | 4/552 [00:01<03:12,  2.85it/s][A
Validation:   1%|          | 6/552 [00:02<02:20,  3.90it/s][A
Validation:   2%|▏         | 9/552 [00:02<01:22,  6.56it/s][A
Validation:   2%|▏         | 11/552 [00:02<01:13,  7.37it/s][A
Validation:   2%|▏         | 13/552 [00:02<00:59,  9.02it/s][A
Validation:   3%|▎         | 15/552 [00:02<01:00,  8.85it/s][A
Validation:   3%|▎         | 17/552 [00:02<00:53, 10.03it/s][A
Validation:   3%|▎         | 19/552 [00:03<00:51, 10.35it/s][A
Validation:   4%|▍         | 21/552 [00:03<00:53,  9.99it/s][A
Validation:   4%|▍         | 23/552 [00:03<00:58,  8.98it/s][A
Validation:   5%|▍         | 25/552 [00:03<00:49, 10.70it/s][A
Validation:   5%|▍         | 27/552 [00:03<00:55,  9.42it/s][A
Validation:   5%|▌         | 30/552 [00:04<00:44, 11.71it/s][A
Validation:   6%|▌         | 32/552 [00:04<00:42, 12

Validation accuracy: 0.74%
Validation F1 score: 0.7492
Validation precision: 0.8140
Validation recall: 0.7438

Starting epoch 4/5



  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))

Epoch 4/5:   0%|          | 1/2208 [00:02<1:28:44,  2.41s/it][A

Batch 0: Training accuracy = 0.8984, F1 = 0.8919, Precision = 0.8932, Recall = 0.8984



Epoch 4/5:   0%|          | 2/2208 [00:02<43:57,  1.20s/it]  [A
Epoch 4/5:   0%|          | 3/2208 [00:03<30:09,  1.22it/s][A
Epoch 4/5:   0%|          | 4/2208 [00:03<23:21,  1.57it/s][A
Epoch 4/5:   0%|          | 5/2208 [00:03<19:27,  1.89it/s][A
Epoch 4/5:   0%|          | 6/2208 [00:04<17:21,  2.11it/s][A
Epoch 4/5:   0%|          | 7/2208 [00:04<15:44,  2.33it/s][A
Epoch 4/5:   0%|          | 8/2208 [00:04<14:42,  2.49it/s][A
Epoch 4/5:   0%|          | 9/2208 [00:05<13:58,  2.62it/s][A
Epoch 4/5:   0%|          | 10/2208 [00:05<13:32,  2.71it/s][A
Epoch 4/5:   0%|          | 11/2208 [00:05<13:18,  2.75it/s][A
Epoch 4/5:   1%|          | 12/2208 [00:06<13:13,  2.77it/s][A
Epoch 4/5:   1%|          | 13/2208 [00:06<13:21,  2.74it/s][A
Epoch 4/5:   1%|          | 14/2208 [00:07<13:31,  2.70it/s][A
Epoch 4/5:   1%|          | 15/2208 [00:07<13:13,  2.76it/s][A
Epoch 4/5:   1%|          | 16/2208 [00:07<13:27,  2.72it/s][A
Epoch 4/5:   1%|          | 17/2208 [00:08<13

Batch 25: Training accuracy = 0.8906, F1 = 0.8906, Precision = 0.9023, Recall = 0.8906



Epoch 4/5:   1%|          | 27/2208 [00:11<13:04,  2.78it/s][A
Epoch 4/5:   1%|▏         | 28/2208 [00:12<12:54,  2.82it/s][A
Epoch 4/5:   1%|▏         | 29/2208 [00:12<12:56,  2.81it/s][A
Epoch 4/5:   1%|▏         | 30/2208 [00:12<12:47,  2.84it/s][A
Epoch 4/5:   1%|▏         | 31/2208 [00:13<12:39,  2.87it/s][A
Epoch 4/5:   1%|▏         | 32/2208 [00:13<12:32,  2.89it/s][A
Epoch 4/5:   1%|▏         | 33/2208 [00:13<12:30,  2.90it/s][A
Epoch 4/5:   2%|▏         | 34/2208 [00:14<12:37,  2.87it/s][A
Epoch 4/5:   2%|▏         | 35/2208 [00:14<12:31,  2.89it/s][A
Epoch 4/5:   2%|▏         | 36/2208 [00:14<12:50,  2.82it/s][A
Epoch 4/5:   2%|▏         | 37/2208 [00:15<12:40,  2.86it/s][A
Epoch 4/5:   2%|▏         | 38/2208 [00:15<12:39,  2.86it/s][A
Epoch 4/5:   2%|▏         | 39/2208 [00:15<12:33,  2.88it/s][A
Epoch 4/5:   2%|▏         | 40/2208 [00:16<12:45,  2.83it/s][A
Epoch 4/5:   2%|▏         | 41/2208 [00:16<12:35,  2.87it/s][A
Epoch 4/5:   2%|▏         | 42/2208 [00

Batch 50: Training accuracy = 0.8828, F1 = 0.8682, Precision = 0.8672, Recall = 0.8828



Epoch 4/5:   2%|▏         | 52/2208 [00:20<13:00,  2.76it/s][A
Epoch 4/5:   2%|▏         | 53/2208 [00:20<13:23,  2.68it/s][A
Epoch 4/5:   2%|▏         | 54/2208 [00:21<13:12,  2.72it/s][A
Epoch 4/5:   2%|▏         | 55/2208 [00:21<13:04,  2.75it/s][A
Epoch 4/5:   3%|▎         | 56/2208 [00:22<12:54,  2.78it/s][A
Epoch 4/5:   3%|▎         | 57/2208 [00:22<13:00,  2.76it/s][A
Epoch 4/5:   3%|▎         | 58/2208 [00:22<12:58,  2.76it/s][A
Epoch 4/5:   3%|▎         | 59/2208 [00:23<13:10,  2.72it/s][A
Epoch 4/5:   3%|▎         | 60/2208 [00:23<13:16,  2.70it/s][A
Epoch 4/5:   3%|▎         | 61/2208 [00:23<13:19,  2.68it/s][A
Epoch 4/5:   3%|▎         | 62/2208 [00:24<13:28,  2.66it/s][A
Epoch 4/5:   3%|▎         | 63/2208 [00:24<13:08,  2.72it/s][A
Epoch 4/5:   3%|▎         | 64/2208 [00:24<13:05,  2.73it/s][A
Epoch 4/5:   3%|▎         | 65/2208 [00:25<12:48,  2.79it/s][A
Epoch 4/5:   3%|▎         | 66/2208 [00:25<12:46,  2.79it/s][A
Epoch 4/5:   3%|▎         | 67/2208 [00

Batch 75: Training accuracy = 0.8438, F1 = 0.8365, Precision = 0.8529, Recall = 0.8438



Epoch 4/5:   3%|▎         | 77/2208 [00:29<12:39,  2.81it/s][A
Epoch 4/5:   4%|▎         | 78/2208 [00:29<12:45,  2.78it/s][A
Epoch 4/5:   4%|▎         | 79/2208 [00:30<12:47,  2.77it/s][A
Epoch 4/5:   4%|▎         | 80/2208 [00:30<12:36,  2.81it/s][A
Epoch 4/5:   4%|▎         | 81/2208 [00:31<12:42,  2.79it/s][A
Epoch 4/5:   4%|▎         | 82/2208 [00:31<12:49,  2.76it/s][A
Epoch 4/5:   4%|▍         | 83/2208 [00:31<12:36,  2.81it/s][A
Epoch 4/5:   4%|▍         | 84/2208 [00:32<12:30,  2.83it/s][A
Epoch 4/5:   4%|▍         | 85/2208 [00:32<12:28,  2.84it/s][A
Epoch 4/5:   4%|▍         | 86/2208 [00:32<12:20,  2.87it/s][A
Epoch 4/5:   4%|▍         | 87/2208 [00:33<12:15,  2.88it/s][A
Epoch 4/5:   4%|▍         | 88/2208 [00:33<12:19,  2.87it/s][A
Epoch 4/5:   4%|▍         | 89/2208 [00:33<12:21,  2.86it/s][A
Epoch 4/5:   4%|▍         | 90/2208 [00:34<12:25,  2.84it/s][A
Epoch 4/5:   4%|▍         | 91/2208 [00:34<12:21,  2.86it/s][A
Epoch 4/5:   4%|▍         | 92/2208 [00

Batch 100: Training accuracy = 0.8906, F1 = 0.8802, Precision = 0.8874, Recall = 0.8906



Epoch 4/5:   5%|▍         | 102/2208 [00:38<12:44,  2.76it/s][A
Epoch 4/5:   5%|▍         | 103/2208 [00:38<12:44,  2.75it/s][A
Epoch 4/5:   5%|▍         | 104/2208 [00:39<12:43,  2.76it/s][A
Epoch 4/5:   5%|▍         | 105/2208 [00:39<12:56,  2.71it/s][A
Epoch 4/5:   5%|▍         | 106/2208 [00:39<12:44,  2.75it/s][A
Epoch 4/5:   5%|▍         | 107/2208 [00:40<12:43,  2.75it/s][A
Epoch 4/5:   5%|▍         | 108/2208 [00:40<12:48,  2.73it/s][A
Epoch 4/5:   5%|▍         | 109/2208 [00:41<12:31,  2.79it/s][A
Epoch 4/5:   5%|▍         | 110/2208 [00:41<12:21,  2.83it/s][A
Epoch 4/5:   5%|▌         | 111/2208 [00:41<12:12,  2.86it/s][A
Epoch 4/5:   5%|▌         | 112/2208 [00:42<12:12,  2.86it/s][A
Epoch 4/5:   5%|▌         | 113/2208 [00:42<12:07,  2.88it/s][A
Epoch 4/5:   5%|▌         | 114/2208 [00:42<12:00,  2.91it/s][A
Epoch 4/5:   5%|▌         | 115/2208 [00:43<12:05,  2.89it/s][A
Epoch 4/5:   5%|▌         | 116/2208 [00:43<12:18,  2.83it/s][A
Epoch 4/5:   5%|▌       

Batch 125: Training accuracy = 0.8672, F1 = 0.8516, Precision = 0.8555, Recall = 0.8672



Epoch 4/5:   6%|▌         | 127/2208 [00:47<12:36,  2.75it/s][A
Epoch 4/5:   6%|▌         | 128/2208 [00:47<12:34,  2.76it/s][A
Epoch 4/5:   6%|▌         | 129/2208 [00:48<12:24,  2.79it/s][A
Epoch 4/5:   6%|▌         | 130/2208 [00:48<12:56,  2.68it/s][A
Epoch 4/5:   6%|▌         | 131/2208 [00:48<12:58,  2.67it/s][A
Epoch 4/5:   6%|▌         | 132/2208 [00:49<12:38,  2.74it/s][A
Epoch 4/5:   6%|▌         | 133/2208 [00:49<12:25,  2.78it/s][A
Epoch 4/5:   6%|▌         | 134/2208 [00:50<12:48,  2.70it/s][A
Epoch 4/5:   6%|▌         | 135/2208 [00:50<12:28,  2.77it/s][A
Epoch 4/5:   6%|▌         | 136/2208 [00:50<12:38,  2.73it/s][A
Epoch 4/5:   6%|▌         | 137/2208 [00:51<12:28,  2.77it/s][A
Epoch 4/5:   6%|▋         | 138/2208 [00:51<12:31,  2.76it/s][A
Epoch 4/5:   6%|▋         | 139/2208 [00:51<13:02,  2.64it/s][A
Epoch 4/5:   6%|▋         | 140/2208 [00:52<12:52,  2.68it/s][A
Epoch 4/5:   6%|▋         | 141/2208 [00:52<12:50,  2.68it/s][A
Epoch 4/5:   6%|▋       

Batch 150: Training accuracy = 0.9062, F1 = 0.8964, Precision = 0.8984, Recall = 0.9062



Epoch 4/5:   7%|▋         | 152/2208 [00:56<12:31,  2.74it/s][A
Epoch 4/5:   7%|▋         | 153/2208 [00:57<12:12,  2.80it/s][A
Epoch 4/5:   7%|▋         | 154/2208 [00:57<12:04,  2.84it/s][A
Epoch 4/5:   7%|▋         | 155/2208 [00:57<12:02,  2.84it/s][A
Epoch 4/5:   7%|▋         | 156/2208 [00:58<12:00,  2.85it/s][A
Epoch 4/5:   7%|▋         | 157/2208 [00:58<12:01,  2.84it/s][A
Epoch 4/5:   7%|▋         | 158/2208 [00:58<12:21,  2.77it/s][A
Epoch 4/5:   7%|▋         | 159/2208 [00:59<12:06,  2.82it/s][A
Epoch 4/5:   7%|▋         | 160/2208 [00:59<11:57,  2.85it/s][A
Epoch 4/5:   7%|▋         | 161/2208 [00:59<12:13,  2.79it/s][A
Epoch 4/5:   7%|▋         | 162/2208 [01:00<12:01,  2.84it/s][A
Epoch 4/5:   7%|▋         | 163/2208 [01:00<12:10,  2.80it/s][A
Epoch 4/5:   7%|▋         | 164/2208 [01:00<12:03,  2.83it/s][A
Epoch 4/5:   7%|▋         | 165/2208 [01:01<12:03,  2.82it/s][A
Epoch 4/5:   8%|▊         | 166/2208 [01:01<12:24,  2.74it/s][A
Epoch 4/5:   8%|▊       

Batch 175: Training accuracy = 0.8750, F1 = 0.8708, Precision = 0.8867, Recall = 0.8750



Epoch 4/5:   8%|▊         | 177/2208 [01:05<12:37,  2.68it/s][A
Epoch 4/5:   8%|▊         | 178/2208 [01:06<12:40,  2.67it/s][A
Epoch 4/5:   8%|▊         | 179/2208 [01:06<12:22,  2.73it/s][A
Epoch 4/5:   8%|▊         | 180/2208 [01:06<12:27,  2.71it/s][A
Epoch 4/5:   8%|▊         | 181/2208 [01:07<12:25,  2.72it/s][A
Epoch 4/5:   8%|▊         | 182/2208 [01:07<12:08,  2.78it/s][A
Epoch 4/5:   8%|▊         | 183/2208 [01:07<12:03,  2.80it/s][A
Epoch 4/5:   8%|▊         | 184/2208 [01:08<12:44,  2.65it/s][A
Epoch 4/5:   8%|▊         | 185/2208 [01:08<12:36,  2.68it/s][A
Epoch 4/5:   8%|▊         | 186/2208 [01:08<12:32,  2.69it/s][A
Epoch 4/5:   8%|▊         | 187/2208 [01:09<12:25,  2.71it/s][A
Epoch 4/5:   9%|▊         | 188/2208 [01:09<12:29,  2.70it/s][A
Epoch 4/5:   9%|▊         | 189/2208 [01:10<12:14,  2.75it/s][A
Epoch 4/5:   9%|▊         | 190/2208 [01:10<11:58,  2.81it/s][A
Epoch 4/5:   9%|▊         | 191/2208 [01:10<12:10,  2.76it/s][A
Epoch 4/5:   9%|▊       

Batch 200: Training accuracy = 0.8828, F1 = 0.8737, Precision = 0.8737, Recall = 0.8828



Epoch 4/5:   9%|▉         | 202/2208 [01:14<11:57,  2.80it/s][A
Epoch 4/5:   9%|▉         | 203/2208 [01:15<11:48,  2.83it/s][A
Epoch 4/5:   9%|▉         | 204/2208 [01:15<11:38,  2.87it/s][A
Epoch 4/5:   9%|▉         | 205/2208 [01:15<11:32,  2.89it/s][A
Epoch 4/5:   9%|▉         | 206/2208 [01:16<11:34,  2.88it/s][A
Epoch 4/5:   9%|▉         | 207/2208 [01:16<11:47,  2.83it/s][A
Epoch 4/5:   9%|▉         | 208/2208 [01:16<11:47,  2.83it/s][A
Epoch 4/5:   9%|▉         | 209/2208 [01:17<11:40,  2.85it/s][A
Epoch 4/5:  10%|▉         | 210/2208 [01:17<11:47,  2.82it/s][A
Epoch 4/5:  10%|▉         | 211/2208 [01:17<11:39,  2.85it/s][A
Epoch 4/5:  10%|▉         | 212/2208 [01:18<11:52,  2.80it/s][A
Epoch 4/5:  10%|▉         | 213/2208 [01:18<11:40,  2.85it/s][A
Epoch 4/5:  10%|▉         | 214/2208 [01:18<11:32,  2.88it/s][A
Epoch 4/5:  10%|▉         | 215/2208 [01:19<11:30,  2.88it/s][A
Epoch 4/5:  10%|▉         | 216/2208 [01:19<11:38,  2.85it/s][A
Epoch 4/5:  10%|▉       

Batch 225: Training accuracy = 0.8516, F1 = 0.8427, Precision = 0.8451, Recall = 0.8516



Epoch 4/5:  10%|█         | 227/2208 [01:23<12:02,  2.74it/s][A
Epoch 4/5:  10%|█         | 228/2208 [01:23<12:11,  2.71it/s][A
Epoch 4/5:  10%|█         | 229/2208 [01:24<11:56,  2.76it/s][A
Epoch 4/5:  10%|█         | 230/2208 [01:24<11:42,  2.82it/s][A
Epoch 4/5:  10%|█         | 231/2208 [01:24<11:49,  2.79it/s][A
Epoch 4/5:  11%|█         | 232/2208 [01:25<11:39,  2.82it/s][A
Epoch 4/5:  11%|█         | 233/2208 [01:25<11:39,  2.82it/s][A
Epoch 4/5:  11%|█         | 234/2208 [01:25<11:29,  2.86it/s][A
Epoch 4/5:  11%|█         | 235/2208 [01:26<11:22,  2.89it/s][A
Epoch 4/5:  11%|█         | 236/2208 [01:26<11:34,  2.84it/s][A
Epoch 4/5:  11%|█         | 237/2208 [01:27<11:26,  2.87it/s][A
Epoch 4/5:  11%|█         | 238/2208 [01:27<11:20,  2.90it/s][A
Epoch 4/5:  11%|█         | 239/2208 [01:27<11:22,  2.88it/s][A
Epoch 4/5:  11%|█         | 240/2208 [01:28<11:22,  2.88it/s][A
Epoch 4/5:  11%|█         | 241/2208 [01:28<11:36,  2.82it/s][A
Epoch 4/5:  11%|█       

Batch 250: Training accuracy = 0.8047, F1 = 0.8016, Precision = 0.8073, Recall = 0.8047



Epoch 4/5:  11%|█▏        | 252/2208 [01:32<11:38,  2.80it/s][A
Epoch 4/5:  11%|█▏        | 253/2208 [01:32<11:30,  2.83it/s][A
Epoch 4/5:  12%|█▏        | 254/2208 [01:33<11:22,  2.86it/s][A
Epoch 4/5:  12%|█▏        | 255/2208 [01:33<11:28,  2.84it/s][A
Epoch 4/5:  12%|█▏        | 256/2208 [01:33<11:27,  2.84it/s][A
Epoch 4/5:  12%|█▏        | 257/2208 [01:34<11:28,  2.83it/s][A
Epoch 4/5:  12%|█▏        | 258/2208 [01:34<11:40,  2.78it/s][A
Epoch 4/5:  12%|█▏        | 259/2208 [01:34<11:37,  2.80it/s][A
Epoch 4/5:  12%|█▏        | 260/2208 [01:35<11:27,  2.83it/s][A
Epoch 4/5:  12%|█▏        | 261/2208 [01:35<11:37,  2.79it/s][A
Epoch 4/5:  12%|█▏        | 262/2208 [01:35<11:42,  2.77it/s][A
Epoch 4/5:  12%|█▏        | 263/2208 [01:36<11:42,  2.77it/s][A
Epoch 4/5:  12%|█▏        | 264/2208 [01:36<11:29,  2.82it/s][A
Epoch 4/5:  12%|█▏        | 265/2208 [01:37<11:31,  2.81it/s][A
Epoch 4/5:  12%|█▏        | 266/2208 [01:37<11:25,  2.83it/s][A
Epoch 4/5:  12%|█▏      

Batch 275: Training accuracy = 0.9141, F1 = 0.8993, Precision = 0.8978, Recall = 0.9141



Epoch 4/5:  13%|█▎        | 277/2208 [01:41<11:31,  2.79it/s][A
Epoch 4/5:  13%|█▎        | 278/2208 [01:41<11:27,  2.81it/s][A
Epoch 4/5:  13%|█▎        | 279/2208 [01:42<11:19,  2.84it/s][A
Epoch 4/5:  13%|█▎        | 280/2208 [01:42<11:14,  2.86it/s][A
Epoch 4/5:  13%|█▎        | 281/2208 [01:42<11:21,  2.83it/s][A
Epoch 4/5:  13%|█▎        | 282/2208 [01:43<11:15,  2.85it/s][A
Epoch 4/5:  13%|█▎        | 283/2208 [01:43<11:10,  2.87it/s][A
Epoch 4/5:  13%|█▎        | 284/2208 [01:43<11:15,  2.85it/s][A
Epoch 4/5:  13%|█▎        | 285/2208 [01:44<11:27,  2.80it/s][A
Epoch 4/5:  13%|█▎        | 286/2208 [01:44<11:19,  2.83it/s][A
Epoch 4/5:  13%|█▎        | 287/2208 [01:44<11:14,  2.85it/s][A
Epoch 4/5:  13%|█▎        | 288/2208 [01:45<11:16,  2.84it/s][A
Epoch 4/5:  13%|█▎        | 289/2208 [01:45<11:12,  2.85it/s][A
Epoch 4/5:  13%|█▎        | 290/2208 [01:45<11:35,  2.76it/s][A
Epoch 4/5:  13%|█▎        | 291/2208 [01:46<11:33,  2.76it/s][A
Epoch 4/5:  13%|█▎      

Batch 300: Training accuracy = 0.8359, F1 = 0.8289, Precision = 0.8359, Recall = 0.8359



Epoch 4/5:  14%|█▎        | 302/2208 [01:50<11:22,  2.79it/s][A
Epoch 4/5:  14%|█▎        | 303/2208 [01:50<11:14,  2.83it/s][A
Epoch 4/5:  14%|█▍        | 304/2208 [01:50<11:41,  2.71it/s][A
Epoch 4/5:  14%|█▍        | 305/2208 [01:51<12:12,  2.60it/s][A
Epoch 4/5:  14%|█▍        | 306/2208 [01:51<11:57,  2.65it/s][A
Epoch 4/5:  14%|█▍        | 307/2208 [01:52<11:53,  2.66it/s][A
Epoch 4/5:  14%|█▍        | 308/2208 [01:52<12:14,  2.59it/s][A
Epoch 4/5:  14%|█▍        | 309/2208 [01:52<11:56,  2.65it/s][A
Epoch 4/5:  14%|█▍        | 310/2208 [01:53<11:53,  2.66it/s][A
Epoch 4/5:  14%|█▍        | 311/2208 [01:53<11:50,  2.67it/s][A
Epoch 4/5:  14%|█▍        | 312/2208 [01:53<11:31,  2.74it/s][A
Epoch 4/5:  14%|█▍        | 313/2208 [01:54<11:17,  2.80it/s][A
Epoch 4/5:  14%|█▍        | 314/2208 [01:54<11:26,  2.76it/s][A
Epoch 4/5:  14%|█▍        | 315/2208 [01:55<11:20,  2.78it/s][A
Epoch 4/5:  14%|█▍        | 316/2208 [01:55<11:32,  2.73it/s][A
Epoch 4/5:  14%|█▍      

Batch 325: Training accuracy = 0.7969, F1 = 0.7885, Precision = 0.7962, Recall = 0.7969



Epoch 4/5:  15%|█▍        | 327/2208 [01:59<11:12,  2.80it/s][A
Epoch 4/5:  15%|█▍        | 328/2208 [01:59<11:02,  2.84it/s][A
Epoch 4/5:  15%|█▍        | 329/2208 [01:59<11:21,  2.76it/s][A
Epoch 4/5:  15%|█▍        | 330/2208 [02:00<11:07,  2.81it/s][A
Epoch 4/5:  15%|█▍        | 331/2208 [02:00<11:04,  2.82it/s][A
Epoch 4/5:  15%|█▌        | 332/2208 [02:01<10:55,  2.86it/s][A
Epoch 4/5:  15%|█▌        | 333/2208 [02:01<10:50,  2.88it/s][A
Epoch 4/5:  15%|█▌        | 334/2208 [02:01<11:01,  2.83it/s][A
Epoch 4/5:  15%|█▌        | 335/2208 [02:02<11:11,  2.79it/s][A
Epoch 4/5:  15%|█▌        | 336/2208 [02:02<11:27,  2.72it/s][A
Epoch 4/5:  15%|█▌        | 337/2208 [02:02<11:35,  2.69it/s][A
Epoch 4/5:  15%|█▌        | 338/2208 [02:03<11:21,  2.74it/s][A
Epoch 4/5:  15%|█▌        | 339/2208 [02:03<11:14,  2.77it/s][A
Epoch 4/5:  15%|█▌        | 340/2208 [02:03<11:05,  2.81it/s][A
Epoch 4/5:  15%|█▌        | 341/2208 [02:04<11:06,  2.80it/s][A
Epoch 4/5:  15%|█▌      

Batch 350: Training accuracy = 0.8359, F1 = 0.8224, Precision = 0.8275, Recall = 0.8359



Epoch 4/5:  16%|█▌        | 352/2208 [02:08<11:08,  2.78it/s][A
Epoch 4/5:  16%|█▌        | 353/2208 [02:08<10:59,  2.81it/s][A
Epoch 4/5:  16%|█▌        | 354/2208 [02:08<10:53,  2.84it/s][A
Epoch 4/5:  16%|█▌        | 355/2208 [02:09<11:04,  2.79it/s][A
Epoch 4/5:  16%|█▌        | 356/2208 [02:09<11:16,  2.74it/s][A
Epoch 4/5:  16%|█▌        | 357/2208 [02:10<11:00,  2.80it/s][A
Epoch 4/5:  16%|█▌        | 358/2208 [02:10<11:02,  2.79it/s][A
Epoch 4/5:  16%|█▋        | 359/2208 [02:10<11:02,  2.79it/s][A
Epoch 4/5:  16%|█▋        | 360/2208 [02:11<10:56,  2.82it/s][A
Epoch 4/5:  16%|█▋        | 361/2208 [02:11<11:05,  2.78it/s][A
Epoch 4/5:  16%|█▋        | 362/2208 [02:11<11:06,  2.77it/s][A
Epoch 4/5:  16%|█▋        | 363/2208 [02:12<11:06,  2.77it/s][A
Epoch 4/5:  16%|█▋        | 364/2208 [02:12<10:54,  2.82it/s][A
Epoch 4/5:  17%|█▋        | 365/2208 [02:12<11:04,  2.77it/s][A
Epoch 4/5:  17%|█▋        | 366/2208 [02:13<11:03,  2.78it/s][A
Epoch 4/5:  17%|█▋      

Batch 375: Training accuracy = 0.8750, F1 = 0.8679, Precision = 0.8772, Recall = 0.8750



Epoch 4/5:  17%|█▋        | 377/2208 [02:17<11:15,  2.71it/s][A
Epoch 4/5:  17%|█▋        | 378/2208 [02:17<11:00,  2.77it/s][A
Epoch 4/5:  17%|█▋        | 379/2208 [02:17<10:51,  2.81it/s][A
Epoch 4/5:  17%|█▋        | 380/2208 [02:18<10:50,  2.81it/s][A
Epoch 4/5:  17%|█▋        | 381/2208 [02:18<10:42,  2.84it/s][A
Epoch 4/5:  17%|█▋        | 382/2208 [02:19<11:02,  2.76it/s][A
Epoch 4/5:  17%|█▋        | 383/2208 [02:19<11:20,  2.68it/s][A
Epoch 4/5:  17%|█▋        | 384/2208 [02:19<11:19,  2.69it/s][A
Epoch 4/5:  17%|█▋        | 385/2208 [02:20<11:27,  2.65it/s][A
Epoch 4/5:  17%|█▋        | 386/2208 [02:20<11:18,  2.69it/s][A
Epoch 4/5:  18%|█▊        | 387/2208 [02:20<11:07,  2.73it/s][A
Epoch 4/5:  18%|█▊        | 388/2208 [02:21<11:04,  2.74it/s][A
Epoch 4/5:  18%|█▊        | 389/2208 [02:21<11:11,  2.71it/s][A
Epoch 4/5:  18%|█▊        | 390/2208 [02:22<11:12,  2.70it/s][A
Epoch 4/5:  18%|█▊        | 391/2208 [02:22<11:24,  2.66it/s][A
Epoch 4/5:  18%|█▊      

Batch 400: Training accuracy = 0.9219, F1 = 0.9070, Precision = 0.9036, Recall = 0.9219



Epoch 4/5:  18%|█▊        | 402/2208 [02:26<10:42,  2.81it/s][A
Epoch 4/5:  18%|█▊        | 403/2208 [02:26<11:04,  2.72it/s][A
Epoch 4/5:  18%|█▊        | 404/2208 [02:27<10:54,  2.76it/s][A
Epoch 4/5:  18%|█▊        | 405/2208 [02:27<10:43,  2.80it/s][A
Epoch 4/5:  18%|█▊        | 406/2208 [02:27<10:54,  2.75it/s][A
Epoch 4/5:  18%|█▊        | 407/2208 [02:28<10:55,  2.75it/s][A
Epoch 4/5:  18%|█▊        | 408/2208 [02:28<11:10,  2.68it/s][A
Epoch 4/5:  19%|█▊        | 409/2208 [02:28<11:05,  2.70it/s][A
Epoch 4/5:  19%|█▊        | 410/2208 [02:29<11:03,  2.71it/s][A
Epoch 4/5:  19%|█▊        | 411/2208 [02:29<11:05,  2.70it/s][A
Epoch 4/5:  19%|█▊        | 412/2208 [02:30<10:51,  2.76it/s][A
Epoch 4/5:  19%|█▊        | 413/2208 [02:30<10:37,  2.81it/s][A
Epoch 4/5:  19%|█▉        | 414/2208 [02:30<10:39,  2.80it/s][A
Epoch 4/5:  19%|█▉        | 415/2208 [02:31<10:31,  2.84it/s][A
Epoch 4/5:  19%|█▉        | 416/2208 [02:31<10:23,  2.88it/s][A
Epoch 4/5:  19%|█▉      

Batch 425: Training accuracy = 0.8828, F1 = 0.8717, Precision = 0.8770, Recall = 0.8828



Epoch 4/5:  19%|█▉        | 427/2208 [02:35<10:45,  2.76it/s][A
Epoch 4/5:  19%|█▉        | 428/2208 [02:35<10:54,  2.72it/s][A
Epoch 4/5:  19%|█▉        | 429/2208 [02:36<10:40,  2.78it/s][A
Epoch 4/5:  19%|█▉        | 430/2208 [02:36<10:51,  2.73it/s][A
Epoch 4/5:  20%|█▉        | 431/2208 [02:36<10:48,  2.74it/s][A
Epoch 4/5:  20%|█▉        | 432/2208 [02:37<10:48,  2.74it/s][A
Epoch 4/5:  20%|█▉        | 433/2208 [02:37<11:16,  2.62it/s][A
Epoch 4/5:  20%|█▉        | 434/2208 [02:37<10:56,  2.70it/s][A
Epoch 4/5:  20%|█▉        | 435/2208 [02:38<10:42,  2.76it/s][A
Epoch 4/5:  20%|█▉        | 436/2208 [02:38<10:54,  2.71it/s][A
Epoch 4/5:  20%|█▉        | 437/2208 [02:38<10:39,  2.77it/s][A
Epoch 4/5:  20%|█▉        | 438/2208 [02:39<10:31,  2.80it/s][A
Epoch 4/5:  20%|█▉        | 439/2208 [02:39<10:22,  2.84it/s][A
Epoch 4/5:  20%|█▉        | 440/2208 [02:40<10:15,  2.87it/s][A
Epoch 4/5:  20%|█▉        | 441/2208 [02:40<10:10,  2.89it/s][A
Epoch 4/5:  20%|██      

Batch 450: Training accuracy = 0.8750, F1 = 0.8776, Precision = 0.8945, Recall = 0.8750



Epoch 4/5:  20%|██        | 452/2208 [02:44<10:43,  2.73it/s][A
Epoch 4/5:  21%|██        | 453/2208 [02:44<10:36,  2.76it/s][A
Epoch 4/5:  21%|██        | 454/2208 [02:45<10:24,  2.81it/s][A
Epoch 4/5:  21%|██        | 455/2208 [02:45<10:15,  2.85it/s][A
Epoch 4/5:  21%|██        | 456/2208 [02:45<10:12,  2.86it/s][A
Epoch 4/5:  21%|██        | 457/2208 [02:46<10:08,  2.88it/s][A
Epoch 4/5:  21%|██        | 458/2208 [02:46<10:05,  2.89it/s][A
Epoch 4/5:  21%|██        | 459/2208 [02:46<10:14,  2.85it/s][A
Epoch 4/5:  21%|██        | 460/2208 [02:47<10:13,  2.85it/s][A
Epoch 4/5:  21%|██        | 461/2208 [02:47<10:11,  2.86it/s][A
Epoch 4/5:  21%|██        | 462/2208 [02:47<10:13,  2.85it/s][A
Epoch 4/5:  21%|██        | 463/2208 [02:48<10:42,  2.72it/s][A
Epoch 4/5:  21%|██        | 464/2208 [02:48<10:28,  2.78it/s][A
Epoch 4/5:  21%|██        | 465/2208 [02:48<10:18,  2.82it/s][A
Epoch 4/5:  21%|██        | 466/2208 [02:49<10:26,  2.78it/s][A
Epoch 4/5:  21%|██      

Batch 475: Training accuracy = 0.8750, F1 = 0.8591, Precision = 0.8565, Recall = 0.8750



Epoch 4/5:  22%|██▏       | 477/2208 [02:53<10:20,  2.79it/s][A
Epoch 4/5:  22%|██▏       | 478/2208 [02:53<10:14,  2.81it/s][A
Epoch 4/5:  22%|██▏       | 479/2208 [02:53<10:14,  2.81it/s][A
Epoch 4/5:  22%|██▏       | 480/2208 [02:54<10:18,  2.79it/s][A
Epoch 4/5:  22%|██▏       | 481/2208 [02:54<10:27,  2.75it/s][A
Epoch 4/5:  22%|██▏       | 482/2208 [02:55<10:15,  2.81it/s][A
Epoch 4/5:  22%|██▏       | 483/2208 [02:55<10:16,  2.80it/s][A
Epoch 4/5:  22%|██▏       | 484/2208 [02:55<10:23,  2.76it/s][A
Epoch 4/5:  22%|██▏       | 485/2208 [02:56<10:14,  2.81it/s][A
Epoch 4/5:  22%|██▏       | 486/2208 [02:56<10:13,  2.81it/s][A
Epoch 4/5:  22%|██▏       | 489/2208 [02:57<10:05,  2.84it/s][A
Epoch 4/5:  22%|██▏       | 490/2208 [02:57<10:07,  2.83it/s][A
Epoch 4/5:  22%|██▏       | 491/2208 [02:58<10:18,  2.78it/s][A
Epoch 4/5:  22%|██▏       | 492/2208 [02:58<10:26,  2.74it/s][A
Epoch 4/5:  22%|██▏       | 493/2208 [02:58<10:30,  2.72it/s][A
Epoch 4/5:  22%|██▏     

Batch 500: Training accuracy = 0.8125, F1 = 0.8049, Precision = 0.8268, Recall = 0.8125



Epoch 4/5:  23%|██▎       | 502/2208 [03:02<10:23,  2.74it/s][A
Epoch 4/5:  23%|██▎       | 503/2208 [03:02<10:33,  2.69it/s][A
Epoch 4/5:  23%|██▎       | 504/2208 [03:02<10:25,  2.73it/s][A
Epoch 4/5:  23%|██▎       | 505/2208 [03:03<10:24,  2.73it/s][A
Epoch 4/5:  23%|██▎       | 506/2208 [03:03<10:10,  2.79it/s][A
Epoch 4/5:  23%|██▎       | 507/2208 [03:04<10:21,  2.74it/s][A
Epoch 4/5:  23%|██▎       | 508/2208 [03:04<10:22,  2.73it/s][A
Epoch 4/5:  23%|██▎       | 509/2208 [03:04<10:18,  2.75it/s][A
Epoch 4/5:  23%|██▎       | 510/2208 [03:05<10:15,  2.76it/s][A
Epoch 4/5:  23%|██▎       | 511/2208 [03:05<10:26,  2.71it/s][A
Epoch 4/5:  23%|██▎       | 512/2208 [03:05<10:26,  2.71it/s][A
Epoch 4/5:  23%|██▎       | 513/2208 [03:06<10:26,  2.71it/s][A
Epoch 4/5:  23%|██▎       | 514/2208 [03:06<10:12,  2.77it/s][A
Epoch 4/5:  23%|██▎       | 515/2208 [03:06<10:04,  2.80it/s][A
Epoch 4/5:  23%|██▎       | 516/2208 [03:07<10:02,  2.81it/s][A
Epoch 4/5:  23%|██▎     

Batch 525: Training accuracy = 0.8672, F1 = 0.8717, Precision = 0.8956, Recall = 0.8672



Epoch 4/5:  24%|██▍       | 527/2208 [03:11<09:49,  2.85it/s][A
Epoch 4/5:  24%|██▍       | 528/2208 [03:11<09:43,  2.88it/s][A
Epoch 4/5:  24%|██▍       | 529/2208 [03:11<09:44,  2.87it/s][A
Epoch 4/5:  24%|██▍       | 530/2208 [03:12<09:38,  2.90it/s][A
Epoch 4/5:  24%|██▍       | 531/2208 [03:12<09:39,  2.89it/s][A
Epoch 4/5:  24%|██▍       | 532/2208 [03:12<09:36,  2.91it/s][A
Epoch 4/5:  24%|██▍       | 533/2208 [03:13<09:42,  2.88it/s][A
Epoch 4/5:  24%|██▍       | 534/2208 [03:13<09:42,  2.87it/s][A
Epoch 4/5:  24%|██▍       | 535/2208 [03:13<09:48,  2.84it/s][A
Epoch 4/5:  24%|██▍       | 536/2208 [03:14<09:56,  2.80it/s][A
Epoch 4/5:  24%|██▍       | 537/2208 [03:14<09:51,  2.82it/s][A
Epoch 4/5:  24%|██▍       | 538/2208 [03:14<09:52,  2.82it/s][A
Epoch 4/5:  24%|██▍       | 539/2208 [03:15<09:43,  2.86it/s][A
Epoch 4/5:  24%|██▍       | 540/2208 [03:15<09:43,  2.86it/s][A
Epoch 4/5:  25%|██▍       | 541/2208 [03:16<09:37,  2.89it/s][A
Epoch 4/5:  25%|██▍     

Batch 550: Training accuracy = 0.8047, F1 = 0.7917, Precision = 0.8001, Recall = 0.8047



Epoch 4/5:  25%|██▌       | 552/2208 [03:19<10:05,  2.73it/s][A
Epoch 4/5:  25%|██▌       | 553/2208 [03:20<10:21,  2.66it/s][A
Epoch 4/5:  25%|██▌       | 554/2208 [03:20<10:21,  2.66it/s][A
Epoch 4/5:  25%|██▌       | 555/2208 [03:21<10:37,  2.59it/s][A
Epoch 4/5:  25%|██▌       | 556/2208 [03:21<10:26,  2.64it/s][A
Epoch 4/5:  25%|██▌       | 557/2208 [03:21<10:17,  2.67it/s][A
Epoch 4/5:  25%|██▌       | 558/2208 [03:22<10:12,  2.70it/s][A
Epoch 4/5:  25%|██▌       | 559/2208 [03:22<10:05,  2.72it/s][A
Epoch 4/5:  25%|██▌       | 560/2208 [03:22<10:01,  2.74it/s][A
Epoch 4/5:  25%|██▌       | 561/2208 [03:23<10:03,  2.73it/s][A
Epoch 4/5:  25%|██▌       | 562/2208 [03:23<09:52,  2.78it/s][A
Epoch 4/5:  25%|██▌       | 563/2208 [03:24<09:42,  2.82it/s][A
Epoch 4/5:  26%|██▌       | 564/2208 [03:24<09:34,  2.86it/s][A
Epoch 4/5:  26%|██▌       | 565/2208 [03:24<09:43,  2.82it/s][A
Epoch 4/5:  26%|██▌       | 566/2208 [03:25<09:39,  2.83it/s][A
Epoch 4/5:  26%|██▌     

Batch 575: Training accuracy = 0.8438, F1 = 0.8432, Precision = 0.8542, Recall = 0.8438



Epoch 4/5:  26%|██▌       | 577/2208 [03:28<09:38,  2.82it/s][A
Epoch 4/5:  26%|██▌       | 578/2208 [03:29<09:41,  2.80it/s][A
Epoch 4/5:  26%|██▌       | 579/2208 [03:29<09:55,  2.73it/s][A
Epoch 4/5:  26%|██▋       | 580/2208 [03:30<09:59,  2.72it/s][A
Epoch 4/5:  26%|██▋       | 581/2208 [03:30<09:57,  2.72it/s][A
Epoch 4/5:  26%|██▋       | 582/2208 [03:30<09:43,  2.79it/s][A
Epoch 4/5:  26%|██▋       | 583/2208 [03:31<09:44,  2.78it/s][A
Epoch 4/5:  26%|██▋       | 584/2208 [03:31<09:50,  2.75it/s][A
Epoch 4/5:  26%|██▋       | 585/2208 [03:31<09:39,  2.80it/s][A
Epoch 4/5:  27%|██▋       | 586/2208 [03:32<09:37,  2.81it/s][A
Epoch 4/5:  27%|██▋       | 587/2208 [03:32<09:47,  2.76it/s][A
Epoch 4/5:  27%|██▋       | 588/2208 [03:32<09:43,  2.78it/s][A
Epoch 4/5:  27%|██▋       | 589/2208 [03:33<09:34,  2.82it/s][A
Epoch 4/5:  27%|██▋       | 590/2208 [03:33<09:44,  2.77it/s][A
Epoch 4/5:  27%|██▋       | 591/2208 [03:33<09:35,  2.81it/s][A
Epoch 4/5:  27%|██▋     

Batch 600: Training accuracy = 0.8281, F1 = 0.8065, Precision = 0.8034, Recall = 0.8281



Epoch 4/5:  27%|██▋       | 602/2208 [03:37<09:36,  2.79it/s][A
Epoch 4/5:  27%|██▋       | 603/2208 [03:38<09:27,  2.83it/s][A
Epoch 4/5:  27%|██▋       | 604/2208 [03:38<09:29,  2.82it/s][A
Epoch 4/5:  27%|██▋       | 605/2208 [03:39<09:32,  2.80it/s][A
Epoch 4/5:  27%|██▋       | 606/2208 [03:39<09:24,  2.84it/s][A
Epoch 4/5:  27%|██▋       | 607/2208 [03:39<09:27,  2.82it/s][A
Epoch 4/5:  28%|██▊       | 608/2208 [03:40<09:20,  2.85it/s][A
Epoch 4/5:  28%|██▊       | 609/2208 [03:40<09:21,  2.85it/s][A
Epoch 4/5:  28%|██▊       | 610/2208 [03:40<09:21,  2.85it/s][A
Epoch 4/5:  28%|██▊       | 611/2208 [03:41<09:32,  2.79it/s][A
Epoch 4/5:  28%|██▊       | 612/2208 [03:41<09:25,  2.82it/s][A
Epoch 4/5:  28%|██▊       | 613/2208 [03:41<09:20,  2.85it/s][A
Epoch 4/5:  28%|██▊       | 614/2208 [03:42<09:16,  2.87it/s][A
Epoch 4/5:  28%|██▊       | 615/2208 [03:42<09:18,  2.85it/s][A
Epoch 4/5:  28%|██▊       | 616/2208 [03:42<09:20,  2.84it/s][A
Epoch 4/5:  28%|██▊     

Batch 625: Training accuracy = 0.8828, F1 = 0.8737, Precision = 0.8753, Recall = 0.8828



Epoch 4/5:  28%|██▊       | 627/2208 [03:46<09:40,  2.72it/s][A
Epoch 4/5:  28%|██▊       | 628/2208 [03:47<09:30,  2.77it/s][A
Epoch 4/5:  28%|██▊       | 629/2208 [03:47<09:22,  2.81it/s][A
Epoch 4/5:  29%|██▊       | 630/2208 [03:47<09:14,  2.85it/s][A
Epoch 4/5:  29%|██▊       | 631/2208 [03:48<09:10,  2.87it/s][A
Epoch 4/5:  29%|██▊       | 632/2208 [03:48<09:21,  2.81it/s][A
Epoch 4/5:  29%|██▊       | 633/2208 [03:48<09:25,  2.78it/s][A
Epoch 4/5:  29%|██▊       | 634/2208 [03:49<09:20,  2.81it/s][A
Epoch 4/5:  29%|██▉       | 635/2208 [03:49<09:31,  2.75it/s][A
Epoch 4/5:  29%|██▉       | 636/2208 [03:50<09:33,  2.74it/s][A
Epoch 4/5:  29%|██▉       | 637/2208 [03:50<09:34,  2.73it/s][A
Epoch 4/5:  29%|██▉       | 638/2208 [03:50<09:37,  2.72it/s][A
Epoch 4/5:  29%|██▉       | 639/2208 [03:51<09:35,  2.73it/s][A
Epoch 4/5:  29%|██▉       | 640/2208 [03:51<09:26,  2.77it/s][A
Epoch 4/5:  29%|██▉       | 641/2208 [03:51<09:16,  2.82it/s][A
Epoch 4/5:  29%|██▉     

Batch 650: Training accuracy = 0.8828, F1 = 0.8732, Precision = 0.8789, Recall = 0.8828



Epoch 4/5:  30%|██▉       | 652/2208 [03:55<09:23,  2.76it/s][A
Epoch 4/5:  30%|██▉       | 653/2208 [03:56<09:12,  2.82it/s][A
Epoch 4/5:  30%|██▉       | 654/2208 [03:56<09:17,  2.78it/s][A
Epoch 4/5:  30%|██▉       | 655/2208 [03:56<09:25,  2.74it/s][A
Epoch 4/5:  30%|██▉       | 656/2208 [03:57<09:19,  2.78it/s][A
Epoch 4/5:  30%|██▉       | 657/2208 [03:57<09:19,  2.77it/s][A
Epoch 4/5:  30%|██▉       | 658/2208 [03:57<09:13,  2.80it/s][A
Epoch 4/5:  30%|██▉       | 659/2208 [03:58<09:11,  2.81it/s][A
Epoch 4/5:  30%|██▉       | 660/2208 [03:58<09:20,  2.76it/s][A
Epoch 4/5:  30%|██▉       | 661/2208 [03:59<09:22,  2.75it/s][A
Epoch 4/5:  30%|██▉       | 662/2208 [03:59<09:27,  2.72it/s][A
Epoch 4/5:  30%|███       | 663/2208 [03:59<09:15,  2.78it/s][A
Epoch 4/5:  30%|███       | 664/2208 [04:00<09:27,  2.72it/s][A
Epoch 4/5:  30%|███       | 665/2208 [04:00<09:16,  2.77it/s][A
Epoch 4/5:  30%|███       | 666/2208 [04:00<09:14,  2.78it/s][A
Epoch 4/5:  30%|███     

Batch 675: Training accuracy = 0.8594, F1 = 0.8484, Precision = 0.8451, Recall = 0.8594



Epoch 4/5:  31%|███       | 677/2208 [04:04<09:24,  2.71it/s][A
Epoch 4/5:  31%|███       | 678/2208 [04:05<09:11,  2.78it/s][A
Epoch 4/5:  31%|███       | 679/2208 [04:05<09:01,  2.82it/s][A
Epoch 4/5:  31%|███       | 680/2208 [04:05<09:04,  2.81it/s][A
Epoch 4/5:  31%|███       | 681/2208 [04:06<09:09,  2.78it/s][A
Epoch 4/5:  31%|███       | 682/2208 [04:06<09:02,  2.81it/s][A
Epoch 4/5:  31%|███       | 683/2208 [04:06<09:08,  2.78it/s][A
Epoch 4/5:  31%|███       | 684/2208 [04:07<08:58,  2.83it/s][A
Epoch 4/5:  31%|███       | 685/2208 [04:07<08:51,  2.86it/s][A
Epoch 4/5:  31%|███       | 686/2208 [04:08<08:54,  2.85it/s][A
Epoch 4/5:  31%|███       | 687/2208 [04:08<09:02,  2.80it/s][A
Epoch 4/5:  31%|███       | 688/2208 [04:08<08:59,  2.82it/s][A
Epoch 4/5:  31%|███       | 689/2208 [04:09<08:51,  2.86it/s][A
Epoch 4/5:  31%|███▏      | 690/2208 [04:09<08:48,  2.87it/s][A
Epoch 4/5:  31%|███▏      | 691/2208 [04:09<08:58,  2.82it/s][A
Epoch 4/5:  31%|███▏    

Batch 700: Training accuracy = 0.8203, F1 = 0.8107, Precision = 0.8164, Recall = 0.8203



Epoch 4/5:  32%|███▏      | 702/2208 [04:13<09:13,  2.72it/s][A
Epoch 4/5:  32%|███▏      | 703/2208 [04:14<09:13,  2.72it/s][A
Epoch 4/5:  32%|███▏      | 704/2208 [04:14<09:14,  2.71it/s][A
Epoch 4/5:  32%|███▏      | 705/2208 [04:14<09:00,  2.78it/s][A
Epoch 4/5:  32%|███▏      | 706/2208 [04:15<08:57,  2.79it/s][A
Epoch 4/5:  32%|███▏      | 707/2208 [04:15<08:49,  2.83it/s][A
Epoch 4/5:  32%|███▏      | 708/2208 [04:15<08:54,  2.81it/s][A
Epoch 4/5:  32%|███▏      | 709/2208 [04:16<08:57,  2.79it/s][A
Epoch 4/5:  32%|███▏      | 710/2208 [04:16<09:07,  2.73it/s][A
Epoch 4/5:  32%|███▏      | 711/2208 [04:17<09:10,  2.72it/s][A
Epoch 4/5:  32%|███▏      | 712/2208 [04:17<09:00,  2.77it/s][A
Epoch 4/5:  32%|███▏      | 713/2208 [04:17<08:50,  2.82it/s][A
Epoch 4/5:  32%|███▏      | 714/2208 [04:18<08:42,  2.86it/s][A
Epoch 4/5:  32%|███▏      | 715/2208 [04:18<08:39,  2.87it/s][A
Epoch 4/5:  32%|███▏      | 716/2208 [04:18<08:35,  2.90it/s][A
Epoch 4/5:  32%|███▏    

Batch 725: Training accuracy = 0.8750, F1 = 0.8698, Precision = 0.8789, Recall = 0.8750



Epoch 4/5:  33%|███▎      | 727/2208 [04:22<08:41,  2.84it/s][A
Epoch 4/5:  33%|███▎      | 728/2208 [04:23<08:47,  2.81it/s][A
Epoch 4/5:  33%|███▎      | 729/2208 [04:23<08:37,  2.86it/s][A
Epoch 4/5:  33%|███▎      | 730/2208 [04:23<08:35,  2.87it/s][A
Epoch 4/5:  33%|███▎      | 731/2208 [04:24<08:31,  2.89it/s][A
Epoch 4/5:  33%|███▎      | 732/2208 [04:24<08:28,  2.90it/s][A
Epoch 4/5:  33%|███▎      | 733/2208 [04:24<08:32,  2.88it/s][A
Epoch 4/5:  33%|███▎      | 734/2208 [04:25<08:34,  2.86it/s][A
Epoch 4/5:  33%|███▎      | 735/2208 [04:25<08:43,  2.81it/s][A
Epoch 4/5:  33%|███▎      | 736/2208 [04:25<08:49,  2.78it/s][A
Epoch 4/5:  33%|███▎      | 737/2208 [04:26<08:50,  2.77it/s][A
Epoch 4/5:  33%|███▎      | 738/2208 [04:26<08:44,  2.80it/s][A
Epoch 4/5:  33%|███▎      | 739/2208 [04:26<08:40,  2.82it/s][A
Epoch 4/5:  34%|███▎      | 740/2208 [04:27<08:34,  2.85it/s][A
Epoch 4/5:  34%|███▎      | 741/2208 [04:27<08:34,  2.85it/s][A
Epoch 4/5:  34%|███▎    

Batch 750: Training accuracy = 0.7812, F1 = 0.7686, Precision = 0.7764, Recall = 0.7812



Epoch 4/5:  34%|███▍      | 752/2208 [04:31<08:50,  2.75it/s][A
Epoch 4/5:  34%|███▍      | 753/2208 [04:31<08:53,  2.73it/s][A
Epoch 4/5:  34%|███▍      | 754/2208 [04:32<08:47,  2.76it/s][A
Epoch 4/5:  34%|███▍      | 755/2208 [04:32<08:38,  2.80it/s][A
Epoch 4/5:  34%|███▍      | 756/2208 [04:32<08:45,  2.76it/s][A
Epoch 4/5:  34%|███▍      | 757/2208 [04:33<08:48,  2.74it/s][A
Epoch 4/5:  34%|███▍      | 758/2208 [04:33<08:50,  2.73it/s][A
Epoch 4/5:  34%|███▍      | 759/2208 [04:34<08:47,  2.75it/s][A
Epoch 4/5:  34%|███▍      | 760/2208 [04:34<08:54,  2.71it/s][A
Epoch 4/5:  34%|███▍      | 761/2208 [04:34<08:59,  2.68it/s][A
Epoch 4/5:  35%|███▍      | 762/2208 [04:35<08:53,  2.71it/s][A
Epoch 4/5:  35%|███▍      | 763/2208 [04:35<08:53,  2.71it/s][A
Epoch 4/5:  35%|███▍      | 764/2208 [04:35<08:40,  2.77it/s][A
Epoch 4/5:  35%|███▍      | 765/2208 [04:36<08:40,  2.77it/s][A
Epoch 4/5:  35%|███▍      | 766/2208 [04:36<08:35,  2.80it/s][A
Epoch 4/5:  35%|███▍    

Batch 775: Training accuracy = 0.8828, F1 = 0.8609, Precision = 0.8490, Recall = 0.8828



Epoch 4/5:  35%|███▌      | 777/2208 [04:40<08:27,  2.82it/s][A
Epoch 4/5:  35%|███▌      | 778/2208 [04:40<08:22,  2.85it/s][A
Epoch 4/5:  35%|███▌      | 779/2208 [04:41<08:16,  2.88it/s][A
Epoch 4/5:  35%|███▌      | 780/2208 [04:41<08:16,  2.87it/s][A
Epoch 4/5:  35%|███▌      | 781/2208 [04:41<08:13,  2.89it/s][A
Epoch 4/5:  35%|███▌      | 782/2208 [04:42<08:11,  2.90it/s][A
Epoch 4/5:  35%|███▌      | 783/2208 [04:42<08:12,  2.89it/s][A
Epoch 4/5:  36%|███▌      | 784/2208 [04:42<08:29,  2.79it/s][A
Epoch 4/5:  36%|███▌      | 785/2208 [04:43<08:30,  2.79it/s][A
Epoch 4/5:  36%|███▌      | 786/2208 [04:43<08:27,  2.80it/s][A
Epoch 4/5:  36%|███▌      | 787/2208 [04:43<08:19,  2.84it/s][A
Epoch 4/5:  36%|███▌      | 788/2208 [04:44<08:16,  2.86it/s][A
Epoch 4/5:  36%|███▌      | 789/2208 [04:44<08:14,  2.87it/s][A
Epoch 4/5:  36%|███▌      | 790/2208 [04:45<08:12,  2.88it/s][A
Epoch 4/5:  36%|███▌      | 791/2208 [04:45<08:11,  2.88it/s][A
Epoch 4/5:  36%|███▌    

Batch 800: Training accuracy = 0.8984, F1 = 0.8886, Precision = 0.8878, Recall = 0.8984



Epoch 4/5:  36%|███▋      | 802/2208 [04:49<08:39,  2.71it/s][A
Epoch 4/5:  36%|███▋      | 803/2208 [04:49<08:29,  2.76it/s][A
Epoch 4/5:  36%|███▋      | 804/2208 [04:50<08:18,  2.82it/s][A
Epoch 4/5:  36%|███▋      | 805/2208 [04:50<08:12,  2.85it/s][A
Epoch 4/5:  37%|███▋      | 806/2208 [04:50<08:10,  2.86it/s][A
Epoch 4/5:  37%|███▋      | 807/2208 [04:51<08:11,  2.85it/s][A
Epoch 4/5:  37%|███▋      | 808/2208 [04:51<08:15,  2.83it/s][A
Epoch 4/5:  37%|███▋      | 809/2208 [04:51<08:22,  2.78it/s][A
Epoch 4/5:  37%|███▋      | 810/2208 [04:52<08:18,  2.80it/s][A
Epoch 4/5:  37%|███▋      | 811/2208 [04:52<08:17,  2.81it/s][A
Epoch 4/5:  37%|███▋      | 812/2208 [04:52<08:22,  2.78it/s][A
Epoch 4/5:  37%|███▋      | 813/2208 [04:53<08:30,  2.73it/s][A
Epoch 4/5:  37%|███▋      | 814/2208 [04:53<08:42,  2.67it/s][A
Epoch 4/5:  37%|███▋      | 815/2208 [04:54<08:47,  2.64it/s][A
Epoch 4/5:  37%|███▋      | 816/2208 [04:54<08:29,  2.73it/s][A
Epoch 4/5:  37%|███▋    

Batch 825: Training accuracy = 0.8516, F1 = 0.8414, Precision = 0.8490, Recall = 0.8516



Epoch 4/5:  37%|███▋      | 827/2208 [04:58<08:02,  2.86it/s][A
Epoch 4/5:  38%|███▊      | 828/2208 [04:58<07:57,  2.89it/s][A
Epoch 4/5:  38%|███▊      | 829/2208 [04:58<08:02,  2.86it/s][A
Epoch 4/5:  38%|███▊      | 830/2208 [04:59<07:59,  2.88it/s][A
Epoch 4/5:  38%|███▊      | 831/2208 [04:59<07:55,  2.89it/s][A
Epoch 4/5:  38%|███▊      | 832/2208 [04:59<08:03,  2.85it/s][A
Epoch 4/5:  38%|███▊      | 833/2208 [05:00<08:04,  2.84it/s][A
Epoch 4/5:  38%|███▊      | 834/2208 [05:00<08:07,  2.82it/s][A
Epoch 4/5:  38%|███▊      | 835/2208 [05:01<08:15,  2.77it/s][A
Epoch 4/5:  38%|███▊      | 836/2208 [05:01<08:12,  2.79it/s][A
Epoch 4/5:  38%|███▊      | 837/2208 [05:01<08:19,  2.75it/s][A
Epoch 4/5:  38%|███▊      | 838/2208 [05:02<08:33,  2.67it/s][A
Epoch 4/5:  38%|███▊      | 839/2208 [05:02<08:34,  2.66it/s][A
Epoch 4/5:  38%|███▊      | 840/2208 [05:02<08:31,  2.67it/s][A
Epoch 4/5:  38%|███▊      | 841/2208 [05:03<08:19,  2.74it/s][A
Epoch 4/5:  38%|███▊    

Batch 850: Training accuracy = 0.8359, F1 = 0.8385, Precision = 0.8542, Recall = 0.8359



Epoch 4/5:  39%|███▊      | 852/2208 [05:07<07:55,  2.85it/s][A
Epoch 4/5:  39%|███▊      | 853/2208 [05:07<07:50,  2.88it/s][A
Epoch 4/5:  39%|███▊      | 854/2208 [05:07<07:51,  2.87it/s][A
Epoch 4/5:  39%|███▊      | 855/2208 [05:08<07:47,  2.89it/s][A
Epoch 4/5:  39%|███▉      | 856/2208 [05:08<07:49,  2.88it/s][A
Epoch 4/5:  39%|███▉      | 857/2208 [05:08<07:46,  2.90it/s][A
Epoch 4/5:  39%|███▉      | 858/2208 [05:09<08:03,  2.79it/s][A
Epoch 4/5:  39%|███▉      | 859/2208 [05:09<07:59,  2.82it/s][A
Epoch 4/5:  39%|███▉      | 860/2208 [05:09<08:05,  2.78it/s][A
Epoch 4/5:  39%|███▉      | 861/2208 [05:10<08:19,  2.70it/s][A
Epoch 4/5:  39%|███▉      | 862/2208 [05:10<08:21,  2.68it/s][A
Epoch 4/5:  39%|███▉      | 863/2208 [05:11<08:20,  2.68it/s][A
Epoch 4/5:  39%|███▉      | 864/2208 [05:11<08:13,  2.73it/s][A
Epoch 4/5:  39%|███▉      | 865/2208 [05:11<08:10,  2.74it/s][A
Epoch 4/5:  39%|███▉      | 866/2208 [05:12<08:13,  2.72it/s][A
Epoch 4/5:  39%|███▉    

Batch 875: Training accuracy = 0.8203, F1 = 0.8130, Precision = 0.8210, Recall = 0.8203



Epoch 4/5:  40%|███▉      | 877/2208 [05:16<08:01,  2.77it/s][A
Epoch 4/5:  40%|███▉      | 878/2208 [05:16<07:58,  2.78it/s][A
Epoch 4/5:  40%|███▉      | 879/2208 [05:16<07:51,  2.82it/s][A
Epoch 4/5:  40%|███▉      | 880/2208 [05:17<07:52,  2.81it/s][A
Epoch 4/5:  40%|███▉      | 881/2208 [05:17<07:54,  2.80it/s][A
Epoch 4/5:  40%|███▉      | 882/2208 [05:17<07:52,  2.81it/s][A
Epoch 4/5:  40%|███▉      | 883/2208 [05:18<07:48,  2.83it/s][A
Epoch 4/5:  40%|████      | 884/2208 [05:18<07:42,  2.86it/s][A
Epoch 4/5:  40%|████      | 885/2208 [05:18<07:49,  2.82it/s][A
Epoch 4/5:  40%|████      | 886/2208 [05:19<07:53,  2.79it/s][A
Epoch 4/5:  40%|████      | 887/2208 [05:19<08:04,  2.73it/s][A
Epoch 4/5:  40%|████      | 888/2208 [05:20<08:10,  2.69it/s][A
Epoch 4/5:  40%|████      | 889/2208 [05:20<08:03,  2.73it/s][A
Epoch 4/5:  40%|████      | 890/2208 [05:20<07:54,  2.78it/s][A
Epoch 4/5:  40%|████      | 891/2208 [05:21<07:50,  2.80it/s][A
Epoch 4/5:  40%|████    

Batch 900: Training accuracy = 0.8438, F1 = 0.8458, Precision = 0.8620, Recall = 0.8438



Epoch 4/5:  41%|████      | 902/2208 [05:25<07:59,  2.72it/s][A
Epoch 4/5:  41%|████      | 903/2208 [05:25<08:01,  2.71it/s][A
Epoch 4/5:  41%|████      | 904/2208 [05:25<07:51,  2.77it/s][A
Epoch 4/5:  41%|████      | 905/2208 [05:26<07:45,  2.80it/s][A
Epoch 4/5:  41%|████      | 906/2208 [05:26<07:48,  2.78it/s][A
Epoch 4/5:  41%|████      | 907/2208 [05:26<07:59,  2.71it/s][A
Epoch 4/5:  41%|████      | 908/2208 [05:27<07:57,  2.72it/s][A
Epoch 4/5:  41%|████      | 909/2208 [05:27<07:50,  2.76it/s][A
Epoch 4/5:  41%|████      | 910/2208 [05:27<07:53,  2.74it/s][A
Epoch 4/5:  41%|████▏     | 911/2208 [05:28<07:46,  2.78it/s][A
Epoch 4/5:  41%|████▏     | 912/2208 [05:28<07:45,  2.78it/s][A
Epoch 4/5:  41%|████▏     | 913/2208 [05:29<07:46,  2.77it/s][A
Epoch 4/5:  41%|████▏     | 914/2208 [05:29<07:50,  2.75it/s][A
Epoch 4/5:  41%|████▏     | 915/2208 [05:29<07:49,  2.75it/s][A
Epoch 4/5:  41%|████▏     | 916/2208 [05:30<07:43,  2.79it/s][A
Epoch 4/5:  42%|████▏   

Batch 925: Training accuracy = 0.8594, F1 = 0.8458, Precision = 0.8464, Recall = 0.8594



Epoch 4/5:  42%|████▏     | 927/2208 [05:34<07:43,  2.77it/s][A
Epoch 4/5:  42%|████▏     | 928/2208 [05:34<07:41,  2.78it/s][A
Epoch 4/5:  42%|████▏     | 929/2208 [05:34<07:34,  2.81it/s][A
Epoch 4/5:  42%|████▏     | 930/2208 [05:35<07:40,  2.77it/s][A
Epoch 4/5:  42%|████▏     | 931/2208 [05:35<07:50,  2.71it/s][A
Epoch 4/5:  42%|████▏     | 932/2208 [05:35<07:39,  2.78it/s][A
Epoch 4/5:  42%|████▏     | 933/2208 [05:36<07:38,  2.78it/s][A
Epoch 4/5:  42%|████▏     | 934/2208 [05:36<07:40,  2.77it/s][A
Epoch 4/5:  42%|████▏     | 935/2208 [05:37<07:38,  2.77it/s][A
Epoch 4/5:  42%|████▏     | 936/2208 [05:37<07:33,  2.80it/s][A
Epoch 4/5:  42%|████▏     | 937/2208 [05:37<07:34,  2.80it/s][A
Epoch 4/5:  42%|████▏     | 938/2208 [05:38<07:27,  2.84it/s][A
Epoch 4/5:  43%|████▎     | 939/2208 [05:38<07:29,  2.82it/s][A
Epoch 4/5:  43%|████▎     | 940/2208 [05:38<07:27,  2.83it/s][A
Epoch 4/5:  43%|████▎     | 941/2208 [05:39<07:28,  2.83it/s][A
Epoch 4/5:  43%|████▎   

Batch 950: Training accuracy = 0.8672, F1 = 0.8570, Precision = 0.8672, Recall = 0.8672



Epoch 4/5:  43%|████▎     | 952/2208 [05:43<07:48,  2.68it/s][A
Epoch 4/5:  43%|████▎     | 953/2208 [05:43<08:02,  2.60it/s][A
Epoch 4/5:  43%|████▎     | 954/2208 [05:43<07:46,  2.69it/s][A
Epoch 4/5:  43%|████▎     | 955/2208 [05:44<07:34,  2.76it/s][A
Epoch 4/5:  43%|████▎     | 956/2208 [05:44<07:29,  2.78it/s][A
Epoch 4/5:  43%|████▎     | 957/2208 [05:44<07:25,  2.81it/s][A
Epoch 4/5:  43%|████▎     | 958/2208 [05:45<07:34,  2.75it/s][A
Epoch 4/5:  43%|████▎     | 959/2208 [05:45<07:39,  2.72it/s][A
Epoch 4/5:  43%|████▎     | 960/2208 [05:46<07:56,  2.62it/s][A
Epoch 4/5:  44%|████▎     | 961/2208 [05:46<07:56,  2.62it/s][A
Epoch 4/5:  44%|████▎     | 962/2208 [05:46<07:50,  2.65it/s][A
Epoch 4/5:  44%|████▎     | 963/2208 [05:47<07:38,  2.72it/s][A
Epoch 4/5:  44%|████▎     | 964/2208 [05:47<07:31,  2.75it/s][A
Epoch 4/5:  44%|████▎     | 965/2208 [05:47<07:24,  2.80it/s][A
Epoch 4/5:  44%|████▍     | 966/2208 [05:48<07:18,  2.83it/s][A
Epoch 4/5:  44%|████▍   

Batch 975: Training accuracy = 0.8516, F1 = 0.8354, Precision = 0.8346, Recall = 0.8516



Epoch 4/5:  44%|████▍     | 977/2208 [05:52<07:14,  2.83it/s][A
Epoch 4/5:  44%|████▍     | 978/2208 [05:52<07:10,  2.86it/s][A
Epoch 4/5:  44%|████▍     | 979/2208 [05:52<07:17,  2.81it/s][A
Epoch 4/5:  44%|████▍     | 980/2208 [05:53<07:12,  2.84it/s][A
Epoch 4/5:  44%|████▍     | 981/2208 [05:53<07:08,  2.87it/s][A
Epoch 4/5:  44%|████▍     | 982/2208 [05:53<07:09,  2.85it/s][A
Epoch 4/5:  45%|████▍     | 983/2208 [05:54<07:07,  2.86it/s][A
Epoch 4/5:  45%|████▍     | 984/2208 [05:54<07:04,  2.88it/s][A
Epoch 4/5:  45%|████▍     | 985/2208 [05:54<07:07,  2.86it/s][A
Epoch 4/5:  45%|████▍     | 986/2208 [05:55<07:15,  2.80it/s][A
Epoch 4/5:  45%|████▍     | 987/2208 [05:55<07:16,  2.80it/s][A
Epoch 4/5:  45%|████▍     | 988/2208 [05:55<07:23,  2.75it/s][A
Epoch 4/5:  45%|████▍     | 989/2208 [05:56<07:16,  2.79it/s][A
Epoch 4/5:  45%|████▍     | 990/2208 [05:56<07:11,  2.82it/s][A
Epoch 4/5:  45%|████▍     | 991/2208 [05:57<07:16,  2.79it/s][A
Epoch 4/5:  45%|████▍   

Batch 1000: Training accuracy = 0.8281, F1 = 0.8214, Precision = 0.8444, Recall = 0.8281



Epoch 4/5:  45%|████▌     | 1002/2208 [06:01<07:17,  2.76it/s][A
Epoch 4/5:  45%|████▌     | 1003/2208 [06:01<07:07,  2.82it/s][A
Epoch 4/5:  45%|████▌     | 1004/2208 [06:01<07:10,  2.80it/s][A
Epoch 4/5:  46%|████▌     | 1005/2208 [06:02<07:14,  2.77it/s][A
Epoch 4/5:  46%|████▌     | 1006/2208 [06:02<07:05,  2.82it/s][A
Epoch 4/5:  46%|████▌     | 1007/2208 [06:02<07:00,  2.86it/s][A
Epoch 4/5:  46%|████▌     | 1008/2208 [06:03<07:01,  2.84it/s][A
Epoch 4/5:  46%|████▌     | 1009/2208 [06:03<06:57,  2.87it/s][A
Epoch 4/5:  46%|████▌     | 1010/2208 [06:03<06:54,  2.89it/s][A
Epoch 4/5:  46%|████▌     | 1011/2208 [06:04<07:06,  2.81it/s][A
Epoch 4/5:  46%|████▌     | 1012/2208 [06:04<07:03,  2.82it/s][A
Epoch 4/5:  46%|████▌     | 1013/2208 [06:04<07:02,  2.83it/s][A
Epoch 4/5:  46%|████▌     | 1014/2208 [06:05<06:57,  2.86it/s][A
Epoch 4/5:  46%|████▌     | 1015/2208 [06:05<06:52,  2.89it/s][A
Epoch 4/5:  46%|████▌     | 1016/2208 [06:05<06:50,  2.91it/s][A
Epoch 4/5

Batch 1025: Training accuracy = 0.8906, F1 = 0.8732, Precision = 0.8646, Recall = 0.8906



Epoch 4/5:  47%|████▋     | 1027/2208 [06:09<07:07,  2.77it/s][A
Epoch 4/5:  47%|████▋     | 1028/2208 [06:10<07:11,  2.74it/s][A
Epoch 4/5:  47%|████▋     | 1029/2208 [06:10<07:07,  2.76it/s][A
Epoch 4/5:  47%|████▋     | 1030/2208 [06:10<07:06,  2.76it/s][A
Epoch 4/5:  47%|████▋     | 1031/2208 [06:11<07:02,  2.79it/s][A
Epoch 4/5:  47%|████▋     | 1032/2208 [06:11<06:55,  2.83it/s][A
Epoch 4/5:  47%|████▋     | 1033/2208 [06:11<06:57,  2.81it/s][A
Epoch 4/5:  47%|████▋     | 1034/2208 [06:12<06:58,  2.80it/s][A
Epoch 4/5:  47%|████▋     | 1035/2208 [06:12<06:59,  2.80it/s][A
Epoch 4/5:  47%|████▋     | 1036/2208 [06:13<06:55,  2.82it/s][A
Epoch 4/5:  47%|████▋     | 1037/2208 [06:13<06:50,  2.85it/s][A
Epoch 4/5:  47%|████▋     | 1038/2208 [06:13<06:54,  2.83it/s][A
Epoch 4/5:  47%|████▋     | 1039/2208 [06:14<07:00,  2.78it/s][A
Epoch 4/5:  47%|████▋     | 1040/2208 [06:14<06:56,  2.80it/s][A
Epoch 4/5:  47%|████▋     | 1041/2208 [06:14<07:03,  2.76it/s][A
Epoch 4/5

Batch 1050: Training accuracy = 0.8906, F1 = 0.8703, Precision = 0.8652, Recall = 0.8906



Epoch 4/5:  48%|████▊     | 1052/2208 [06:18<06:56,  2.77it/s][A
Epoch 4/5:  48%|████▊     | 1053/2208 [06:19<06:56,  2.77it/s][A
Epoch 4/5:  48%|████▊     | 1054/2208 [06:19<06:53,  2.79it/s][A
Epoch 4/5:  48%|████▊     | 1055/2208 [06:19<06:46,  2.83it/s][A
Epoch 4/5:  48%|████▊     | 1056/2208 [06:20<06:46,  2.84it/s][A
Epoch 4/5:  48%|████▊     | 1057/2208 [06:20<06:47,  2.82it/s][A
Epoch 4/5:  48%|████▊     | 1058/2208 [06:20<06:43,  2.85it/s][A
Epoch 4/5:  48%|████▊     | 1059/2208 [06:21<06:43,  2.85it/s][A
Epoch 4/5:  48%|████▊     | 1060/2208 [06:21<06:44,  2.84it/s][A
Epoch 4/5:  48%|████▊     | 1061/2208 [06:21<06:41,  2.86it/s][A
Epoch 4/5:  48%|████▊     | 1062/2208 [06:22<06:42,  2.85it/s][A
Epoch 4/5:  48%|████▊     | 1063/2208 [06:22<06:45,  2.82it/s][A
Epoch 4/5:  48%|████▊     | 1064/2208 [06:23<06:41,  2.85it/s][A
Epoch 4/5:  48%|████▊     | 1065/2208 [06:23<06:49,  2.79it/s][A
Epoch 4/5:  48%|████▊     | 1066/2208 [06:23<06:59,  2.72it/s][A
Epoch 4/5

Batch 1075: Training accuracy = 0.8672, F1 = 0.8568, Precision = 0.8672, Recall = 0.8672



Epoch 4/5:  49%|████▉     | 1077/2208 [06:27<07:01,  2.68it/s][A
Epoch 4/5:  49%|████▉     | 1078/2208 [06:28<07:08,  2.63it/s][A
Epoch 4/5:  49%|████▉     | 1079/2208 [06:28<07:04,  2.66it/s][A
Epoch 4/5:  49%|████▉     | 1080/2208 [06:28<07:06,  2.65it/s][A
Epoch 4/5:  49%|████▉     | 1081/2208 [06:29<07:09,  2.62it/s][A
Epoch 4/5:  49%|████▉     | 1082/2208 [06:29<07:12,  2.60it/s][A
Epoch 4/5:  49%|████▉     | 1083/2208 [06:30<06:58,  2.69it/s][A
Epoch 4/5:  49%|████▉     | 1084/2208 [06:30<06:48,  2.75it/s][A
Epoch 4/5:  49%|████▉     | 1085/2208 [06:30<06:52,  2.72it/s][A
Epoch 4/5:  49%|████▉     | 1086/2208 [06:31<06:53,  2.71it/s][A
Epoch 4/5:  49%|████▉     | 1087/2208 [06:31<06:52,  2.72it/s][A
Epoch 4/5:  49%|████▉     | 1088/2208 [06:31<06:50,  2.73it/s][A
Epoch 4/5:  49%|████▉     | 1089/2208 [06:32<06:46,  2.75it/s][A
Epoch 4/5:  49%|████▉     | 1090/2208 [06:32<06:42,  2.78it/s][A
Epoch 4/5:  49%|████▉     | 1091/2208 [06:32<06:38,  2.80it/s][A
Epoch 4/5

Batch 1100: Training accuracy = 0.8828, F1 = 0.8737, Precision = 0.8828, Recall = 0.8828



Epoch 4/5:  50%|████▉     | 1102/2208 [06:36<06:34,  2.80it/s][A
Epoch 4/5:  50%|████▉     | 1103/2208 [06:37<06:27,  2.85it/s][A
Epoch 4/5:  50%|█████     | 1104/2208 [06:37<06:27,  2.85it/s][A
Epoch 4/5:  50%|█████     | 1105/2208 [06:37<06:22,  2.88it/s][A
Epoch 4/5:  50%|█████     | 1106/2208 [06:38<06:27,  2.84it/s][A
Epoch 4/5:  50%|█████     | 1107/2208 [06:38<06:27,  2.84it/s][A
Epoch 4/5:  50%|█████     | 1108/2208 [06:39<06:37,  2.76it/s][A
Epoch 4/5:  50%|█████     | 1109/2208 [06:39<06:39,  2.75it/s][A
Epoch 4/5:  50%|█████     | 1110/2208 [06:39<06:33,  2.79it/s][A
Epoch 4/5:  50%|█████     | 1111/2208 [06:40<06:39,  2.74it/s][A
Epoch 4/5:  50%|█████     | 1112/2208 [06:40<06:34,  2.78it/s][A
Epoch 4/5:  50%|█████     | 1113/2208 [06:40<06:28,  2.82it/s][A
Epoch 4/5:  50%|█████     | 1114/2208 [06:41<06:39,  2.74it/s][A
Epoch 4/5:  50%|█████     | 1115/2208 [06:41<06:43,  2.71it/s][A
Epoch 4/5:  51%|█████     | 1116/2208 [06:41<06:37,  2.75it/s][A
Epoch 4/5

Batch 1125: Training accuracy = 0.8359, F1 = 0.8281, Precision = 0.8438, Recall = 0.8359



Epoch 4/5:  51%|█████     | 1127/2208 [06:45<06:46,  2.66it/s][A
Epoch 4/5:  51%|█████     | 1128/2208 [06:46<06:33,  2.75it/s][A
Epoch 4/5:  51%|█████     | 1129/2208 [06:46<06:24,  2.81it/s][A
Epoch 4/5:  51%|█████     | 1130/2208 [06:47<06:30,  2.76it/s][A
Epoch 4/5:  51%|█████     | 1131/2208 [06:47<06:31,  2.75it/s][A
Epoch 4/5:  51%|█████▏    | 1132/2208 [06:47<06:23,  2.80it/s][A
Epoch 4/5:  51%|█████▏    | 1133/2208 [06:48<06:19,  2.84it/s][A
Epoch 4/5:  51%|█████▏    | 1134/2208 [06:48<06:23,  2.80it/s][A
Epoch 4/5:  51%|█████▏    | 1135/2208 [06:48<06:16,  2.85it/s][A
Epoch 4/5:  51%|█████▏    | 1136/2208 [06:49<06:18,  2.83it/s][A
Epoch 4/5:  51%|█████▏    | 1137/2208 [06:49<06:12,  2.87it/s][A
Epoch 4/5:  52%|█████▏    | 1138/2208 [06:49<06:09,  2.89it/s][A
Epoch 4/5:  52%|█████▏    | 1139/2208 [06:50<06:11,  2.87it/s][A
Epoch 4/5:  52%|█████▏    | 1140/2208 [06:50<06:24,  2.78it/s][A
Epoch 4/5:  52%|█████▏    | 1141/2208 [06:50<06:18,  2.82it/s][A
Epoch 4/5

Batch 1150: Training accuracy = 0.8672, F1 = 0.8581, Precision = 0.8646, Recall = 0.8672



Epoch 4/5:  52%|█████▏    | 1152/2208 [06:54<06:18,  2.79it/s][A
Epoch 4/5:  52%|█████▏    | 1153/2208 [06:55<06:12,  2.83it/s][A
Epoch 4/5:  52%|█████▏    | 1154/2208 [06:55<06:14,  2.81it/s][A
Epoch 4/5:  52%|█████▏    | 1155/2208 [06:55<06:08,  2.85it/s][A
Epoch 4/5:  52%|█████▏    | 1156/2208 [06:56<06:05,  2.88it/s][A
Epoch 4/5:  52%|█████▏    | 1157/2208 [06:56<06:06,  2.87it/s][A
Epoch 4/5:  52%|█████▏    | 1158/2208 [06:56<06:14,  2.81it/s][A
Epoch 4/5:  52%|█████▏    | 1159/2208 [06:57<06:16,  2.79it/s][A
Epoch 4/5:  53%|█████▎    | 1160/2208 [06:57<06:20,  2.76it/s][A
Epoch 4/5:  53%|█████▎    | 1161/2208 [06:58<06:16,  2.78it/s][A
Epoch 4/5:  53%|█████▎    | 1162/2208 [06:58<06:12,  2.81it/s][A
Epoch 4/5:  53%|█████▎    | 1163/2208 [06:58<06:10,  2.82it/s][A
Epoch 4/5:  53%|█████▎    | 1164/2208 [06:59<06:09,  2.83it/s][A
Epoch 4/5:  53%|█████▎    | 1165/2208 [06:59<06:06,  2.84it/s][A
Epoch 4/5:  53%|█████▎    | 1166/2208 [06:59<06:18,  2.75it/s][A
Epoch 4/5

Batch 1175: Training accuracy = 0.8906, F1 = 0.8906, Precision = 0.9049, Recall = 0.8906



Epoch 4/5:  53%|█████▎    | 1177/2208 [07:03<06:26,  2.67it/s][A
Epoch 4/5:  53%|█████▎    | 1178/2208 [07:04<06:19,  2.71it/s][A
Epoch 4/5:  53%|█████▎    | 1179/2208 [07:04<06:18,  2.72it/s][A
Epoch 4/5:  53%|█████▎    | 1180/2208 [07:04<06:13,  2.75it/s][A
Epoch 4/5:  53%|█████▎    | 1181/2208 [07:05<06:15,  2.74it/s][A
Epoch 4/5:  54%|█████▎    | 1182/2208 [07:05<06:06,  2.80it/s][A
Epoch 4/5:  54%|█████▎    | 1183/2208 [07:05<06:02,  2.83it/s][A
Epoch 4/5:  54%|█████▎    | 1184/2208 [07:06<05:58,  2.86it/s][A
Epoch 4/5:  54%|█████▎    | 1185/2208 [07:06<06:05,  2.80it/s][A
Epoch 4/5:  54%|█████▎    | 1186/2208 [07:07<06:09,  2.77it/s][A
Epoch 4/5:  54%|█████▍    | 1187/2208 [07:07<06:13,  2.74it/s][A
Epoch 4/5:  54%|█████▍    | 1188/2208 [07:07<06:08,  2.77it/s][A
Epoch 4/5:  54%|█████▍    | 1189/2208 [07:08<06:06,  2.78it/s][A
Epoch 4/5:  54%|█████▍    | 1190/2208 [07:08<06:10,  2.75it/s][A
Epoch 4/5:  54%|█████▍    | 1191/2208 [07:08<06:05,  2.78it/s][A
Epoch 4/5

Batch 1200: Training accuracy = 0.8047, F1 = 0.7944, Precision = 0.8079, Recall = 0.8047



Epoch 4/5:  54%|█████▍    | 1202/2208 [07:12<06:04,  2.76it/s][A
Epoch 4/5:  54%|█████▍    | 1203/2208 [07:13<05:56,  2.82it/s][A
Epoch 4/5:  55%|█████▍    | 1204/2208 [07:13<05:52,  2.85it/s][A
Epoch 4/5:  55%|█████▍    | 1205/2208 [07:13<05:50,  2.86it/s][A
Epoch 4/5:  55%|█████▍    | 1206/2208 [07:14<05:59,  2.78it/s][A
Epoch 4/5:  55%|█████▍    | 1207/2208 [07:14<06:02,  2.76it/s][A
Epoch 4/5:  55%|█████▍    | 1208/2208 [07:14<05:56,  2.80it/s][A
Epoch 4/5:  55%|█████▍    | 1209/2208 [07:15<05:50,  2.85it/s][A
Epoch 4/5:  55%|█████▍    | 1210/2208 [07:15<05:49,  2.86it/s][A
Epoch 4/5:  55%|█████▍    | 1211/2208 [07:15<05:47,  2.87it/s][A
Epoch 4/5:  55%|█████▍    | 1212/2208 [07:16<05:47,  2.87it/s][A
Epoch 4/5:  55%|█████▍    | 1213/2208 [07:16<05:53,  2.81it/s][A
Epoch 4/5:  55%|█████▍    | 1214/2208 [07:16<05:48,  2.85it/s][A
Epoch 4/5:  55%|█████▌    | 1215/2208 [07:17<05:50,  2.84it/s][A
Epoch 4/5:  55%|█████▌    | 1216/2208 [07:17<05:56,  2.78it/s][A
Epoch 4/5

Batch 1225: Training accuracy = 0.9453, F1 = 0.9409, Precision = 0.9427, Recall = 0.9453



Epoch 4/5:  56%|█████▌    | 1227/2208 [07:21<05:57,  2.75it/s][A
Epoch 4/5:  56%|█████▌    | 1228/2208 [07:21<06:00,  2.72it/s][A
Epoch 4/5:  56%|█████▌    | 1229/2208 [07:22<05:52,  2.78it/s][A
Epoch 4/5:  56%|█████▌    | 1230/2208 [07:22<05:49,  2.80it/s][A
Epoch 4/5:  56%|█████▌    | 1231/2208 [07:23<05:51,  2.78it/s][A
Epoch 4/5:  56%|█████▌    | 1232/2208 [07:23<05:48,  2.80it/s][A
Epoch 4/5:  56%|█████▌    | 1233/2208 [07:23<05:47,  2.81it/s][A
Epoch 4/5:  56%|█████▌    | 1234/2208 [07:24<05:41,  2.85it/s][A
Epoch 4/5:  56%|█████▌    | 1235/2208 [07:24<05:38,  2.87it/s][A
Epoch 4/5:  56%|█████▌    | 1236/2208 [07:24<05:40,  2.85it/s][A
Epoch 4/5:  56%|█████▌    | 1237/2208 [07:25<05:37,  2.88it/s][A
Epoch 4/5:  56%|█████▌    | 1238/2208 [07:25<05:34,  2.90it/s][A
Epoch 4/5:  56%|█████▌    | 1239/2208 [07:25<05:41,  2.83it/s][A
Epoch 4/5:  56%|█████▌    | 1240/2208 [07:26<05:40,  2.84it/s][A
Epoch 4/5:  56%|█████▌    | 1241/2208 [07:26<05:38,  2.85it/s][A
Epoch 4/5

Batch 1250: Training accuracy = 0.8672, F1 = 0.8464, Precision = 0.8405, Recall = 0.8672



Epoch 4/5:  57%|█████▋    | 1252/2208 [07:30<05:50,  2.73it/s][A
Epoch 4/5:  57%|█████▋    | 1253/2208 [07:30<05:41,  2.80it/s][A
Epoch 4/5:  57%|█████▋    | 1254/2208 [07:31<05:37,  2.83it/s][A
Epoch 4/5:  57%|█████▋    | 1255/2208 [07:31<05:44,  2.77it/s][A
Epoch 4/5:  57%|█████▋    | 1256/2208 [07:31<05:46,  2.75it/s][A
Epoch 4/5:  57%|█████▋    | 1257/2208 [07:32<05:43,  2.77it/s][A
Epoch 4/5:  57%|█████▋    | 1258/2208 [07:32<05:46,  2.74it/s][A
Epoch 4/5:  57%|█████▋    | 1259/2208 [07:33<05:39,  2.79it/s][A
Epoch 4/5:  57%|█████▋    | 1260/2208 [07:33<05:33,  2.84it/s][A
Epoch 4/5:  57%|█████▋    | 1261/2208 [07:33<05:38,  2.80it/s][A
Epoch 4/5:  57%|█████▋    | 1262/2208 [07:34<05:37,  2.80it/s][A
Epoch 4/5:  57%|█████▋    | 1263/2208 [07:34<05:35,  2.82it/s][A
Epoch 4/5:  57%|█████▋    | 1264/2208 [07:34<05:39,  2.78it/s][A
Epoch 4/5:  57%|█████▋    | 1265/2208 [07:35<05:32,  2.84it/s][A
Epoch 4/5:  57%|█████▋    | 1266/2208 [07:35<05:38,  2.78it/s][A
Epoch 4/5

Batch 1275: Training accuracy = 0.8906, F1 = 0.8828, Precision = 0.8867, Recall = 0.8906



Epoch 4/5:  58%|█████▊    | 1277/2208 [07:39<05:33,  2.79it/s][A
Epoch 4/5:  58%|█████▊    | 1278/2208 [07:39<05:27,  2.84it/s][A
Epoch 4/5:  58%|█████▊    | 1279/2208 [07:40<05:33,  2.79it/s][A
Epoch 4/5:  58%|█████▊    | 1280/2208 [07:40<05:37,  2.75it/s][A
Epoch 4/5:  58%|█████▊    | 1281/2208 [07:40<05:42,  2.70it/s][A
Epoch 4/5:  58%|█████▊    | 1282/2208 [07:41<05:36,  2.75it/s][A
Epoch 4/5:  58%|█████▊    | 1283/2208 [07:41<05:37,  2.74it/s][A
Epoch 4/5:  58%|█████▊    | 1284/2208 [07:41<05:35,  2.75it/s][A
Epoch 4/5:  58%|█████▊    | 1285/2208 [07:42<05:38,  2.73it/s][A
Epoch 4/5:  58%|█████▊    | 1286/2208 [07:42<05:40,  2.71it/s][A
Epoch 4/5:  58%|█████▊    | 1287/2208 [07:43<05:44,  2.68it/s][A
Epoch 4/5:  58%|█████▊    | 1288/2208 [07:43<05:36,  2.73it/s][A
Epoch 4/5:  58%|█████▊    | 1289/2208 [07:43<05:38,  2.72it/s][A
Epoch 4/5:  58%|█████▊    | 1290/2208 [07:44<05:30,  2.78it/s][A
Epoch 4/5:  58%|█████▊    | 1291/2208 [07:44<05:25,  2.82it/s][A
Epoch 4/5

Batch 1300: Training accuracy = 0.8516, F1 = 0.8398, Precision = 0.8464, Recall = 0.8516



Epoch 4/5:  59%|█████▉    | 1302/2208 [07:48<05:24,  2.79it/s][A
Epoch 4/5:  59%|█████▉    | 1303/2208 [07:48<05:18,  2.84it/s][A
Epoch 4/5:  59%|█████▉    | 1304/2208 [07:49<05:21,  2.82it/s][A
Epoch 4/5:  59%|█████▉    | 1305/2208 [07:49<05:19,  2.82it/s][A
Epoch 4/5:  59%|█████▉    | 1306/2208 [07:49<05:28,  2.75it/s][A
Epoch 4/5:  59%|█████▉    | 1307/2208 [07:50<05:20,  2.81it/s][A
Epoch 4/5:  59%|█████▉    | 1308/2208 [07:50<05:18,  2.83it/s][A
Epoch 4/5:  59%|█████▉    | 1309/2208 [07:50<05:13,  2.87it/s][A
Epoch 4/5:  59%|█████▉    | 1310/2208 [07:51<05:10,  2.90it/s][A
Epoch 4/5:  59%|█████▉    | 1311/2208 [07:51<05:08,  2.91it/s][A
Epoch 4/5:  59%|█████▉    | 1312/2208 [07:51<05:06,  2.92it/s][A
Epoch 4/5:  59%|█████▉    | 1313/2208 [07:52<05:07,  2.91it/s][A
Epoch 4/5:  60%|█████▉    | 1314/2208 [07:52<05:15,  2.84it/s][A
Epoch 4/5:  60%|█████▉    | 1315/2208 [07:52<05:16,  2.82it/s][A
Epoch 4/5:  60%|█████▉    | 1316/2208 [07:53<05:15,  2.83it/s][A
Epoch 4/5

Batch 1325: Training accuracy = 0.8828, F1 = 0.8768, Precision = 0.8861, Recall = 0.8828



Epoch 4/5:  60%|██████    | 1327/2208 [07:57<05:23,  2.72it/s][A
Epoch 4/5:  60%|██████    | 1328/2208 [07:57<05:25,  2.70it/s][A
Epoch 4/5:  60%|██████    | 1329/2208 [07:58<05:38,  2.60it/s][A
Epoch 4/5:  60%|██████    | 1330/2208 [07:58<05:35,  2.62it/s][A
Epoch 4/5:  60%|██████    | 1331/2208 [07:58<05:33,  2.63it/s][A
Epoch 4/5:  60%|██████    | 1332/2208 [07:59<05:34,  2.62it/s][A
Epoch 4/5:  60%|██████    | 1333/2208 [07:59<05:32,  2.63it/s][A
Epoch 4/5:  60%|██████    | 1334/2208 [07:59<05:21,  2.71it/s][A
Epoch 4/5:  60%|██████    | 1335/2208 [08:00<05:16,  2.76it/s][A
Epoch 4/5:  61%|██████    | 1336/2208 [08:00<05:09,  2.82it/s][A
Epoch 4/5:  61%|██████    | 1337/2208 [08:00<05:05,  2.85it/s][A
Epoch 4/5:  61%|██████    | 1338/2208 [08:01<05:04,  2.86it/s][A
Epoch 4/5:  61%|██████    | 1339/2208 [08:01<05:07,  2.83it/s][A
Epoch 4/5:  61%|██████    | 1340/2208 [08:02<05:12,  2.78it/s][A
Epoch 4/5:  61%|██████    | 1341/2208 [08:02<05:11,  2.78it/s][A
Epoch 4/5

Batch 1350: Training accuracy = 0.8281, F1 = 0.8063, Precision = 0.8021, Recall = 0.8281



Epoch 4/5:  61%|██████    | 1352/2208 [08:06<05:06,  2.80it/s][A
Epoch 4/5:  61%|██████▏   | 1353/2208 [08:06<05:00,  2.84it/s][A
Epoch 4/5:  61%|██████▏   | 1354/2208 [08:07<04:57,  2.87it/s][A
Epoch 4/5:  61%|██████▏   | 1355/2208 [08:07<04:55,  2.89it/s][A
Epoch 4/5:  61%|██████▏   | 1356/2208 [08:07<04:56,  2.87it/s][A
Epoch 4/5:  61%|██████▏   | 1357/2208 [08:08<04:56,  2.87it/s][A
Epoch 4/5:  62%|██████▏   | 1358/2208 [08:08<04:59,  2.83it/s][A
Epoch 4/5:  62%|██████▏   | 1359/2208 [08:08<05:05,  2.78it/s][A
Epoch 4/5:  62%|██████▏   | 1360/2208 [08:09<04:59,  2.83it/s][A
Epoch 4/5:  62%|██████▏   | 1361/2208 [08:09<05:07,  2.75it/s][A
Epoch 4/5:  62%|██████▏   | 1362/2208 [08:09<05:07,  2.75it/s][A
Epoch 4/5:  62%|██████▏   | 1363/2208 [08:10<05:02,  2.79it/s][A
Epoch 4/5:  62%|██████▏   | 1364/2208 [08:10<04:59,  2.82it/s][A
Epoch 4/5:  62%|██████▏   | 1365/2208 [08:10<05:02,  2.78it/s][A
Epoch 4/5:  62%|██████▏   | 1366/2208 [08:11<04:59,  2.81it/s][A
Epoch 4/5

Batch 1375: Training accuracy = 0.8516, F1 = 0.8419, Precision = 0.8529, Recall = 0.8516



Epoch 4/5:  62%|██████▏   | 1377/2208 [08:15<04:51,  2.86it/s][A
Epoch 4/5:  62%|██████▏   | 1378/2208 [08:15<04:51,  2.85it/s][A
Epoch 4/5:  62%|██████▏   | 1379/2208 [08:15<04:48,  2.87it/s][A
Epoch 4/5:  62%|██████▎   | 1380/2208 [08:16<04:48,  2.87it/s][A
Epoch 4/5:  63%|██████▎   | 1381/2208 [08:16<04:47,  2.88it/s][A
Epoch 4/5:  63%|██████▎   | 1382/2208 [08:16<04:51,  2.84it/s][A
Epoch 4/5:  63%|██████▎   | 1383/2208 [08:17<04:56,  2.78it/s][A
Epoch 4/5:  63%|██████▎   | 1384/2208 [08:17<04:54,  2.80it/s][A
Epoch 4/5:  63%|██████▎   | 1385/2208 [08:18<04:52,  2.82it/s][A
Epoch 4/5:  63%|██████▎   | 1386/2208 [08:18<04:55,  2.78it/s][A
Epoch 4/5:  63%|██████▎   | 1387/2208 [08:18<04:50,  2.82it/s][A
Epoch 4/5:  63%|██████▎   | 1388/2208 [08:19<04:55,  2.78it/s][A
Epoch 4/5:  63%|██████▎   | 1389/2208 [08:19<04:50,  2.82it/s][A
Epoch 4/5:  63%|██████▎   | 1390/2208 [08:19<04:52,  2.80it/s][A
Epoch 4/5:  63%|██████▎   | 1391/2208 [08:20<04:46,  2.85it/s][A
Epoch 4/5

Batch 1400: Training accuracy = 0.8828, F1 = 0.8797, Precision = 0.8948, Recall = 0.8828



Epoch 4/5:  63%|██████▎   | 1402/2208 [08:24<04:55,  2.72it/s][A
Epoch 4/5:  64%|██████▎   | 1403/2208 [08:24<04:51,  2.76it/s][A
Epoch 4/5:  64%|██████▎   | 1404/2208 [08:24<04:53,  2.74it/s][A
Epoch 4/5:  64%|██████▎   | 1405/2208 [08:25<04:47,  2.79it/s][A
Epoch 4/5:  64%|██████▎   | 1406/2208 [08:25<04:54,  2.72it/s][A
Epoch 4/5:  64%|██████▎   | 1407/2208 [08:25<04:58,  2.69it/s][A
Epoch 4/5:  64%|██████▍   | 1408/2208 [08:26<04:59,  2.67it/s][A
Epoch 4/5:  64%|██████▍   | 1409/2208 [08:26<04:58,  2.68it/s][A
Epoch 4/5:  64%|██████▍   | 1410/2208 [08:27<04:55,  2.70it/s][A
Epoch 4/5:  64%|██████▍   | 1411/2208 [08:27<04:49,  2.75it/s][A
Epoch 4/5:  64%|██████▍   | 1412/2208 [08:27<04:55,  2.69it/s][A
Epoch 4/5:  64%|██████▍   | 1413/2208 [08:28<05:03,  2.62it/s][A
Epoch 4/5:  64%|██████▍   | 1414/2208 [08:28<04:54,  2.70it/s][A
Epoch 4/5:  64%|██████▍   | 1415/2208 [08:28<04:46,  2.76it/s][A
Epoch 4/5:  64%|██████▍   | 1416/2208 [08:29<04:50,  2.73it/s][A
Epoch 4/5

Batch 1425: Training accuracy = 0.8438, F1 = 0.8225, Precision = 0.8109, Recall = 0.8438



Epoch 4/5:  65%|██████▍   | 1427/2208 [08:33<04:31,  2.87it/s][A
Epoch 4/5:  65%|██████▍   | 1428/2208 [08:33<04:30,  2.89it/s][A
Epoch 4/5:  65%|██████▍   | 1429/2208 [08:33<04:29,  2.89it/s][A
Epoch 4/5:  65%|██████▍   | 1430/2208 [08:34<04:28,  2.90it/s][A
Epoch 4/5:  65%|██████▍   | 1431/2208 [08:34<04:27,  2.91it/s][A
Epoch 4/5:  65%|██████▍   | 1432/2208 [08:34<04:26,  2.91it/s][A
Epoch 4/5:  65%|██████▍   | 1433/2208 [08:35<04:28,  2.89it/s][A
Epoch 4/5:  65%|██████▍   | 1434/2208 [08:35<04:26,  2.90it/s][A
Epoch 4/5:  65%|██████▍   | 1435/2208 [08:35<04:27,  2.89it/s][A
Epoch 4/5:  65%|██████▌   | 1436/2208 [08:36<04:32,  2.83it/s][A
Epoch 4/5:  65%|██████▌   | 1437/2208 [08:36<04:30,  2.85it/s][A
Epoch 4/5:  65%|██████▌   | 1438/2208 [08:37<04:32,  2.82it/s][A
Epoch 4/5:  65%|██████▌   | 1439/2208 [08:37<04:31,  2.83it/s][A
Epoch 4/5:  65%|██████▌   | 1440/2208 [08:37<04:29,  2.85it/s][A
Epoch 4/5:  65%|██████▌   | 1441/2208 [08:38<04:27,  2.87it/s][A
Epoch 4/5

Batch 1450: Training accuracy = 0.8828, F1 = 0.8661, Precision = 0.8568, Recall = 0.8828



Epoch 4/5:  66%|██████▌   | 1452/2208 [08:42<04:40,  2.70it/s][A
Epoch 4/5:  66%|██████▌   | 1453/2208 [08:42<04:43,  2.66it/s][A
Epoch 4/5:  66%|██████▌   | 1454/2208 [08:42<04:38,  2.71it/s][A
Epoch 4/5:  66%|██████▌   | 1455/2208 [08:43<04:38,  2.71it/s][A
Epoch 4/5:  66%|██████▌   | 1456/2208 [08:43<04:34,  2.74it/s][A
Epoch 4/5:  66%|██████▌   | 1457/2208 [08:43<04:36,  2.72it/s][A
Epoch 4/5:  66%|██████▌   | 1458/2208 [08:44<04:30,  2.77it/s][A
Epoch 4/5:  66%|██████▌   | 1459/2208 [08:44<04:25,  2.82it/s][A
Epoch 4/5:  66%|██████▌   | 1460/2208 [08:44<04:22,  2.85it/s][A
Epoch 4/5:  66%|██████▌   | 1461/2208 [08:45<04:22,  2.85it/s][A
Epoch 4/5:  66%|██████▌   | 1462/2208 [08:45<04:22,  2.85it/s][A
Epoch 4/5:  66%|██████▋   | 1463/2208 [08:45<04:24,  2.82it/s][A
Epoch 4/5:  66%|██████▋   | 1464/2208 [08:46<04:19,  2.86it/s][A
Epoch 4/5:  66%|██████▋   | 1465/2208 [08:46<04:20,  2.85it/s][A
Epoch 4/5:  66%|██████▋   | 1466/2208 [08:47<04:26,  2.78it/s][A
Epoch 4/5

Batch 1475: Training accuracy = 0.8594, F1 = 0.8542, Precision = 0.8711, Recall = 0.8594



Epoch 4/5:  67%|██████▋   | 1477/2208 [08:50<04:21,  2.79it/s][A
Epoch 4/5:  67%|██████▋   | 1478/2208 [08:51<04:21,  2.79it/s][A
Epoch 4/5:  67%|██████▋   | 1479/2208 [08:51<04:17,  2.83it/s][A
Epoch 4/5:  67%|██████▋   | 1480/2208 [08:52<04:18,  2.82it/s][A
Epoch 4/5:  67%|██████▋   | 1481/2208 [08:52<04:19,  2.80it/s][A
Epoch 4/5:  67%|██████▋   | 1482/2208 [08:52<04:18,  2.81it/s][A
Epoch 4/5:  67%|██████▋   | 1483/2208 [08:53<04:23,  2.75it/s][A
Epoch 4/5:  67%|██████▋   | 1484/2208 [08:53<04:24,  2.74it/s][A
Epoch 4/5:  67%|██████▋   | 1485/2208 [08:53<04:28,  2.69it/s][A
Epoch 4/5:  67%|██████▋   | 1486/2208 [08:54<04:23,  2.74it/s][A
Epoch 4/5:  67%|██████▋   | 1487/2208 [08:54<04:29,  2.67it/s][A
Epoch 4/5:  67%|██████▋   | 1488/2208 [08:55<04:27,  2.69it/s][A
Epoch 4/5:  67%|██████▋   | 1489/2208 [08:55<04:20,  2.76it/s][A
Epoch 4/5:  67%|██████▋   | 1490/2208 [08:55<04:24,  2.72it/s][A
Epoch 4/5:  68%|██████▊   | 1491/2208 [08:56<04:21,  2.74it/s][A
Epoch 4/5

Batch 1500: Training accuracy = 0.9141, F1 = 0.9083, Precision = 0.9089, Recall = 0.9141



Epoch 4/5:  68%|██████▊   | 1502/2208 [09:00<04:23,  2.68it/s][A
Epoch 4/5:  68%|██████▊   | 1503/2208 [09:00<04:16,  2.75it/s][A
Epoch 4/5:  68%|██████▊   | 1504/2208 [09:00<04:12,  2.79it/s][A
Epoch 4/5:  68%|██████▊   | 1505/2208 [09:01<04:07,  2.84it/s][A
Epoch 4/5:  68%|██████▊   | 1506/2208 [09:01<04:16,  2.74it/s][A
Epoch 4/5:  68%|██████▊   | 1507/2208 [09:01<04:10,  2.80it/s][A
Epoch 4/5:  68%|██████▊   | 1508/2208 [09:02<04:06,  2.84it/s][A
Epoch 4/5:  68%|██████▊   | 1509/2208 [09:02<04:06,  2.83it/s][A
Epoch 4/5:  68%|██████▊   | 1510/2208 [09:02<04:05,  2.84it/s][A
Epoch 4/5:  68%|██████▊   | 1511/2208 [09:03<04:04,  2.84it/s][A
Epoch 4/5:  68%|██████▊   | 1512/2208 [09:03<04:03,  2.86it/s][A
Epoch 4/5:  69%|██████▊   | 1513/2208 [09:04<04:05,  2.83it/s][A
Epoch 4/5:  69%|██████▊   | 1514/2208 [09:04<04:04,  2.84it/s][A
Epoch 4/5:  69%|██████▊   | 1515/2208 [09:04<04:04,  2.83it/s][A
Epoch 4/5:  69%|██████▊   | 1516/2208 [09:05<04:00,  2.87it/s][A
Epoch 4/5

Batch 1525: Training accuracy = 0.8672, F1 = 0.8573, Precision = 0.8635, Recall = 0.8672



Epoch 4/5:  69%|██████▉   | 1527/2208 [09:09<04:06,  2.76it/s][A
Epoch 4/5:  69%|██████▉   | 1528/2208 [09:09<04:07,  2.75it/s][A
Epoch 4/5:  69%|██████▉   | 1529/2208 [09:09<04:07,  2.75it/s][A
Epoch 4/5:  69%|██████▉   | 1530/2208 [09:10<04:12,  2.69it/s][A
Epoch 4/5:  69%|██████▉   | 1531/2208 [09:10<04:10,  2.70it/s][A
Epoch 4/5:  69%|██████▉   | 1532/2208 [09:10<04:04,  2.76it/s][A
Epoch 4/5:  69%|██████▉   | 1533/2208 [09:11<04:07,  2.73it/s][A
Epoch 4/5:  69%|██████▉   | 1534/2208 [09:11<04:03,  2.77it/s][A
Epoch 4/5:  70%|██████▉   | 1535/2208 [09:11<04:01,  2.79it/s][A
Epoch 4/5:  70%|██████▉   | 1536/2208 [09:12<04:00,  2.79it/s][A
Epoch 4/5:  70%|██████▉   | 1537/2208 [09:12<03:56,  2.84it/s][A
Epoch 4/5:  70%|██████▉   | 1538/2208 [09:12<04:00,  2.79it/s][A
Epoch 4/5:  70%|██████▉   | 1539/2208 [09:13<03:55,  2.84it/s][A
Epoch 4/5:  70%|██████▉   | 1540/2208 [09:13<03:58,  2.81it/s][A
Epoch 4/5:  70%|██████▉   | 1541/2208 [09:14<03:56,  2.82it/s][A
Epoch 4/5

Batch 1550: Training accuracy = 0.8906, F1 = 0.8854, Precision = 0.8945, Recall = 0.8906



Epoch 4/5:  70%|███████   | 1552/2208 [09:17<03:47,  2.88it/s][A
Epoch 4/5:  70%|███████   | 1553/2208 [09:18<03:51,  2.83it/s][A
Epoch 4/5:  70%|███████   | 1554/2208 [09:18<03:55,  2.78it/s][A
Epoch 4/5:  70%|███████   | 1555/2208 [09:18<03:50,  2.83it/s][A
Epoch 4/5:  70%|███████   | 1556/2208 [09:19<03:50,  2.83it/s][A
Epoch 4/5:  71%|███████   | 1557/2208 [09:19<03:48,  2.85it/s][A
Epoch 4/5:  71%|███████   | 1558/2208 [09:20<03:48,  2.85it/s][A
Epoch 4/5:  71%|███████   | 1559/2208 [09:20<03:47,  2.85it/s][A
Epoch 4/5:  71%|███████   | 1560/2208 [09:20<03:50,  2.81it/s][A
Epoch 4/5:  71%|███████   | 1561/2208 [09:21<03:54,  2.76it/s][A
Epoch 4/5:  71%|███████   | 1562/2208 [09:21<03:50,  2.81it/s][A
Epoch 4/5:  71%|███████   | 1563/2208 [09:21<03:47,  2.83it/s][A
Epoch 4/5:  71%|███████   | 1564/2208 [09:22<03:50,  2.79it/s][A
Epoch 4/5:  71%|███████   | 1565/2208 [09:22<03:51,  2.78it/s][A
Epoch 4/5:  71%|███████   | 1566/2208 [09:22<03:52,  2.77it/s][A
Epoch 4/5

Batch 1575: Training accuracy = 0.8984, F1 = 0.8979, Precision = 0.9010, Recall = 0.8984



Epoch 4/5:  71%|███████▏  | 1577/2208 [09:26<03:43,  2.82it/s][A
Epoch 4/5:  71%|███████▏  | 1578/2208 [09:27<03:43,  2.82it/s][A
Epoch 4/5:  72%|███████▏  | 1579/2208 [09:27<03:40,  2.86it/s][A
Epoch 4/5:  72%|███████▏  | 1580/2208 [09:28<03:44,  2.79it/s][A
Epoch 4/5:  72%|███████▏  | 1581/2208 [09:28<03:47,  2.76it/s][A
Epoch 4/5:  72%|███████▏  | 1582/2208 [09:28<03:45,  2.78it/s][A
Epoch 4/5:  72%|███████▏  | 1583/2208 [09:29<03:41,  2.82it/s][A
Epoch 4/5:  72%|███████▏  | 1584/2208 [09:29<03:43,  2.79it/s][A
Epoch 4/5:  72%|███████▏  | 1585/2208 [09:29<03:45,  2.76it/s][A
Epoch 4/5:  72%|███████▏  | 1586/2208 [09:30<03:44,  2.77it/s][A
Epoch 4/5:  72%|███████▏  | 1587/2208 [09:30<03:45,  2.75it/s][A
Epoch 4/5:  72%|███████▏  | 1588/2208 [09:30<03:42,  2.79it/s][A
Epoch 4/5:  72%|███████▏  | 1589/2208 [09:31<03:38,  2.83it/s][A
Epoch 4/5:  72%|███████▏  | 1590/2208 [09:31<03:35,  2.86it/s][A
Epoch 4/5:  72%|███████▏  | 1591/2208 [09:31<03:35,  2.86it/s][A
Epoch 4/5

Batch 1600: Training accuracy = 0.8203, F1 = 0.8034, Precision = 0.8021, Recall = 0.8203



Epoch 4/5:  73%|███████▎  | 1602/2208 [09:35<03:42,  2.73it/s][A
Epoch 4/5:  73%|███████▎  | 1603/2208 [09:36<03:36,  2.79it/s][A
Epoch 4/5:  73%|███████▎  | 1604/2208 [09:36<03:35,  2.80it/s][A
Epoch 4/5:  73%|███████▎  | 1605/2208 [09:36<03:38,  2.76it/s][A
Epoch 4/5:  73%|███████▎  | 1606/2208 [09:37<03:40,  2.73it/s][A
Epoch 4/5:  73%|███████▎  | 1607/2208 [09:37<03:38,  2.76it/s][A
Epoch 4/5:  73%|███████▎  | 1608/2208 [09:38<03:38,  2.75it/s][A
Epoch 4/5:  73%|███████▎  | 1609/2208 [09:38<03:37,  2.75it/s][A
Epoch 4/5:  73%|███████▎  | 1610/2208 [09:38<03:39,  2.72it/s][A
Epoch 4/5:  73%|███████▎  | 1611/2208 [09:39<03:40,  2.71it/s][A
Epoch 4/5:  73%|███████▎  | 1612/2208 [09:39<03:40,  2.70it/s][A
Epoch 4/5:  73%|███████▎  | 1613/2208 [09:39<03:41,  2.69it/s][A
Epoch 4/5:  73%|███████▎  | 1614/2208 [09:40<03:36,  2.75it/s][A
Epoch 4/5:  73%|███████▎  | 1615/2208 [09:40<03:33,  2.78it/s][A
Epoch 4/5:  73%|███████▎  | 1616/2208 [09:40<03:30,  2.81it/s][A
Epoch 4/5

Batch 1625: Training accuracy = 0.8594, F1 = 0.8456, Precision = 0.8483, Recall = 0.8594



Epoch 4/5:  74%|███████▎  | 1627/2208 [09:44<03:24,  2.83it/s][A
Epoch 4/5:  74%|███████▎  | 1628/2208 [09:45<03:26,  2.81it/s][A
Epoch 4/5:  74%|███████▍  | 1629/2208 [09:45<03:25,  2.82it/s][A
Epoch 4/5:  74%|███████▍  | 1630/2208 [09:45<03:23,  2.84it/s][A
Epoch 4/5:  74%|███████▍  | 1631/2208 [09:46<03:21,  2.87it/s][A
Epoch 4/5:  74%|███████▍  | 1632/2208 [09:46<03:20,  2.88it/s][A
Epoch 4/5:  74%|███████▍  | 1633/2208 [09:46<03:20,  2.87it/s][A
Epoch 4/5:  74%|███████▍  | 1634/2208 [09:47<03:24,  2.81it/s][A
Epoch 4/5:  74%|███████▍  | 1635/2208 [09:47<03:26,  2.77it/s][A
Epoch 4/5:  74%|███████▍  | 1636/2208 [09:48<03:29,  2.72it/s][A
Epoch 4/5:  74%|███████▍  | 1637/2208 [09:48<03:24,  2.79it/s][A
Epoch 4/5:  74%|███████▍  | 1638/2208 [09:48<03:26,  2.76it/s][A
Epoch 4/5:  74%|███████▍  | 1639/2208 [09:49<03:21,  2.82it/s][A
Epoch 4/5:  74%|███████▍  | 1640/2208 [09:49<03:18,  2.86it/s][A
Epoch 4/5:  74%|███████▍  | 1641/2208 [09:49<03:16,  2.89it/s][A
Epoch 4/5

Batch 1650: Training accuracy = 0.8203, F1 = 0.8065, Precision = 0.8092, Recall = 0.8203



Epoch 4/5:  75%|███████▍  | 1652/2208 [09:53<03:24,  2.72it/s][A
Epoch 4/5:  75%|███████▍  | 1653/2208 [09:54<03:22,  2.74it/s][A
Epoch 4/5:  75%|███████▍  | 1654/2208 [09:54<03:24,  2.71it/s][A
Epoch 4/5:  75%|███████▍  | 1655/2208 [09:54<03:20,  2.76it/s][A
Epoch 4/5:  75%|███████▌  | 1656/2208 [09:55<03:17,  2.79it/s][A
Epoch 4/5:  75%|███████▌  | 1657/2208 [09:55<03:16,  2.80it/s][A
Epoch 4/5:  75%|███████▌  | 1658/2208 [09:55<03:16,  2.80it/s][A
Epoch 4/5:  75%|███████▌  | 1659/2208 [09:56<03:13,  2.84it/s][A
Epoch 4/5:  75%|███████▌  | 1660/2208 [09:56<03:11,  2.87it/s][A
Epoch 4/5:  75%|███████▌  | 1661/2208 [09:56<03:11,  2.85it/s][A
Epoch 4/5:  75%|███████▌  | 1662/2208 [09:57<03:14,  2.80it/s][A
Epoch 4/5:  75%|███████▌  | 1663/2208 [09:57<03:16,  2.77it/s][A
Epoch 4/5:  75%|███████▌  | 1664/2208 [09:58<03:13,  2.81it/s][A
Epoch 4/5:  75%|███████▌  | 1665/2208 [09:58<03:13,  2.81it/s][A
Epoch 4/5:  75%|███████▌  | 1666/2208 [09:58<03:10,  2.85it/s][A
Epoch 4/5

Batch 1675: Training accuracy = 0.8828, F1 = 0.8797, Precision = 0.8893, Recall = 0.8828



Epoch 4/5:  76%|███████▌  | 1677/2208 [10:02<03:13,  2.74it/s][A
Epoch 4/5:  76%|███████▌  | 1678/2208 [10:03<03:14,  2.72it/s][A
Epoch 4/5:  76%|███████▌  | 1679/2208 [10:03<03:13,  2.73it/s][A
Epoch 4/5:  76%|███████▌  | 1680/2208 [10:03<03:08,  2.80it/s][A
Epoch 4/5:  76%|███████▌  | 1681/2208 [10:04<03:06,  2.83it/s][A
Epoch 4/5:  76%|███████▌  | 1682/2208 [10:04<03:08,  2.79it/s][A
Epoch 4/5:  76%|███████▌  | 1683/2208 [10:04<03:07,  2.80it/s][A
Epoch 4/5:  76%|███████▋  | 1684/2208 [10:05<03:07,  2.79it/s][A
Epoch 4/5:  76%|███████▋  | 1685/2208 [10:05<03:09,  2.76it/s][A
Epoch 4/5:  76%|███████▋  | 1686/2208 [10:05<03:05,  2.82it/s][A
Epoch 4/5:  76%|███████▋  | 1687/2208 [10:06<03:06,  2.79it/s][A
Epoch 4/5:  76%|███████▋  | 1688/2208 [10:06<03:04,  2.81it/s][A
Epoch 4/5:  76%|███████▋  | 1689/2208 [10:07<03:08,  2.76it/s][A
Epoch 4/5:  77%|███████▋  | 1690/2208 [10:07<03:05,  2.79it/s][A
Epoch 4/5:  77%|███████▋  | 1691/2208 [10:07<03:05,  2.78it/s][A
Epoch 4/5

Batch 1700: Training accuracy = 0.8516, F1 = 0.8464, Precision = 0.8568, Recall = 0.8516



Epoch 4/5:  77%|███████▋  | 1702/2208 [10:11<03:00,  2.81it/s][A
Epoch 4/5:  77%|███████▋  | 1703/2208 [10:12<02:57,  2.84it/s][A
Epoch 4/5:  77%|███████▋  | 1704/2208 [10:12<02:55,  2.87it/s][A
Epoch 4/5:  77%|███████▋  | 1705/2208 [10:12<02:55,  2.87it/s][A
Epoch 4/5:  77%|███████▋  | 1706/2208 [10:13<02:55,  2.85it/s][A
Epoch 4/5:  77%|███████▋  | 1707/2208 [10:13<02:54,  2.87it/s][A
Epoch 4/5:  77%|███████▋  | 1708/2208 [10:13<02:55,  2.85it/s][A
Epoch 4/5:  77%|███████▋  | 1709/2208 [10:14<02:53,  2.87it/s][A
Epoch 4/5:  77%|███████▋  | 1710/2208 [10:14<02:57,  2.80it/s][A
Epoch 4/5:  77%|███████▋  | 1711/2208 [10:14<02:59,  2.77it/s][A
Epoch 4/5:  78%|███████▊  | 1712/2208 [10:15<02:55,  2.83it/s][A
Epoch 4/5:  78%|███████▊  | 1713/2208 [10:15<02:57,  2.79it/s][A
Epoch 4/5:  78%|███████▊  | 1714/2208 [10:15<02:54,  2.83it/s][A
Epoch 4/5:  78%|███████▊  | 1715/2208 [10:16<02:52,  2.85it/s][A
Epoch 4/5:  78%|███████▊  | 1716/2208 [10:16<02:52,  2.85it/s][A
Epoch 4/5

Batch 1725: Training accuracy = 0.8672, F1 = 0.8542, Precision = 0.8555, Recall = 0.8672



Epoch 4/5:  78%|███████▊  | 1727/2208 [10:20<02:52,  2.79it/s][A
Epoch 4/5:  78%|███████▊  | 1728/2208 [10:20<02:50,  2.81it/s][A
Epoch 4/5:  78%|███████▊  | 1729/2208 [10:21<02:53,  2.77it/s][A
Epoch 4/5:  78%|███████▊  | 1730/2208 [10:21<02:57,  2.69it/s][A
Epoch 4/5:  78%|███████▊  | 1731/2208 [10:21<02:56,  2.70it/s][A
Epoch 4/5:  78%|███████▊  | 1732/2208 [10:22<02:52,  2.75it/s][A
Epoch 4/5:  78%|███████▊  | 1733/2208 [10:22<02:53,  2.74it/s][A
Epoch 4/5:  79%|███████▊  | 1734/2208 [10:23<02:49,  2.80it/s][A
Epoch 4/5:  79%|███████▊  | 1735/2208 [10:23<02:50,  2.77it/s][A
Epoch 4/5:  79%|███████▊  | 1736/2208 [10:23<02:55,  2.69it/s][A
Epoch 4/5:  79%|███████▊  | 1737/2208 [10:24<02:58,  2.64it/s][A
Epoch 4/5:  79%|███████▊  | 1738/2208 [10:24<02:52,  2.72it/s][A
Epoch 4/5:  79%|███████▉  | 1739/2208 [10:24<02:54,  2.69it/s][A
Epoch 4/5:  79%|███████▉  | 1740/2208 [10:25<02:49,  2.75it/s][A
Epoch 4/5:  79%|███████▉  | 1741/2208 [10:25<02:48,  2.77it/s][A
Epoch 4/5

Batch 1750: Training accuracy = 0.9062, F1 = 0.8995, Precision = 0.8997, Recall = 0.9062



Epoch 4/5:  79%|███████▉  | 1752/2208 [10:29<02:42,  2.81it/s][A
Epoch 4/5:  79%|███████▉  | 1753/2208 [10:29<02:39,  2.85it/s][A
Epoch 4/5:  79%|███████▉  | 1754/2208 [10:30<02:38,  2.86it/s][A
Epoch 4/5:  79%|███████▉  | 1755/2208 [10:30<02:37,  2.88it/s][A
Epoch 4/5:  80%|███████▉  | 1756/2208 [10:30<02:35,  2.90it/s][A
Epoch 4/5:  80%|███████▉  | 1757/2208 [10:31<02:35,  2.89it/s][A
Epoch 4/5:  80%|███████▉  | 1758/2208 [10:31<02:38,  2.85it/s][A
Epoch 4/5:  80%|███████▉  | 1759/2208 [10:31<02:38,  2.84it/s][A
Epoch 4/5:  80%|███████▉  | 1760/2208 [10:32<02:37,  2.85it/s][A
Epoch 4/5:  80%|███████▉  | 1761/2208 [10:32<02:37,  2.84it/s][A
Epoch 4/5:  80%|███████▉  | 1762/2208 [10:32<02:36,  2.86it/s][A
Epoch 4/5:  80%|███████▉  | 1763/2208 [10:33<02:34,  2.89it/s][A
Epoch 4/5:  80%|███████▉  | 1764/2208 [10:33<02:32,  2.90it/s][A
Epoch 4/5:  80%|███████▉  | 1765/2208 [10:34<02:32,  2.91it/s][A
Epoch 4/5:  80%|███████▉  | 1766/2208 [10:34<02:31,  2.92it/s][A
Epoch 4/5

Batch 1775: Training accuracy = 0.8672, F1 = 0.8594, Precision = 0.8633, Recall = 0.8672



Epoch 4/5:  80%|████████  | 1777/2208 [10:38<02:35,  2.77it/s][A
Epoch 4/5:  81%|████████  | 1778/2208 [10:38<02:36,  2.75it/s][A
Epoch 4/5:  81%|████████  | 1779/2208 [10:39<02:33,  2.80it/s][A
Epoch 4/5:  81%|████████  | 1780/2208 [10:39<02:34,  2.77it/s][A
Epoch 4/5:  81%|████████  | 1781/2208 [10:39<02:32,  2.79it/s][A
Epoch 4/5:  81%|████████  | 1782/2208 [10:40<02:30,  2.83it/s][A
Epoch 4/5:  81%|████████  | 1783/2208 [10:40<02:31,  2.80it/s][A
Epoch 4/5:  81%|████████  | 1784/2208 [10:40<02:29,  2.84it/s][A
Epoch 4/5:  81%|████████  | 1785/2208 [10:41<02:27,  2.87it/s][A
Epoch 4/5:  81%|████████  | 1786/2208 [10:41<02:25,  2.90it/s][A
Epoch 4/5:  81%|████████  | 1787/2208 [10:41<02:30,  2.80it/s][A
Epoch 4/5:  81%|████████  | 1788/2208 [10:42<02:29,  2.81it/s][A
Epoch 4/5:  81%|████████  | 1789/2208 [10:42<02:28,  2.83it/s][A
Epoch 4/5:  81%|████████  | 1790/2208 [10:42<02:29,  2.80it/s][A
Epoch 4/5:  81%|████████  | 1791/2208 [10:43<02:30,  2.77it/s][A
Epoch 4/5

Batch 1800: Training accuracy = 0.8906, F1 = 0.8906, Precision = 0.9167, Recall = 0.8906



Epoch 4/5:  82%|████████▏ | 1802/2208 [10:47<02:27,  2.75it/s][A
Epoch 4/5:  82%|████████▏ | 1803/2208 [10:47<02:24,  2.80it/s][A
Epoch 4/5:  82%|████████▏ | 1804/2208 [10:47<02:23,  2.81it/s][A
Epoch 4/5:  82%|████████▏ | 1805/2208 [10:48<02:22,  2.82it/s][A
Epoch 4/5:  82%|████████▏ | 1806/2208 [10:48<02:21,  2.84it/s][A
Epoch 4/5:  82%|████████▏ | 1807/2208 [10:48<02:21,  2.82it/s][A
Epoch 4/5:  82%|████████▏ | 1808/2208 [10:49<02:20,  2.84it/s][A
Epoch 4/5:  82%|████████▏ | 1809/2208 [10:49<02:20,  2.85it/s][A
Epoch 4/5:  82%|████████▏ | 1810/2208 [10:49<02:20,  2.83it/s][A
Epoch 4/5:  82%|████████▏ | 1811/2208 [10:50<02:22,  2.78it/s][A
Epoch 4/5:  82%|████████▏ | 1812/2208 [10:50<02:22,  2.79it/s][A
Epoch 4/5:  82%|████████▏ | 1813/2208 [10:51<02:26,  2.70it/s][A
Epoch 4/5:  82%|████████▏ | 1814/2208 [10:51<02:27,  2.68it/s][A
Epoch 4/5:  82%|████████▏ | 1815/2208 [10:51<02:23,  2.74it/s][A
Epoch 4/5:  82%|████████▏ | 1816/2208 [10:52<02:22,  2.75it/s][A
Epoch 4/5

Batch 1825: Training accuracy = 0.8750, F1 = 0.8680, Precision = 0.8685, Recall = 0.8750



Epoch 4/5:  83%|████████▎ | 1827/2208 [10:56<02:17,  2.78it/s][A
Epoch 4/5:  83%|████████▎ | 1828/2208 [10:56<02:14,  2.83it/s][A
Epoch 4/5:  83%|████████▎ | 1829/2208 [10:56<02:15,  2.80it/s][A
Epoch 4/5:  83%|████████▎ | 1830/2208 [10:57<02:16,  2.76it/s][A
Epoch 4/5:  83%|████████▎ | 1831/2208 [10:57<02:17,  2.74it/s][A
Epoch 4/5:  83%|████████▎ | 1832/2208 [10:58<02:16,  2.76it/s][A
Epoch 4/5:  83%|████████▎ | 1833/2208 [10:58<02:14,  2.78it/s][A
Epoch 4/5:  83%|████████▎ | 1834/2208 [10:58<02:14,  2.77it/s][A
Epoch 4/5:  83%|████████▎ | 1835/2208 [10:59<02:14,  2.77it/s][A
Epoch 4/5:  83%|████████▎ | 1836/2208 [10:59<02:12,  2.82it/s][A
Epoch 4/5:  83%|████████▎ | 1837/2208 [10:59<02:10,  2.85it/s][A
Epoch 4/5:  83%|████████▎ | 1838/2208 [11:00<02:08,  2.89it/s][A
Epoch 4/5:  83%|████████▎ | 1839/2208 [11:00<02:10,  2.83it/s][A
Epoch 4/5:  83%|████████▎ | 1840/2208 [11:00<02:08,  2.86it/s][A
Epoch 4/5:  83%|████████▎ | 1841/2208 [11:01<02:10,  2.82it/s][A
Epoch 4/5

Batch 1850: Training accuracy = 0.8984, F1 = 0.8844, Precision = 0.8763, Recall = 0.8984



Epoch 4/5:  84%|████████▍ | 1852/2208 [11:05<02:08,  2.77it/s][A
Epoch 4/5:  84%|████████▍ | 1853/2208 [11:05<02:09,  2.75it/s][A
Epoch 4/5:  84%|████████▍ | 1854/2208 [11:05<02:06,  2.79it/s][A
Epoch 4/5:  84%|████████▍ | 1855/2208 [11:06<02:04,  2.83it/s][A
Epoch 4/5:  84%|████████▍ | 1856/2208 [11:06<02:03,  2.86it/s][A
Epoch 4/5:  84%|████████▍ | 1857/2208 [11:07<02:05,  2.79it/s][A
Epoch 4/5:  84%|████████▍ | 1858/2208 [11:07<02:07,  2.75it/s][A
Epoch 4/5:  84%|████████▍ | 1859/2208 [11:07<02:08,  2.72it/s][A
Epoch 4/5:  84%|████████▍ | 1860/2208 [11:08<02:06,  2.76it/s][A
Epoch 4/5:  84%|████████▍ | 1861/2208 [11:08<02:05,  2.77it/s][A
Epoch 4/5:  84%|████████▍ | 1862/2208 [11:08<02:05,  2.76it/s][A
Epoch 4/5:  84%|████████▍ | 1863/2208 [11:09<02:02,  2.81it/s][A
Epoch 4/5:  84%|████████▍ | 1864/2208 [11:09<02:04,  2.77it/s][A
Epoch 4/5:  84%|████████▍ | 1865/2208 [11:09<02:04,  2.75it/s][A
Epoch 4/5:  85%|████████▍ | 1866/2208 [11:10<02:01,  2.81it/s][A
Epoch 4/5

Batch 1875: Training accuracy = 0.8203, F1 = 0.8079, Precision = 0.8148, Recall = 0.8203



Epoch 4/5:  85%|████████▌ | 1877/2208 [11:14<01:58,  2.78it/s][A
Epoch 4/5:  85%|████████▌ | 1878/2208 [11:14<01:58,  2.79it/s][A
Epoch 4/5:  85%|████████▌ | 1879/2208 [11:14<01:58,  2.79it/s][A
Epoch 4/5:  85%|████████▌ | 1880/2208 [11:15<01:55,  2.84it/s][A
Epoch 4/5:  85%|████████▌ | 1881/2208 [11:15<01:56,  2.81it/s][A
Epoch 4/5:  85%|████████▌ | 1882/2208 [11:16<01:55,  2.81it/s][A
Epoch 4/5:  85%|████████▌ | 1883/2208 [11:16<01:55,  2.80it/s][A
Epoch 4/5:  85%|████████▌ | 1884/2208 [11:16<01:54,  2.84it/s][A
Epoch 4/5:  85%|████████▌ | 1885/2208 [11:17<01:55,  2.80it/s][A
Epoch 4/5:  85%|████████▌ | 1886/2208 [11:17<01:53,  2.84it/s][A
Epoch 4/5:  85%|████████▌ | 1887/2208 [11:17<01:54,  2.80it/s][A
Epoch 4/5:  86%|████████▌ | 1888/2208 [11:18<01:52,  2.85it/s][A
Epoch 4/5:  86%|████████▌ | 1889/2208 [11:18<01:50,  2.88it/s][A
Epoch 4/5:  86%|████████▌ | 1890/2208 [11:18<01:50,  2.88it/s][A
Epoch 4/5:  86%|████████▌ | 1891/2208 [11:19<01:50,  2.86it/s][A
Epoch 4/5

Batch 1900: Training accuracy = 0.9219, F1 = 0.9115, Precision = 0.9115, Recall = 0.9219



Epoch 4/5:  86%|████████▌ | 1902/2208 [11:23<01:52,  2.71it/s][A
Epoch 4/5:  86%|████████▌ | 1903/2208 [11:23<01:50,  2.76it/s][A
Epoch 4/5:  86%|████████▌ | 1904/2208 [11:23<01:48,  2.80it/s][A
Epoch 4/5:  86%|████████▋ | 1905/2208 [11:24<01:46,  2.84it/s][A
Epoch 4/5:  86%|████████▋ | 1906/2208 [11:24<01:46,  2.84it/s][A
Epoch 4/5:  86%|████████▋ | 1907/2208 [11:24<01:45,  2.86it/s][A
Epoch 4/5:  86%|████████▋ | 1908/2208 [11:25<01:44,  2.88it/s][A
Epoch 4/5:  86%|████████▋ | 1909/2208 [11:25<01:43,  2.88it/s][A
Epoch 4/5:  87%|████████▋ | 1910/2208 [11:25<01:44,  2.86it/s][A
Epoch 4/5:  87%|████████▋ | 1911/2208 [11:26<01:43,  2.87it/s][A
Epoch 4/5:  87%|████████▋ | 1912/2208 [11:26<01:45,  2.80it/s][A
Epoch 4/5:  87%|████████▋ | 1913/2208 [11:27<01:45,  2.81it/s][A
Epoch 4/5:  87%|████████▋ | 1914/2208 [11:27<01:44,  2.81it/s][A
Epoch 4/5:  87%|████████▋ | 1915/2208 [11:27<01:44,  2.81it/s][A
Epoch 4/5:  87%|████████▋ | 1916/2208 [11:28<01:43,  2.81it/s][A
Epoch 4/5

Batch 1925: Training accuracy = 0.8438, F1 = 0.8279, Precision = 0.8385, Recall = 0.8438



Epoch 4/5:  87%|████████▋ | 1927/2208 [11:32<01:42,  2.74it/s][A
Epoch 4/5:  87%|████████▋ | 1928/2208 [11:32<01:40,  2.79it/s][A
Epoch 4/5:  87%|████████▋ | 1929/2208 [11:32<01:39,  2.81it/s][A
Epoch 4/5:  87%|████████▋ | 1930/2208 [11:33<01:37,  2.85it/s][A
Epoch 4/5:  87%|████████▋ | 1931/2208 [11:33<01:38,  2.82it/s][A
Epoch 4/5:  88%|████████▊ | 1932/2208 [11:33<01:37,  2.84it/s][A
Epoch 4/5:  88%|████████▊ | 1933/2208 [11:34<01:36,  2.85it/s][A
Epoch 4/5:  88%|████████▊ | 1934/2208 [11:34<01:36,  2.84it/s][A
Epoch 4/5:  88%|████████▊ | 1935/2208 [11:34<01:36,  2.82it/s][A
Epoch 4/5:  88%|████████▊ | 1936/2208 [11:35<01:38,  2.77it/s][A
Epoch 4/5:  88%|████████▊ | 1937/2208 [11:35<01:36,  2.81it/s][A
Epoch 4/5:  88%|████████▊ | 1938/2208 [11:35<01:35,  2.82it/s][A
Epoch 4/5:  88%|████████▊ | 1939/2208 [11:36<01:36,  2.78it/s][A
Epoch 4/5:  88%|████████▊ | 1940/2208 [11:36<01:36,  2.79it/s][A
Epoch 4/5:  88%|████████▊ | 1941/2208 [11:37<01:36,  2.75it/s][A
Epoch 4/5

Batch 1950: Training accuracy = 0.8125, F1 = 0.7919, Precision = 0.7891, Recall = 0.8125



Epoch 4/5:  88%|████████▊ | 1952/2208 [11:41<01:31,  2.80it/s][A
Epoch 4/5:  88%|████████▊ | 1953/2208 [11:41<01:29,  2.85it/s][A
Epoch 4/5:  88%|████████▊ | 1954/2208 [11:41<01:28,  2.87it/s][A
Epoch 4/5:  89%|████████▊ | 1955/2208 [11:42<01:29,  2.82it/s][A
Epoch 4/5:  89%|████████▊ | 1956/2208 [11:42<01:30,  2.79it/s][A
Epoch 4/5:  89%|████████▊ | 1957/2208 [11:42<01:29,  2.80it/s][A
Epoch 4/5:  89%|████████▊ | 1958/2208 [11:43<01:29,  2.79it/s][A
Epoch 4/5:  89%|████████▊ | 1959/2208 [11:43<01:30,  2.76it/s][A
Epoch 4/5:  89%|████████▉ | 1960/2208 [11:43<01:29,  2.77it/s][A
Epoch 4/5:  89%|████████▉ | 1961/2208 [11:44<01:29,  2.75it/s][A
Epoch 4/5:  89%|████████▉ | 1962/2208 [11:44<01:27,  2.80it/s][A
Epoch 4/5:  89%|████████▉ | 1963/2208 [11:44<01:26,  2.84it/s][A
Epoch 4/5:  89%|████████▉ | 1964/2208 [11:45<01:28,  2.77it/s][A
Epoch 4/5:  89%|████████▉ | 1965/2208 [11:45<01:26,  2.81it/s][A
Epoch 4/5:  89%|████████▉ | 1966/2208 [11:46<01:24,  2.85it/s][A
Epoch 4/5

Batch 1975: Training accuracy = 0.8750, F1 = 0.8633, Precision = 0.8581, Recall = 0.8750



Epoch 4/5:  90%|████████▉ | 1977/2208 [11:49<01:23,  2.77it/s][A
Epoch 4/5:  90%|████████▉ | 1978/2208 [11:50<01:21,  2.81it/s][A
Epoch 4/5:  90%|████████▉ | 1979/2208 [11:50<01:23,  2.75it/s][A
Epoch 4/5:  90%|████████▉ | 1980/2208 [11:51<01:23,  2.74it/s][A
Epoch 4/5:  90%|████████▉ | 1981/2208 [11:51<01:23,  2.71it/s][A
Epoch 4/5:  90%|████████▉ | 1982/2208 [11:51<01:24,  2.67it/s][A
Epoch 4/5:  90%|████████▉ | 1983/2208 [11:52<01:23,  2.68it/s][A
Epoch 4/5:  90%|████████▉ | 1984/2208 [11:52<01:23,  2.67it/s][A
Epoch 4/5:  90%|████████▉ | 1985/2208 [11:52<01:21,  2.74it/s][A
Epoch 4/5:  90%|████████▉ | 1986/2208 [11:53<01:19,  2.78it/s][A
Epoch 4/5:  90%|████████▉ | 1987/2208 [11:53<01:18,  2.83it/s][A
Epoch 4/5:  90%|█████████ | 1988/2208 [11:53<01:17,  2.85it/s][A
Epoch 4/5:  90%|█████████ | 1989/2208 [11:54<01:18,  2.79it/s][A
Epoch 4/5:  90%|█████████ | 1990/2208 [11:54<01:18,  2.76it/s][A
Epoch 4/5:  90%|█████████ | 1991/2208 [11:55<01:18,  2.76it/s][A
Epoch 4/5

Batch 2000: Training accuracy = 0.8125, F1 = 0.8052, Precision = 0.8086, Recall = 0.8125



Epoch 4/5:  91%|█████████ | 2002/2208 [11:59<01:16,  2.68it/s][A
Epoch 4/5:  91%|█████████ | 2003/2208 [11:59<01:14,  2.75it/s][A
Epoch 4/5:  91%|█████████ | 2004/2208 [11:59<01:12,  2.80it/s][A
Epoch 4/5:  91%|█████████ | 2005/2208 [12:00<01:13,  2.77it/s][A
Epoch 4/5:  91%|█████████ | 2006/2208 [12:00<01:13,  2.76it/s][A
Epoch 4/5:  91%|█████████ | 2007/2208 [12:00<01:12,  2.76it/s][A
Epoch 4/5:  91%|█████████ | 2008/2208 [12:01<01:11,  2.80it/s][A
Epoch 4/5:  91%|█████████ | 2009/2208 [12:01<01:11,  2.77it/s][A
Epoch 4/5:  91%|█████████ | 2010/2208 [12:01<01:12,  2.73it/s][A
Epoch 4/5:  91%|█████████ | 2011/2208 [12:02<01:10,  2.80it/s][A
Epoch 4/5:  91%|█████████ | 2012/2208 [12:02<01:10,  2.80it/s][A
Epoch 4/5:  91%|█████████ | 2013/2208 [12:03<01:09,  2.82it/s][A
Epoch 4/5:  91%|█████████ | 2014/2208 [12:03<01:08,  2.84it/s][A
Epoch 4/5:  91%|█████████▏| 2015/2208 [12:03<01:08,  2.83it/s][A
Epoch 4/5:  91%|█████████▏| 2016/2208 [12:04<01:08,  2.80it/s][A
Epoch 4/5

Batch 2025: Training accuracy = 0.8750, F1 = 0.8684, Precision = 0.8740, Recall = 0.8750



Epoch 4/5:  92%|█████████▏| 2027/2208 [12:08<01:05,  2.74it/s][A
Epoch 4/5:  92%|█████████▏| 2028/2208 [12:08<01:04,  2.79it/s][A
Epoch 4/5:  92%|█████████▏| 2029/2208 [12:08<01:04,  2.78it/s][A
Epoch 4/5:  92%|█████████▏| 2030/2208 [12:09<01:05,  2.71it/s][A
Epoch 4/5:  92%|█████████▏| 2031/2208 [12:09<01:03,  2.77it/s][A
Epoch 4/5:  92%|█████████▏| 2032/2208 [12:09<01:04,  2.74it/s][A
Epoch 4/5:  92%|█████████▏| 2033/2208 [12:10<01:02,  2.81it/s][A
Epoch 4/5:  92%|█████████▏| 2034/2208 [12:10<01:01,  2.85it/s][A
Epoch 4/5:  92%|█████████▏| 2035/2208 [12:10<01:02,  2.75it/s][A
Epoch 4/5:  92%|█████████▏| 2036/2208 [12:11<01:02,  2.75it/s][A
Epoch 4/5:  92%|█████████▏| 2037/2208 [12:11<01:01,  2.78it/s][A
Epoch 4/5:  92%|█████████▏| 2038/2208 [12:12<01:01,  2.75it/s][A
Epoch 4/5:  92%|█████████▏| 2039/2208 [12:12<01:01,  2.73it/s][A
Epoch 4/5:  92%|█████████▏| 2040/2208 [12:12<01:00,  2.79it/s][A
Epoch 4/5:  92%|█████████▏| 2041/2208 [12:13<00:59,  2.82it/s][A
Epoch 4/5

Batch 2050: Training accuracy = 0.8750, F1 = 0.8625, Precision = 0.8698, Recall = 0.8750



Epoch 4/5:  93%|█████████▎| 2052/2208 [12:17<00:56,  2.74it/s][A
Epoch 4/5:  93%|█████████▎| 2053/2208 [12:17<00:55,  2.79it/s][A
Epoch 4/5:  93%|█████████▎| 2054/2208 [12:17<00:56,  2.75it/s][A
Epoch 4/5:  93%|█████████▎| 2055/2208 [12:18<00:54,  2.81it/s][A
Epoch 4/5:  93%|█████████▎| 2056/2208 [12:18<00:54,  2.77it/s][A
Epoch 4/5:  93%|█████████▎| 2057/2208 [12:18<00:54,  2.79it/s][A
Epoch 4/5:  93%|█████████▎| 2058/2208 [12:19<00:54,  2.77it/s][A
Epoch 4/5:  93%|█████████▎| 2059/2208 [12:19<00:54,  2.73it/s][A
Epoch 4/5:  93%|█████████▎| 2060/2208 [12:20<00:53,  2.78it/s][A
Epoch 4/5:  93%|█████████▎| 2061/2208 [12:20<00:51,  2.83it/s][A
Epoch 4/5:  93%|█████████▎| 2062/2208 [12:20<00:52,  2.79it/s][A
Epoch 4/5:  93%|█████████▎| 2063/2208 [12:21<00:51,  2.83it/s][A
Epoch 4/5:  93%|█████████▎| 2064/2208 [12:21<00:51,  2.77it/s][A
Epoch 4/5:  94%|█████████▎| 2065/2208 [12:21<00:52,  2.71it/s][A
Epoch 4/5:  94%|█████████▎| 2066/2208 [12:22<00:51,  2.74it/s][A
Epoch 4/5

Batch 2075: Training accuracy = 0.8828, F1 = 0.8693, Precision = 0.8750, Recall = 0.8828



Epoch 4/5:  94%|█████████▍| 2077/2208 [12:26<00:45,  2.85it/s][A
Epoch 4/5:  94%|█████████▍| 2078/2208 [12:26<00:46,  2.81it/s][A
Epoch 4/5:  94%|█████████▍| 2079/2208 [12:26<00:45,  2.81it/s][A
Epoch 4/5:  94%|█████████▍| 2080/2208 [12:27<00:45,  2.84it/s][A
Epoch 4/5:  94%|█████████▍| 2081/2208 [12:27<00:45,  2.82it/s][A
Epoch 4/5:  94%|█████████▍| 2082/2208 [12:27<00:44,  2.81it/s][A
Epoch 4/5:  94%|█████████▍| 2083/2208 [12:28<00:44,  2.84it/s][A
Epoch 4/5:  94%|█████████▍| 2084/2208 [12:28<00:43,  2.87it/s][A
Epoch 4/5:  94%|█████████▍| 2085/2208 [12:28<00:42,  2.88it/s][A
Epoch 4/5:  94%|█████████▍| 2086/2208 [12:29<00:43,  2.77it/s][A
Epoch 4/5:  95%|█████████▍| 2087/2208 [12:29<00:43,  2.78it/s][A
Epoch 4/5:  95%|█████████▍| 2088/2208 [12:29<00:42,  2.81it/s][A
Epoch 4/5:  95%|█████████▍| 2089/2208 [12:30<00:43,  2.77it/s][A
Epoch 4/5:  95%|█████████▍| 2090/2208 [12:30<00:42,  2.80it/s][A
Epoch 4/5:  95%|█████████▍| 2091/2208 [12:31<00:42,  2.77it/s][A
Epoch 4/5

Batch 2100: Training accuracy = 0.8672, F1 = 0.8737, Precision = 0.8984, Recall = 0.8672



Epoch 4/5:  95%|█████████▌| 2102/2208 [12:35<00:38,  2.78it/s][A
Epoch 4/5:  95%|█████████▌| 2103/2208 [12:35<00:37,  2.77it/s][A
Epoch 4/5:  95%|█████████▌| 2104/2208 [12:35<00:37,  2.74it/s][A
Epoch 4/5:  95%|█████████▌| 2105/2208 [12:36<00:37,  2.77it/s][A
Epoch 4/5:  95%|█████████▌| 2106/2208 [12:36<00:37,  2.74it/s][A
Epoch 4/5:  95%|█████████▌| 2107/2208 [12:36<00:36,  2.78it/s][A
Epoch 4/5:  95%|█████████▌| 2108/2208 [12:37<00:36,  2.77it/s][A
Epoch 4/5:  96%|█████████▌| 2109/2208 [12:37<00:35,  2.78it/s][A
Epoch 4/5:  96%|█████████▌| 2110/2208 [12:37<00:34,  2.82it/s][A
Epoch 4/5:  96%|█████████▌| 2111/2208 [12:38<00:34,  2.85it/s][A
Epoch 4/5:  96%|█████████▌| 2112/2208 [12:38<00:33,  2.88it/s][A
Epoch 4/5:  96%|█████████▌| 2113/2208 [12:38<00:33,  2.84it/s][A
Epoch 4/5:  96%|█████████▌| 2114/2208 [12:39<00:33,  2.80it/s][A
Epoch 4/5:  96%|█████████▌| 2115/2208 [12:39<00:32,  2.84it/s][A
Epoch 4/5:  96%|█████████▌| 2116/2208 [12:40<00:32,  2.82it/s][A
Epoch 4/5

Batch 2125: Training accuracy = 0.8828, F1 = 0.8677, Precision = 0.8681, Recall = 0.8828



Epoch 4/5:  96%|█████████▋| 2127/2208 [12:43<00:28,  2.85it/s][A
Epoch 4/5:  96%|█████████▋| 2128/2208 [12:44<00:27,  2.88it/s][A
Epoch 4/5:  96%|█████████▋| 2129/2208 [12:44<00:27,  2.89it/s][A
Epoch 4/5:  96%|█████████▋| 2130/2208 [12:45<00:27,  2.84it/s][A
Epoch 4/5:  97%|█████████▋| 2131/2208 [12:45<00:26,  2.87it/s][A
Epoch 4/5:  97%|█████████▋| 2132/2208 [12:45<00:26,  2.86it/s][A
Epoch 4/5:  97%|█████████▋| 2133/2208 [12:46<00:26,  2.83it/s][A
Epoch 4/5:  97%|█████████▋| 2134/2208 [12:46<00:26,  2.78it/s][A
Epoch 4/5:  97%|█████████▋| 2135/2208 [12:46<00:26,  2.80it/s][A
Epoch 4/5:  97%|█████████▋| 2136/2208 [12:47<00:25,  2.80it/s][A
Epoch 4/5:  97%|█████████▋| 2137/2208 [12:47<00:25,  2.84it/s][A
Epoch 4/5:  97%|█████████▋| 2138/2208 [12:47<00:24,  2.82it/s][A
Epoch 4/5:  97%|█████████▋| 2139/2208 [12:48<00:25,  2.74it/s][A
Epoch 4/5:  97%|█████████▋| 2140/2208 [12:48<00:25,  2.69it/s][A
Epoch 4/5:  97%|█████████▋| 2141/2208 [12:49<00:25,  2.66it/s][A
Epoch 4/5

Batch 2150: Training accuracy = 0.9375, F1 = 0.9323, Precision = 0.9297, Recall = 0.9375



Epoch 4/5:  97%|█████████▋| 2152/2208 [12:53<00:20,  2.77it/s][A
Epoch 4/5:  98%|█████████▊| 2153/2208 [12:53<00:20,  2.74it/s][A
Epoch 4/5:  98%|█████████▊| 2154/2208 [12:53<00:19,  2.79it/s][A
Epoch 4/5:  98%|█████████▊| 2155/2208 [12:54<00:19,  2.78it/s][A
Epoch 4/5:  98%|█████████▊| 2156/2208 [12:54<00:18,  2.80it/s][A
Epoch 4/5:  98%|█████████▊| 2157/2208 [12:54<00:18,  2.82it/s][A
Epoch 4/5:  98%|█████████▊| 2158/2208 [12:55<00:17,  2.82it/s][A
Epoch 4/5:  98%|█████████▊| 2159/2208 [12:55<00:17,  2.85it/s][A
Epoch 4/5:  98%|█████████▊| 2160/2208 [12:55<00:17,  2.79it/s][A
Epoch 4/5:  98%|█████████▊| 2161/2208 [12:56<00:16,  2.84it/s][A
Epoch 4/5:  98%|█████████▊| 2162/2208 [12:56<00:16,  2.84it/s][A
Epoch 4/5:  98%|█████████▊| 2163/2208 [12:56<00:15,  2.83it/s][A
Epoch 4/5:  98%|█████████▊| 2164/2208 [12:57<00:15,  2.83it/s][A
Epoch 4/5:  98%|█████████▊| 2165/2208 [12:57<00:15,  2.84it/s][A
Epoch 4/5:  98%|█████████▊| 2166/2208 [12:58<00:14,  2.87it/s][A
Epoch 4/5

Batch 2175: Training accuracy = 0.8672, F1 = 0.8688, Precision = 0.8932, Recall = 0.8672



Epoch 4/5:  99%|█████████▊| 2177/2208 [13:01<00:11,  2.79it/s][A
Epoch 4/5:  99%|█████████▊| 2178/2208 [13:02<00:10,  2.75it/s][A
Epoch 4/5:  99%|█████████▊| 2179/2208 [13:02<00:10,  2.79it/s][A
Epoch 4/5:  99%|█████████▊| 2180/2208 [13:02<00:10,  2.79it/s][A
Epoch 4/5:  99%|█████████▉| 2181/2208 [13:03<00:09,  2.78it/s][A
Epoch 4/5:  99%|█████████▉| 2182/2208 [13:03<00:09,  2.81it/s][A
Epoch 4/5:  99%|█████████▉| 2183/2208 [13:04<00:08,  2.83it/s][A
Epoch 4/5:  99%|█████████▉| 2184/2208 [13:04<00:08,  2.79it/s][A
Epoch 4/5:  99%|█████████▉| 2185/2208 [13:04<00:08,  2.72it/s][A
Epoch 4/5:  99%|█████████▉| 2186/2208 [13:05<00:08,  2.65it/s][A
Epoch 4/5:  99%|█████████▉| 2187/2208 [13:05<00:07,  2.72it/s][A
Epoch 4/5:  99%|█████████▉| 2188/2208 [13:05<00:07,  2.71it/s][A
Epoch 4/5:  99%|█████████▉| 2189/2208 [13:06<00:06,  2.78it/s][A
Epoch 4/5:  99%|█████████▉| 2190/2208 [13:06<00:06,  2.80it/s][A
Epoch 4/5:  99%|█████████▉| 2191/2208 [13:06<00:06,  2.79it/s][A
Epoch 4/5

Batch 2200: Training accuracy = 0.8594, F1 = 0.8491, Precision = 0.8568, Recall = 0.8594



Epoch 4/5: 100%|█████████▉| 2202/2208 [13:10<00:02,  2.81it/s][A
Epoch 4/5: 100%|█████████▉| 2203/2208 [13:11<00:01,  2.84it/s][A
Epoch 4/5: 100%|█████████▉| 2204/2208 [13:11<00:01,  2.85it/s][A
Epoch 4/5: 100%|█████████▉| 2205/2208 [13:11<00:01,  2.86it/s][A
Epoch 4/5: 100%|█████████▉| 2206/2208 [13:12<00:00,  2.88it/s][A
Epoch 4/5: 100%|█████████▉| 2207/2208 [13:12<00:00,  2.90it/s][A
Epoch 4/5: 100%|██████████| 2208/2208 [13:12<00:00,  2.92it/s][A
                                                              [A


Epoch 4 training accuracy: 0.87%
Epoch 4 training F1 score: 0.8722
Epoch 4 training precision: 0.8831
Epoch 4 training recall: 0.8657

Starting validation...



Validation:   0%|          | 0/552 [00:00<?, ?it/s][A
Validation:   0%|          | 1/552 [00:01<15:04,  1.64s/it][A
Validation:   1%|          | 3/552 [00:01<04:21,  2.10it/s][A
Validation:   1%|          | 5/552 [00:02<02:50,  3.21it/s][A
Validation:   2%|▏         | 9/552 [00:02<01:19,  6.84it/s][A
Validation:   2%|▏         | 12/552 [00:02<00:57,  9.47it/s][A
Validation:   3%|▎         | 14/552 [00:02<01:07,  7.99it/s][A
Validation:   3%|▎         | 16/552 [00:02<00:56,  9.56it/s][A
Validation:   3%|▎         | 18/552 [00:03<00:56,  9.52it/s][A
Validation:   4%|▎         | 20/552 [00:03<00:48, 10.99it/s][A
Validation:   4%|▍         | 22/552 [00:03<00:44, 11.90it/s][A
Validation:   4%|▍         | 24/552 [00:03<00:50, 10.49it/s][A
Validation:   5%|▍         | 26/552 [00:03<00:56,  9.34it/s][A
Validation:   5%|▌         | 29/552 [00:03<00:46, 11.15it/s][A
Validation:   6%|▌         | 32/552 [00:04<00:36, 14.13it/s][A
Validation:   6%|▌         | 34/552 [00:04<00:40, 12

Validation accuracy: 0.75%
Validation F1 score: 0.7603
Validation precision: 0.8292
Validation recall: 0.7482

Starting epoch 5/5



  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))

Epoch 5/5:   0%|          | 1/2208 [00:03<1:57:42,  3.20s/it][A

Batch 0: Training accuracy = 0.9141, F1 = 0.9042, Precision = 0.9043, Recall = 0.9141



Epoch 5/5:   0%|          | 2/2208 [00:03<55:48,  1.52s/it]  [A
Epoch 5/5:   0%|          | 3/2208 [00:03<36:04,  1.02it/s][A
Epoch 5/5:   0%|          | 4/2208 [00:04<26:48,  1.37it/s][A
Epoch 5/5:   0%|          | 5/2208 [00:04<21:47,  1.69it/s][A
Epoch 5/5:   0%|          | 6/2208 [00:04<18:57,  1.94it/s][A
Epoch 5/5:   0%|          | 7/2208 [00:05<16:56,  2.17it/s][A
Epoch 5/5:   0%|          | 8/2208 [00:05<15:32,  2.36it/s][A
Epoch 5/5:   0%|          | 9/2208 [00:05<14:33,  2.52it/s][A
Epoch 5/5:   0%|          | 10/2208 [00:06<14:01,  2.61it/s][A
Epoch 5/5:   0%|          | 11/2208 [00:06<13:33,  2.70it/s][A
Epoch 5/5:   1%|          | 12/2208 [00:07<13:30,  2.71it/s][A
Epoch 5/5:   1%|          | 13/2208 [00:07<13:09,  2.78it/s][A
Epoch 5/5:   1%|          | 14/2208 [00:07<13:07,  2.79it/s][A
Epoch 5/5:   1%|          | 15/2208 [00:08<12:56,  2.82it/s][A
Epoch 5/5:   1%|          | 16/2208 [00:08<13:09,  2.78it/s][A
Epoch 5/5:   1%|          | 17/2208 [00:08<12

Batch 25: Training accuracy = 0.8984, F1 = 0.8953, Precision = 0.9010, Recall = 0.8984



Epoch 5/5:   1%|          | 27/2208 [00:12<12:56,  2.81it/s][A
Epoch 5/5:   1%|▏         | 28/2208 [00:12<12:49,  2.83it/s][A
Epoch 5/5:   1%|▏         | 29/2208 [00:13<12:42,  2.86it/s][A
Epoch 5/5:   1%|▏         | 30/2208 [00:13<12:50,  2.83it/s][A
Epoch 5/5:   1%|▏         | 31/2208 [00:13<13:06,  2.77it/s][A
Epoch 5/5:   1%|▏         | 32/2208 [00:14<13:15,  2.74it/s][A
Epoch 5/5:   1%|▏         | 33/2208 [00:14<13:01,  2.78it/s][A
Epoch 5/5:   2%|▏         | 34/2208 [00:14<12:53,  2.81it/s][A
Epoch 5/5:   2%|▏         | 35/2208 [00:15<12:52,  2.81it/s][A
Epoch 5/5:   2%|▏         | 36/2208 [00:15<12:40,  2.86it/s][A
Epoch 5/5:   2%|▏         | 37/2208 [00:15<12:33,  2.88it/s][A
Epoch 5/5:   2%|▏         | 38/2208 [00:16<12:26,  2.91it/s][A
Epoch 5/5:   2%|▏         | 39/2208 [00:16<12:40,  2.85it/s][A
Epoch 5/5:   2%|▏         | 40/2208 [00:16<12:34,  2.87it/s][A
Epoch 5/5:   2%|▏         | 41/2208 [00:17<12:33,  2.88it/s][A
Epoch 5/5:   2%|▏         | 42/2208 [00

Batch 50: Training accuracy = 0.8750, F1 = 0.8622, Precision = 0.8613, Recall = 0.8750



Epoch 5/5:   2%|▏         | 52/2208 [00:21<12:42,  2.83it/s][A
Epoch 5/5:   2%|▏         | 53/2208 [00:21<12:36,  2.85it/s][A
Epoch 5/5:   2%|▏         | 54/2208 [00:21<12:28,  2.88it/s][A
Epoch 5/5:   2%|▏         | 55/2208 [00:22<12:23,  2.89it/s][A
Epoch 5/5:   3%|▎         | 56/2208 [00:22<12:21,  2.90it/s][A
Epoch 5/5:   3%|▎         | 57/2208 [00:22<12:35,  2.85it/s][A
Epoch 5/5:   3%|▎         | 58/2208 [00:23<12:27,  2.87it/s][A
Epoch 5/5:   3%|▎         | 59/2208 [00:23<12:32,  2.86it/s][A
Epoch 5/5:   3%|▎         | 60/2208 [00:23<12:29,  2.87it/s][A
Epoch 5/5:   3%|▎         | 61/2208 [00:24<12:22,  2.89it/s][A
Epoch 5/5:   3%|▎         | 62/2208 [00:24<12:33,  2.85it/s][A
Epoch 5/5:   3%|▎         | 63/2208 [00:25<12:30,  2.86it/s][A
Epoch 5/5:   3%|▎         | 64/2208 [00:25<12:37,  2.83it/s][A
Epoch 5/5:   3%|▎         | 65/2208 [00:25<12:46,  2.79it/s][A
Epoch 5/5:   3%|▎         | 66/2208 [00:26<12:34,  2.84it/s][A
Epoch 5/5:   3%|▎         | 67/2208 [00

Batch 75: Training accuracy = 0.8125, F1 = 0.7969, Precision = 0.8078, Recall = 0.8125



Epoch 5/5:   3%|▎         | 77/2208 [00:29<12:12,  2.91it/s][A
Epoch 5/5:   4%|▎         | 78/2208 [00:30<12:28,  2.84it/s][A
Epoch 5/5:   4%|▎         | 79/2208 [00:30<12:29,  2.84it/s][A
Epoch 5/5:   4%|▎         | 80/2208 [00:31<12:23,  2.86it/s][A
Epoch 5/5:   4%|▎         | 81/2208 [00:31<12:37,  2.81it/s][A
Epoch 5/5:   4%|▎         | 82/2208 [00:31<12:50,  2.76it/s][A
Epoch 5/5:   4%|▍         | 83/2208 [00:32<12:42,  2.79it/s][A
Epoch 5/5:   4%|▍         | 84/2208 [00:32<13:02,  2.71it/s][A
Epoch 5/5:   4%|▍         | 85/2208 [00:32<12:45,  2.77it/s][A
Epoch 5/5:   4%|▍         | 86/2208 [00:33<12:30,  2.83it/s][A
Epoch 5/5:   4%|▍         | 87/2208 [00:33<12:22,  2.86it/s][A
Epoch 5/5:   4%|▍         | 88/2208 [00:33<12:22,  2.85it/s][A
Epoch 5/5:   4%|▍         | 89/2208 [00:34<12:36,  2.80it/s][A
Epoch 5/5:   4%|▍         | 90/2208 [00:34<12:29,  2.82it/s][A
Epoch 5/5:   4%|▍         | 91/2208 [00:34<12:23,  2.85it/s][A
Epoch 5/5:   4%|▍         | 92/2208 [00

Batch 100: Training accuracy = 0.8906, F1 = 0.8945, Precision = 0.9128, Recall = 0.8906



Epoch 5/5:   5%|▍         | 102/2208 [00:38<12:40,  2.77it/s][A
Epoch 5/5:   5%|▍         | 103/2208 [00:39<12:36,  2.78it/s][A
Epoch 5/5:   5%|▍         | 104/2208 [00:39<12:55,  2.71it/s][A
Epoch 5/5:   5%|▍         | 105/2208 [00:40<13:15,  2.64it/s][A
Epoch 5/5:   5%|▍         | 106/2208 [00:40<12:51,  2.73it/s][A
Epoch 5/5:   5%|▍         | 107/2208 [00:40<13:05,  2.68it/s][A
Epoch 5/5:   5%|▍         | 108/2208 [00:41<13:02,  2.68it/s][A
Epoch 5/5:   5%|▍         | 109/2208 [00:41<12:40,  2.76it/s][A
Epoch 5/5:   5%|▍         | 110/2208 [00:41<12:42,  2.75it/s][A
Epoch 5/5:   5%|▌         | 111/2208 [00:42<12:51,  2.72it/s][A
Epoch 5/5:   5%|▌         | 112/2208 [00:42<12:56,  2.70it/s][A
Epoch 5/5:   5%|▌         | 113/2208 [00:42<13:05,  2.67it/s][A
Epoch 5/5:   5%|▌         | 114/2208 [00:43<13:00,  2.68it/s][A
Epoch 5/5:   5%|▌         | 115/2208 [00:43<12:38,  2.76it/s][A
Epoch 5/5:   5%|▌         | 116/2208 [00:44<12:30,  2.79it/s][A
Epoch 5/5:   5%|▌       

Batch 125: Training accuracy = 0.8672, F1 = 0.8633, Precision = 0.8776, Recall = 0.8672



Epoch 5/5:   6%|▌         | 127/2208 [00:47<12:16,  2.82it/s][A
Epoch 5/5:   6%|▌         | 128/2208 [00:48<12:12,  2.84it/s][A
Epoch 5/5:   6%|▌         | 129/2208 [00:48<12:22,  2.80it/s][A
Epoch 5/5:   6%|▌         | 130/2208 [00:48<12:23,  2.79it/s][A
Epoch 5/5:   6%|▌         | 131/2208 [00:49<12:24,  2.79it/s][A
Epoch 5/5:   6%|▌         | 132/2208 [00:49<12:21,  2.80it/s][A
Epoch 5/5:   6%|▌         | 133/2208 [00:50<12:11,  2.84it/s][A
Epoch 5/5:   6%|▌         | 134/2208 [00:50<12:16,  2.82it/s][A
Epoch 5/5:   6%|▌         | 135/2208 [00:50<12:26,  2.78it/s][A
Epoch 5/5:   6%|▌         | 136/2208 [00:51<12:18,  2.81it/s][A
Epoch 5/5:   6%|▌         | 137/2208 [00:51<12:25,  2.78it/s][A
Epoch 5/5:   6%|▋         | 138/2208 [00:51<12:15,  2.82it/s][A
Epoch 5/5:   6%|▋         | 139/2208 [00:52<12:09,  2.84it/s][A
Epoch 5/5:   6%|▋         | 140/2208 [00:52<12:30,  2.76it/s][A
Epoch 5/5:   6%|▋         | 141/2208 [00:52<12:21,  2.79it/s][A
Epoch 5/5:   6%|▋       

Batch 150: Training accuracy = 0.8984, F1 = 0.8924, Precision = 0.8971, Recall = 0.8984



Epoch 5/5:   7%|▋         | 152/2208 [00:57<12:53,  2.66it/s][A
Epoch 5/5:   7%|▋         | 153/2208 [00:57<12:48,  2.67it/s][A
Epoch 5/5:   7%|▋         | 154/2208 [00:57<12:42,  2.70it/s][A
Epoch 5/5:   7%|▋         | 155/2208 [00:58<12:28,  2.74it/s][A
Epoch 5/5:   7%|▋         | 156/2208 [00:58<12:33,  2.72it/s][A
Epoch 5/5:   7%|▋         | 157/2208 [00:58<12:29,  2.74it/s][A
Epoch 5/5:   7%|▋         | 158/2208 [00:59<12:17,  2.78it/s][A
Epoch 5/5:   7%|▋         | 159/2208 [00:59<12:09,  2.81it/s][A
Epoch 5/5:   7%|▋         | 160/2208 [00:59<12:03,  2.83it/s][A
Epoch 5/5:   7%|▋         | 161/2208 [01:00<11:58,  2.85it/s][A
Epoch 5/5:   7%|▋         | 162/2208 [01:00<12:10,  2.80it/s][A
Epoch 5/5:   7%|▋         | 163/2208 [01:00<11:58,  2.85it/s][A
Epoch 5/5:   7%|▋         | 164/2208 [01:01<12:00,  2.84it/s][A
Epoch 5/5:   7%|▋         | 165/2208 [01:01<11:51,  2.87it/s][A
Epoch 5/5:   8%|▊         | 166/2208 [01:02<12:01,  2.83it/s][A
Epoch 5/5:   8%|▊       

Batch 175: Training accuracy = 0.8594, F1 = 0.8568, Precision = 0.8763, Recall = 0.8594



Epoch 5/5:   8%|▊         | 177/2208 [01:05<12:10,  2.78it/s][A
Epoch 5/5:   8%|▊         | 178/2208 [01:06<12:18,  2.75it/s][A
Epoch 5/5:   8%|▊         | 179/2208 [01:06<12:34,  2.69it/s][A
Epoch 5/5:   8%|▊         | 180/2208 [01:07<12:26,  2.72it/s][A
Epoch 5/5:   8%|▊         | 181/2208 [01:07<12:12,  2.77it/s][A
Epoch 5/5:   8%|▊         | 182/2208 [01:07<12:29,  2.70it/s][A
Epoch 5/5:   8%|▊         | 183/2208 [01:08<12:12,  2.77it/s][A
Epoch 5/5:   8%|▊         | 184/2208 [01:08<12:02,  2.80it/s][A
Epoch 5/5:   8%|▊         | 185/2208 [01:08<11:53,  2.83it/s][A
Epoch 5/5:   8%|▊         | 186/2208 [01:09<12:02,  2.80it/s][A
Epoch 5/5:   8%|▊         | 187/2208 [01:09<12:12,  2.76it/s][A
Epoch 5/5:   9%|▊         | 188/2208 [01:09<12:10,  2.77it/s][A
Epoch 5/5:   9%|▊         | 189/2208 [01:10<12:20,  2.73it/s][A
Epoch 5/5:   9%|▊         | 190/2208 [01:10<12:25,  2.71it/s][A
Epoch 5/5:   9%|▊         | 191/2208 [01:11<12:54,  2.60it/s][A
Epoch 5/5:   9%|▊       

Batch 200: Training accuracy = 0.8516, F1 = 0.8411, Precision = 0.8438, Recall = 0.8516



Epoch 5/5:   9%|▉         | 202/2208 [01:15<11:44,  2.85it/s][A
Epoch 5/5:   9%|▉         | 203/2208 [01:15<11:38,  2.87it/s][A
Epoch 5/5:   9%|▉         | 204/2208 [01:15<12:05,  2.76it/s][A
Epoch 5/5:   9%|▉         | 205/2208 [01:16<11:54,  2.81it/s][A
Epoch 5/5:   9%|▉         | 206/2208 [01:16<12:07,  2.75it/s][A
Epoch 5/5:   9%|▉         | 207/2208 [01:16<12:01,  2.77it/s][A
Epoch 5/5:   9%|▉         | 208/2208 [01:17<12:27,  2.68it/s][A
Epoch 5/5:   9%|▉         | 209/2208 [01:17<12:05,  2.76it/s][A
Epoch 5/5:  10%|▉         | 210/2208 [01:17<11:53,  2.80it/s][A
Epoch 5/5:  10%|▉         | 211/2208 [01:18<11:48,  2.82it/s][A
Epoch 5/5:  10%|▉         | 212/2208 [01:18<11:48,  2.82it/s][A
Epoch 5/5:  10%|▉         | 213/2208 [01:18<11:42,  2.84it/s][A
Epoch 5/5:  10%|▉         | 214/2208 [01:19<11:35,  2.87it/s][A
Epoch 5/5:  10%|▉         | 215/2208 [01:19<11:34,  2.87it/s][A
Epoch 5/5:  10%|▉         | 216/2208 [01:19<11:33,  2.87it/s][A
Epoch 5/5:  10%|▉       

Batch 225: Training accuracy = 0.8594, F1 = 0.8521, Precision = 0.8629, Recall = 0.8594



Epoch 5/5:  10%|█         | 227/2208 [01:24<11:59,  2.75it/s][A
Epoch 5/5:  10%|█         | 228/2208 [01:24<11:46,  2.80it/s][A
Epoch 5/5:  10%|█         | 229/2208 [01:24<11:52,  2.78it/s][A
Epoch 5/5:  10%|█         | 230/2208 [01:25<11:49,  2.79it/s][A
Epoch 5/5:  10%|█         | 231/2208 [01:25<12:04,  2.73it/s][A
Epoch 5/5:  11%|█         | 232/2208 [01:25<12:21,  2.66it/s][A
Epoch 5/5:  11%|█         | 233/2208 [01:26<12:08,  2.71it/s][A
Epoch 5/5:  11%|█         | 234/2208 [01:26<11:58,  2.75it/s][A
Epoch 5/5:  11%|█         | 235/2208 [01:26<12:06,  2.72it/s][A
Epoch 5/5:  11%|█         | 236/2208 [01:27<12:00,  2.74it/s][A
Epoch 5/5:  11%|█         | 237/2208 [01:27<11:48,  2.78it/s][A
Epoch 5/5:  11%|█         | 238/2208 [01:28<11:43,  2.80it/s][A
Epoch 5/5:  11%|█         | 239/2208 [01:28<11:48,  2.78it/s][A
Epoch 5/5:  11%|█         | 240/2208 [01:28<11:49,  2.77it/s][A
Epoch 5/5:  11%|█         | 241/2208 [01:29<12:03,  2.72it/s][A
Epoch 5/5:  11%|█       

Batch 250: Training accuracy = 0.8047, F1 = 0.7977, Precision = 0.8060, Recall = 0.8047



Epoch 5/5:  11%|█▏        | 252/2208 [01:33<11:36,  2.81it/s][A
Epoch 5/5:  11%|█▏        | 253/2208 [01:33<11:39,  2.80it/s][A
Epoch 5/5:  12%|█▏        | 254/2208 [01:33<11:29,  2.83it/s][A
Epoch 5/5:  12%|█▏        | 255/2208 [01:34<11:21,  2.87it/s][A
Epoch 5/5:  12%|█▏        | 256/2208 [01:34<11:19,  2.87it/s][A
Epoch 5/5:  12%|█▏        | 257/2208 [01:34<11:28,  2.83it/s][A
Epoch 5/5:  12%|█▏        | 258/2208 [01:35<11:20,  2.87it/s][A
Epoch 5/5:  12%|█▏        | 259/2208 [01:35<11:49,  2.75it/s][A
Epoch 5/5:  12%|█▏        | 260/2208 [01:35<11:49,  2.75it/s][A
Epoch 5/5:  12%|█▏        | 261/2208 [01:36<11:40,  2.78it/s][A
Epoch 5/5:  12%|█▏        | 262/2208 [01:36<11:35,  2.80it/s][A
Epoch 5/5:  12%|█▏        | 263/2208 [01:36<11:27,  2.83it/s][A
Epoch 5/5:  12%|█▏        | 264/2208 [01:37<11:33,  2.80it/s][A
Epoch 5/5:  12%|█▏        | 265/2208 [01:37<11:28,  2.82it/s][A
Epoch 5/5:  12%|█▏        | 266/2208 [01:38<11:22,  2.85it/s][A
Epoch 5/5:  12%|█▏      

Batch 275: Training accuracy = 0.9062, F1 = 0.8917, Precision = 0.8878, Recall = 0.9062



Epoch 5/5:  13%|█▎        | 277/2208 [01:42<11:30,  2.80it/s][A
Epoch 5/5:  13%|█▎        | 278/2208 [01:42<11:38,  2.76it/s][A
Epoch 5/5:  13%|█▎        | 279/2208 [01:42<11:50,  2.71it/s][A
Epoch 5/5:  13%|█▎        | 280/2208 [01:43<11:49,  2.72it/s][A
Epoch 5/5:  13%|█▎        | 281/2208 [01:43<11:43,  2.74it/s][A
Epoch 5/5:  13%|█▎        | 282/2208 [01:43<11:27,  2.80it/s][A
Epoch 5/5:  13%|█▎        | 283/2208 [01:44<11:26,  2.80it/s][A
Epoch 5/5:  13%|█▎        | 284/2208 [01:44<11:28,  2.79it/s][A
Epoch 5/5:  13%|█▎        | 285/2208 [01:44<11:19,  2.83it/s][A
Epoch 5/5:  13%|█▎        | 286/2208 [01:45<11:10,  2.87it/s][A
Epoch 5/5:  13%|█▎        | 287/2208 [01:45<11:12,  2.86it/s][A
Epoch 5/5:  13%|█▎        | 288/2208 [01:45<11:08,  2.87it/s][A
Epoch 5/5:  13%|█▎        | 289/2208 [01:46<11:40,  2.74it/s][A
Epoch 5/5:  13%|█▎        | 290/2208 [01:46<11:25,  2.80it/s][A
Epoch 5/5:  13%|█▎        | 291/2208 [01:47<11:17,  2.83it/s][A
Epoch 5/5:  13%|█▎      

Batch 300: Training accuracy = 0.8672, F1 = 0.8552, Precision = 0.8516, Recall = 0.8672



Epoch 5/5:  14%|█▎        | 302/2208 [01:51<11:50,  2.68it/s][A
Epoch 5/5:  14%|█▎        | 303/2208 [01:51<11:30,  2.76it/s][A
Epoch 5/5:  14%|█▍        | 304/2208 [01:51<11:42,  2.71it/s][A
Epoch 5/5:  14%|█▍        | 305/2208 [01:52<11:55,  2.66it/s][A
Epoch 5/5:  14%|█▍        | 306/2208 [01:52<11:44,  2.70it/s][A
Epoch 5/5:  14%|█▍        | 307/2208 [01:52<11:28,  2.76it/s][A
Epoch 5/5:  14%|█▍        | 308/2208 [01:53<11:16,  2.81it/s][A
Epoch 5/5:  14%|█▍        | 309/2208 [01:53<11:23,  2.78it/s][A
Epoch 5/5:  14%|█▍        | 310/2208 [01:53<11:16,  2.80it/s][A
Epoch 5/5:  14%|█▍        | 311/2208 [01:54<11:20,  2.79it/s][A
Epoch 5/5:  14%|█▍        | 312/2208 [01:54<11:28,  2.76it/s][A
Epoch 5/5:  14%|█▍        | 313/2208 [01:55<11:54,  2.65it/s][A
Epoch 5/5:  14%|█▍        | 314/2208 [01:55<11:40,  2.70it/s][A
Epoch 5/5:  14%|█▍        | 315/2208 [01:55<11:41,  2.70it/s][A
Epoch 5/5:  14%|█▍        | 316/2208 [01:56<11:47,  2.67it/s][A
Epoch 5/5:  14%|█▍      

Batch 325: Training accuracy = 0.8516, F1 = 0.8510, Precision = 0.8659, Recall = 0.8516



Epoch 5/5:  15%|█▍        | 327/2208 [02:00<11:21,  2.76it/s][A
Epoch 5/5:  15%|█▍        | 328/2208 [02:00<11:20,  2.76it/s][A
Epoch 5/5:  15%|█▍        | 329/2208 [02:00<11:07,  2.81it/s][A
Epoch 5/5:  15%|█▍        | 330/2208 [02:01<11:00,  2.84it/s][A
Epoch 5/5:  15%|█▍        | 331/2208 [02:01<10:51,  2.88it/s][A
Epoch 5/5:  15%|█▌        | 332/2208 [02:01<10:58,  2.85it/s][A
Epoch 5/5:  15%|█▌        | 333/2208 [02:02<10:59,  2.84it/s][A
Epoch 5/5:  15%|█▌        | 334/2208 [02:02<11:01,  2.83it/s][A
Epoch 5/5:  15%|█▌        | 335/2208 [02:02<10:52,  2.87it/s][A
Epoch 5/5:  15%|█▌        | 336/2208 [02:03<10:50,  2.88it/s][A
Epoch 5/5:  15%|█▌        | 337/2208 [02:03<10:52,  2.87it/s][A
Epoch 5/5:  15%|█▌        | 338/2208 [02:03<10:53,  2.86it/s][A
Epoch 5/5:  15%|█▌        | 339/2208 [02:04<11:04,  2.81it/s][A
Epoch 5/5:  15%|█▌        | 340/2208 [02:04<11:01,  2.82it/s][A
Epoch 5/5:  15%|█▌        | 341/2208 [02:05<11:04,  2.81it/s][A
Epoch 5/5:  15%|█▌      

Batch 350: Training accuracy = 0.8359, F1 = 0.8154, Precision = 0.8099, Recall = 0.8359



Epoch 5/5:  16%|█▌        | 352/2208 [02:09<11:39,  2.65it/s][A
Epoch 5/5:  16%|█▌        | 353/2208 [02:09<11:27,  2.70it/s][A
Epoch 5/5:  16%|█▌        | 354/2208 [02:09<11:11,  2.76it/s][A
Epoch 5/5:  16%|█▌        | 355/2208 [02:10<11:01,  2.80it/s][A
Epoch 5/5:  16%|█▌        | 356/2208 [02:10<11:09,  2.77it/s][A
Epoch 5/5:  16%|█▌        | 357/2208 [02:10<11:18,  2.73it/s][A
Epoch 5/5:  16%|█▌        | 358/2208 [02:11<11:08,  2.77it/s][A
Epoch 5/5:  16%|█▋        | 359/2208 [02:11<11:12,  2.75it/s][A
Epoch 5/5:  16%|█▋        | 360/2208 [02:11<11:22,  2.71it/s][A
Epoch 5/5:  16%|█▋        | 361/2208 [02:12<11:10,  2.75it/s][A
Epoch 5/5:  16%|█▋        | 362/2208 [02:12<11:24,  2.70it/s][A
Epoch 5/5:  16%|█▋        | 363/2208 [02:13<11:13,  2.74it/s][A
Epoch 5/5:  16%|█▋        | 364/2208 [02:13<11:20,  2.71it/s][A
Epoch 5/5:  17%|█▋        | 365/2208 [02:13<11:08,  2.76it/s][A
Epoch 5/5:  17%|█▋        | 366/2208 [02:14<10:54,  2.81it/s][A
Epoch 5/5:  17%|█▋      

Batch 375: Training accuracy = 0.8672, F1 = 0.8536, Precision = 0.8607, Recall = 0.8672



Epoch 5/5:  17%|█▋        | 377/2208 [02:18<11:18,  2.70it/s][A
Epoch 5/5:  17%|█▋        | 378/2208 [02:18<11:00,  2.77it/s][A
Epoch 5/5:  17%|█▋        | 379/2208 [02:18<11:04,  2.75it/s][A
Epoch 5/5:  17%|█▋        | 380/2208 [02:19<10:57,  2.78it/s][A
Epoch 5/5:  17%|█▋        | 381/2208 [02:19<11:04,  2.75it/s][A
Epoch 5/5:  17%|█▋        | 382/2208 [02:19<11:00,  2.76it/s][A
Epoch 5/5:  17%|█▋        | 383/2208 [02:20<10:52,  2.80it/s][A
Epoch 5/5:  17%|█▋        | 384/2208 [02:20<10:44,  2.83it/s][A
Epoch 5/5:  17%|█▋        | 385/2208 [02:20<10:52,  2.79it/s][A
Epoch 5/5:  17%|█▋        | 386/2208 [02:21<10:52,  2.79it/s][A
Epoch 5/5:  18%|█▊        | 387/2208 [02:21<10:58,  2.76it/s][A
Epoch 5/5:  18%|█▊        | 388/2208 [02:21<10:47,  2.81it/s][A
Epoch 5/5:  18%|█▊        | 389/2208 [02:22<10:59,  2.76it/s][A
Epoch 5/5:  18%|█▊        | 390/2208 [02:22<11:00,  2.75it/s][A
Epoch 5/5:  18%|█▊        | 391/2208 [02:23<10:47,  2.81it/s][A
Epoch 5/5:  18%|█▊      

Batch 400: Training accuracy = 0.9141, F1 = 0.9005, Precision = 0.8945, Recall = 0.9141



Epoch 5/5:  18%|█▊        | 402/2208 [02:27<10:44,  2.80it/s][A
Epoch 5/5:  18%|█▊        | 403/2208 [02:27<10:41,  2.81it/s][A
Epoch 5/5:  18%|█▊        | 404/2208 [02:27<10:32,  2.85it/s][A
Epoch 5/5:  18%|█▊        | 405/2208 [02:28<10:36,  2.83it/s][A
Epoch 5/5:  18%|█▊        | 406/2208 [02:28<10:44,  2.79it/s][A
Epoch 5/5:  18%|█▊        | 407/2208 [02:28<10:36,  2.83it/s][A
Epoch 5/5:  18%|█▊        | 408/2208 [02:29<10:47,  2.78it/s][A
Epoch 5/5:  19%|█▊        | 409/2208 [02:29<10:38,  2.82it/s][A
Epoch 5/5:  19%|█▊        | 410/2208 [02:29<10:43,  2.79it/s][A
Epoch 5/5:  19%|█▊        | 411/2208 [02:30<10:49,  2.76it/s][A
Epoch 5/5:  19%|█▊        | 412/2208 [02:30<10:56,  2.73it/s][A
Epoch 5/5:  19%|█▊        | 413/2208 [02:31<11:02,  2.71it/s][A
Epoch 5/5:  19%|█▉        | 414/2208 [02:31<11:01,  2.71it/s][A
Epoch 5/5:  19%|█▉        | 415/2208 [02:31<10:48,  2.76it/s][A
Epoch 5/5:  19%|█▉        | 416/2208 [02:32<10:55,  2.73it/s][A
Epoch 5/5:  19%|█▉      

Batch 425: Training accuracy = 0.8906, F1 = 0.8859, Precision = 0.8984, Recall = 0.8906



Epoch 5/5:  19%|█▉        | 427/2208 [02:36<11:02,  2.69it/s][A
Epoch 5/5:  19%|█▉        | 428/2208 [02:36<10:48,  2.74it/s][A
Epoch 5/5:  19%|█▉        | 429/2208 [02:36<10:52,  2.73it/s][A
Epoch 5/5:  19%|█▉        | 430/2208 [02:37<10:37,  2.79it/s][A
Epoch 5/5:  20%|█▉        | 431/2208 [02:37<10:39,  2.78it/s][A
Epoch 5/5:  20%|█▉        | 432/2208 [02:37<10:41,  2.77it/s][A
Epoch 5/5:  20%|█▉        | 433/2208 [02:38<10:36,  2.79it/s][A
Epoch 5/5:  20%|█▉        | 434/2208 [02:38<10:42,  2.76it/s][A
Epoch 5/5:  20%|█▉        | 435/2208 [02:38<10:47,  2.74it/s][A
Epoch 5/5:  20%|█▉        | 436/2208 [02:39<10:32,  2.80it/s][A
Epoch 5/5:  20%|█▉        | 437/2208 [02:39<10:30,  2.81it/s][A
Epoch 5/5:  20%|█▉        | 438/2208 [02:40<10:26,  2.82it/s][A
Epoch 5/5:  20%|█▉        | 439/2208 [02:40<10:20,  2.85it/s][A
Epoch 5/5:  20%|█▉        | 440/2208 [02:40<10:30,  2.80it/s][A
Epoch 5/5:  20%|█▉        | 441/2208 [02:41<10:25,  2.82it/s][A
Epoch 5/5:  20%|██      

Batch 450: Training accuracy = 0.8594, F1 = 0.8495, Precision = 0.8535, Recall = 0.8594



Epoch 5/5:  20%|██        | 452/2208 [02:45<10:33,  2.77it/s][A
Epoch 5/5:  21%|██        | 453/2208 [02:45<10:39,  2.74it/s][A
Epoch 5/5:  21%|██        | 454/2208 [02:45<10:47,  2.71it/s][A
Epoch 5/5:  21%|██        | 455/2208 [02:46<10:30,  2.78it/s][A
Epoch 5/5:  21%|██        | 456/2208 [02:46<10:20,  2.82it/s][A
Epoch 5/5:  21%|██        | 457/2208 [02:46<10:15,  2.84it/s][A
Epoch 5/5:  21%|██        | 458/2208 [02:47<10:09,  2.87it/s][A
Epoch 5/5:  21%|██        | 459/2208 [02:47<10:32,  2.76it/s][A
Epoch 5/5:  21%|██        | 460/2208 [02:47<10:49,  2.69it/s][A
Epoch 5/5:  21%|██        | 461/2208 [02:48<10:40,  2.73it/s][A
Epoch 5/5:  21%|██        | 462/2208 [02:48<10:41,  2.72it/s][A
Epoch 5/5:  21%|██        | 463/2208 [02:48<10:25,  2.79it/s][A
Epoch 5/5:  21%|██        | 464/2208 [02:49<10:42,  2.72it/s][A
Epoch 5/5:  21%|██        | 465/2208 [02:49<10:43,  2.71it/s][A
Epoch 5/5:  21%|██        | 466/2208 [02:50<10:48,  2.69it/s][A
Epoch 5/5:  21%|██      

Batch 475: Training accuracy = 0.8906, F1 = 0.8818, Precision = 0.8867, Recall = 0.8906



Epoch 5/5:  22%|██▏       | 477/2208 [02:54<10:33,  2.73it/s][A
Epoch 5/5:  22%|██▏       | 478/2208 [02:54<10:22,  2.78it/s][A
Epoch 5/5:  22%|██▏       | 479/2208 [02:54<10:16,  2.81it/s][A
Epoch 5/5:  22%|██▏       | 480/2208 [02:55<10:23,  2.77it/s][A
Epoch 5/5:  22%|██▏       | 481/2208 [02:55<10:27,  2.75it/s][A
Epoch 5/5:  22%|██▏       | 482/2208 [02:55<10:16,  2.80it/s][A
Epoch 5/5:  22%|██▏       | 483/2208 [02:56<10:20,  2.78it/s][A
Epoch 5/5:  22%|██▏       | 484/2208 [02:56<10:10,  2.82it/s][A
Epoch 5/5:  22%|██▏       | 485/2208 [02:57<10:13,  2.81it/s][A
Epoch 5/5:  22%|██▏       | 486/2208 [02:57<10:07,  2.84it/s][A
Epoch 5/5:  22%|██▏       | 487/2208 [02:57<10:11,  2.82it/s][A
Epoch 5/5:  22%|██▏       | 488/2208 [02:58<10:32,  2.72it/s][A
Epoch 5/5:  22%|██▏       | 489/2208 [02:58<10:41,  2.68it/s][A
Epoch 5/5:  22%|██▏       | 490/2208 [02:58<10:23,  2.75it/s][A
Epoch 5/5:  22%|██▏       | 491/2208 [02:59<10:31,  2.72it/s][A
Epoch 5/5:  22%|██▏     

Batch 500: Training accuracy = 0.8281, F1 = 0.8074, Precision = 0.8040, Recall = 0.8281



Epoch 5/5:  23%|██▎       | 502/2208 [03:03<10:32,  2.70it/s][A
Epoch 5/5:  23%|██▎       | 503/2208 [03:03<10:20,  2.75it/s][A
Epoch 5/5:  23%|██▎       | 504/2208 [03:03<10:08,  2.80it/s][A
Epoch 5/5:  23%|██▎       | 505/2208 [03:04<10:16,  2.76it/s][A
Epoch 5/5:  23%|██▎       | 506/2208 [03:04<10:05,  2.81it/s][A
Epoch 5/5:  23%|██▎       | 507/2208 [03:04<10:09,  2.79it/s][A
Epoch 5/5:  23%|██▎       | 508/2208 [03:05<10:00,  2.83it/s][A
Epoch 5/5:  23%|██▎       | 509/2208 [03:05<10:32,  2.69it/s][A
Epoch 5/5:  23%|██▎       | 510/2208 [03:06<10:23,  2.73it/s][A
Epoch 5/5:  23%|██▎       | 511/2208 [03:06<10:17,  2.75it/s][A
Epoch 5/5:  23%|██▎       | 512/2208 [03:06<10:11,  2.77it/s][A
Epoch 5/5:  23%|██▎       | 513/2208 [03:07<10:14,  2.76it/s][A
Epoch 5/5:  23%|██▎       | 514/2208 [03:07<10:20,  2.73it/s][A
Epoch 5/5:  23%|██▎       | 515/2208 [03:07<10:25,  2.71it/s][A
Epoch 5/5:  23%|██▎       | 516/2208 [03:08<10:21,  2.72it/s][A
Epoch 5/5:  23%|██▎     

Batch 525: Training accuracy = 0.8750, F1 = 0.8672, Precision = 0.8796, Recall = 0.8750



Epoch 5/5:  24%|██▍       | 527/2208 [03:12<09:57,  2.81it/s][A
Epoch 5/5:  24%|██▍       | 528/2208 [03:12<09:54,  2.83it/s][A
Epoch 5/5:  24%|██▍       | 529/2208 [03:12<09:59,  2.80it/s][A
Epoch 5/5:  24%|██▍       | 530/2208 [03:13<10:01,  2.79it/s][A
Epoch 5/5:  24%|██▍       | 531/2208 [03:13<09:56,  2.81it/s][A
Epoch 5/5:  24%|██▍       | 532/2208 [03:14<10:03,  2.78it/s][A
Epoch 5/5:  24%|██▍       | 533/2208 [03:14<10:01,  2.79it/s][A
Epoch 5/5:  24%|██▍       | 534/2208 [03:14<10:20,  2.70it/s][A
Epoch 5/5:  24%|██▍       | 535/2208 [03:15<10:17,  2.71it/s][A
Epoch 5/5:  24%|██▍       | 536/2208 [03:15<10:13,  2.72it/s][A
Epoch 5/5:  24%|██▍       | 537/2208 [03:15<10:00,  2.78it/s][A
Epoch 5/5:  24%|██▍       | 538/2208 [03:16<09:54,  2.81it/s][A
Epoch 5/5:  24%|██▍       | 539/2208 [03:16<09:57,  2.80it/s][A
Epoch 5/5:  24%|██▍       | 540/2208 [03:16<09:54,  2.81it/s][A
Epoch 5/5:  25%|██▍       | 541/2208 [03:17<09:55,  2.80it/s][A
Epoch 5/5:  25%|██▍     

Batch 550: Training accuracy = 0.7969, F1 = 0.7764, Precision = 0.7745, Recall = 0.7969



Epoch 5/5:  25%|██▌       | 552/2208 [03:21<10:04,  2.74it/s][A
Epoch 5/5:  25%|██▌       | 553/2208 [03:21<09:56,  2.77it/s][A
Epoch 5/5:  25%|██▌       | 554/2208 [03:21<09:56,  2.78it/s][A
Epoch 5/5:  25%|██▌       | 555/2208 [03:22<09:59,  2.76it/s][A
Epoch 5/5:  25%|██▌       | 556/2208 [03:22<09:52,  2.79it/s][A
Epoch 5/5:  25%|██▌       | 557/2208 [03:23<09:45,  2.82it/s][A
Epoch 5/5:  25%|██▌       | 558/2208 [03:23<09:46,  2.81it/s][A
Epoch 5/5:  25%|██▌       | 559/2208 [03:23<09:45,  2.82it/s][A
Epoch 5/5:  25%|██▌       | 560/2208 [03:24<09:58,  2.75it/s][A
Epoch 5/5:  25%|██▌       | 561/2208 [03:24<09:55,  2.76it/s][A
Epoch 5/5:  25%|██▌       | 562/2208 [03:24<09:48,  2.80it/s][A
Epoch 5/5:  25%|██▌       | 563/2208 [03:25<09:41,  2.83it/s][A
Epoch 5/5:  26%|██▌       | 564/2208 [03:25<09:49,  2.79it/s][A
Epoch 5/5:  26%|██▌       | 565/2208 [03:25<10:04,  2.72it/s][A
Epoch 5/5:  26%|██▌       | 566/2208 [03:26<09:49,  2.78it/s][A
Epoch 5/5:  26%|██▌     

Batch 575: Training accuracy = 0.7969, F1 = 0.7852, Precision = 0.7949, Recall = 0.7969



Epoch 5/5:  26%|██▌       | 577/2208 [03:30<09:21,  2.90it/s][A
Epoch 5/5:  26%|██▌       | 578/2208 [03:30<09:18,  2.92it/s][A
Epoch 5/5:  26%|██▌       | 579/2208 [03:30<09:20,  2.91it/s][A
Epoch 5/5:  26%|██▋       | 580/2208 [03:31<09:29,  2.86it/s][A
Epoch 5/5:  26%|██▋       | 581/2208 [03:31<09:41,  2.80it/s][A
Epoch 5/5:  26%|██▋       | 582/2208 [03:31<09:38,  2.81it/s][A
Epoch 5/5:  26%|██▋       | 583/2208 [03:32<09:31,  2.85it/s][A
Epoch 5/5:  26%|██▋       | 584/2208 [03:32<09:41,  2.80it/s][A
Epoch 5/5:  26%|██▋       | 585/2208 [03:33<09:48,  2.76it/s][A
Epoch 5/5:  27%|██▋       | 586/2208 [03:33<09:39,  2.80it/s][A
Epoch 5/5:  27%|██▋       | 587/2208 [03:33<09:39,  2.80it/s][A
Epoch 5/5:  27%|██▋       | 588/2208 [03:34<09:57,  2.71it/s][A
Epoch 5/5:  27%|██▋       | 589/2208 [03:34<10:08,  2.66it/s][A
Epoch 5/5:  27%|██▋       | 590/2208 [03:34<09:58,  2.70it/s][A
Epoch 5/5:  27%|██▋       | 591/2208 [03:35<09:54,  2.72it/s][A
Epoch 5/5:  27%|██▋     

Batch 600: Training accuracy = 0.8594, F1 = 0.8420, Precision = 0.8444, Recall = 0.8594



Epoch 5/5:  27%|██▋       | 602/2208 [03:39<09:31,  2.81it/s][A
Epoch 5/5:  27%|██▋       | 603/2208 [03:39<09:29,  2.82it/s][A
Epoch 5/5:  27%|██▋       | 604/2208 [03:39<09:26,  2.83it/s][A
Epoch 5/5:  27%|██▋       | 605/2208 [03:40<09:21,  2.86it/s][A
Epoch 5/5:  27%|██▋       | 606/2208 [03:40<09:15,  2.88it/s][A
Epoch 5/5:  27%|██▋       | 607/2208 [03:40<09:11,  2.90it/s][A
Epoch 5/5:  28%|██▊       | 608/2208 [03:41<09:08,  2.92it/s][A
Epoch 5/5:  28%|██▊       | 609/2208 [03:41<09:07,  2.92it/s][A
Epoch 5/5:  28%|██▊       | 610/2208 [03:41<09:06,  2.92it/s][A
Epoch 5/5:  28%|██▊       | 611/2208 [03:42<09:04,  2.93it/s][A
Epoch 5/5:  28%|██▊       | 612/2208 [03:42<09:10,  2.90it/s][A
Epoch 5/5:  28%|██▊       | 613/2208 [03:42<09:15,  2.87it/s][A
Epoch 5/5:  28%|██▊       | 614/2208 [03:43<09:20,  2.84it/s][A
Epoch 5/5:  28%|██▊       | 615/2208 [03:43<09:15,  2.87it/s][A
Epoch 5/5:  28%|██▊       | 616/2208 [03:44<09:30,  2.79it/s][A
Epoch 5/5:  28%|██▊     

Batch 625: Training accuracy = 0.8594, F1 = 0.8370, Precision = 0.8294, Recall = 0.8594



Epoch 5/5:  28%|██▊       | 627/2208 [03:47<09:15,  2.84it/s][A
Epoch 5/5:  28%|██▊       | 628/2208 [03:48<09:10,  2.87it/s][A
Epoch 5/5:  28%|██▊       | 629/2208 [03:48<09:19,  2.82it/s][A
Epoch 5/5:  29%|██▊       | 630/2208 [03:49<09:17,  2.83it/s][A
Epoch 5/5:  29%|██▊       | 631/2208 [03:49<09:19,  2.82it/s][A
Epoch 5/5:  29%|██▊       | 632/2208 [03:49<09:34,  2.75it/s][A
Epoch 5/5:  29%|██▊       | 633/2208 [03:50<09:21,  2.80it/s][A
Epoch 5/5:  29%|██▊       | 634/2208 [03:50<09:17,  2.82it/s][A
Epoch 5/5:  29%|██▉       | 635/2208 [03:50<09:15,  2.83it/s][A
Epoch 5/5:  29%|██▉       | 636/2208 [03:51<09:24,  2.78it/s][A
Epoch 5/5:  29%|██▉       | 637/2208 [03:51<09:38,  2.72it/s][A
Epoch 5/5:  29%|██▉       | 638/2208 [03:51<09:38,  2.71it/s][A
Epoch 5/5:  29%|██▉       | 639/2208 [03:52<09:49,  2.66it/s][A
Epoch 5/5:  29%|██▉       | 640/2208 [03:52<09:51,  2.65it/s][A
Epoch 5/5:  29%|██▉       | 641/2208 [03:53<09:41,  2.69it/s][A
Epoch 5/5:  29%|██▉     

Batch 650: Training accuracy = 0.8672, F1 = 0.8565, Precision = 0.8600, Recall = 0.8672



Epoch 5/5:  30%|██▉       | 652/2208 [03:57<09:10,  2.83it/s][A
Epoch 5/5:  30%|██▉       | 653/2208 [03:57<09:19,  2.78it/s][A
Epoch 5/5:  30%|██▉       | 654/2208 [03:57<09:20,  2.77it/s][A
Epoch 5/5:  30%|██▉       | 655/2208 [03:58<09:31,  2.72it/s][A
Epoch 5/5:  30%|██▉       | 656/2208 [03:58<09:28,  2.73it/s][A
Epoch 5/5:  30%|██▉       | 657/2208 [03:58<09:27,  2.73it/s][A
Epoch 5/5:  30%|██▉       | 658/2208 [03:59<09:17,  2.78it/s][A
Epoch 5/5:  30%|██▉       | 659/2208 [03:59<09:33,  2.70it/s][A
Epoch 5/5:  30%|██▉       | 660/2208 [03:59<09:25,  2.74it/s][A
Epoch 5/5:  30%|██▉       | 661/2208 [04:00<09:13,  2.79it/s][A
Epoch 5/5:  30%|██▉       | 662/2208 [04:00<09:21,  2.75it/s][A
Epoch 5/5:  30%|███       | 663/2208 [04:01<09:09,  2.81it/s][A
Epoch 5/5:  30%|███       | 664/2208 [04:01<09:08,  2.81it/s][A
Epoch 5/5:  30%|███       | 665/2208 [04:01<09:01,  2.85it/s][A
Epoch 5/5:  30%|███       | 666/2208 [04:02<09:10,  2.80it/s][A
Epoch 5/5:  30%|███     

Batch 675: Training accuracy = 0.8281, F1 = 0.8071, Precision = 0.8026, Recall = 0.8281



Epoch 5/5:  31%|███       | 677/2208 [04:06<09:25,  2.71it/s][A
Epoch 5/5:  31%|███       | 678/2208 [04:06<09:13,  2.76it/s][A
Epoch 5/5:  31%|███       | 679/2208 [04:06<09:15,  2.75it/s][A
Epoch 5/5:  31%|███       | 680/2208 [04:07<09:04,  2.80it/s][A
Epoch 5/5:  31%|███       | 681/2208 [04:07<08:59,  2.83it/s][A
Epoch 5/5:  31%|███       | 682/2208 [04:07<09:10,  2.77it/s][A
Epoch 5/5:  31%|███       | 683/2208 [04:08<09:16,  2.74it/s][A
Epoch 5/5:  31%|███       | 684/2208 [04:08<09:06,  2.79it/s][A
Epoch 5/5:  31%|███       | 685/2208 [04:08<09:17,  2.73it/s][A
Epoch 5/5:  31%|███       | 686/2208 [04:09<09:13,  2.75it/s][A
Epoch 5/5:  31%|███       | 687/2208 [04:09<09:05,  2.79it/s][A
Epoch 5/5:  31%|███       | 688/2208 [04:09<08:55,  2.84it/s][A
Epoch 5/5:  31%|███       | 689/2208 [04:10<08:50,  2.86it/s][A
Epoch 5/5:  31%|███▏      | 690/2208 [04:10<08:55,  2.84it/s][A
Epoch 5/5:  31%|███▏      | 691/2208 [04:11<08:50,  2.86it/s][A
Epoch 5/5:  31%|███▏    

Batch 700: Training accuracy = 0.8594, F1 = 0.8419, Precision = 0.8372, Recall = 0.8594



Epoch 5/5:  32%|███▏      | 702/2208 [04:14<08:49,  2.84it/s][A
Epoch 5/5:  32%|███▏      | 703/2208 [04:15<08:46,  2.86it/s][A
Epoch 5/5:  32%|███▏      | 704/2208 [04:15<09:02,  2.77it/s][A
Epoch 5/5:  32%|███▏      | 705/2208 [04:15<08:51,  2.83it/s][A
Epoch 5/5:  32%|███▏      | 706/2208 [04:16<08:58,  2.79it/s][A
Epoch 5/5:  32%|███▏      | 707/2208 [04:16<08:52,  2.82it/s][A
Epoch 5/5:  32%|███▏      | 708/2208 [04:17<09:01,  2.77it/s][A
Epoch 5/5:  32%|███▏      | 709/2208 [04:17<09:08,  2.73it/s][A
Epoch 5/5:  32%|███▏      | 710/2208 [04:17<09:19,  2.68it/s][A
Epoch 5/5:  32%|███▏      | 711/2208 [04:18<09:12,  2.71it/s][A
Epoch 5/5:  32%|███▏      | 712/2208 [04:18<09:00,  2.77it/s][A
Epoch 5/5:  32%|███▏      | 713/2208 [04:18<08:59,  2.77it/s][A
Epoch 5/5:  32%|███▏      | 714/2208 [04:19<09:05,  2.74it/s][A
Epoch 5/5:  32%|███▏      | 715/2208 [04:19<08:53,  2.80it/s][A
Epoch 5/5:  32%|███▏      | 716/2208 [04:20<09:03,  2.74it/s][A
Epoch 5/5:  32%|███▏    

Batch 725: Training accuracy = 0.8672, F1 = 0.8603, Precision = 0.8735, Recall = 0.8672



Epoch 5/5:  33%|███▎      | 727/2208 [04:23<08:35,  2.87it/s][A
Epoch 5/5:  33%|███▎      | 728/2208 [04:24<08:30,  2.90it/s][A
Epoch 5/5:  33%|███▎      | 729/2208 [04:24<08:30,  2.90it/s][A
Epoch 5/5:  33%|███▎      | 730/2208 [04:24<08:29,  2.90it/s][A
Epoch 5/5:  33%|███▎      | 731/2208 [04:25<08:29,  2.90it/s][A
Epoch 5/5:  33%|███▎      | 732/2208 [04:25<08:28,  2.90it/s][A
Epoch 5/5:  33%|███▎      | 733/2208 [04:25<08:33,  2.87it/s][A
Epoch 5/5:  33%|███▎      | 734/2208 [04:26<08:46,  2.80it/s][A
Epoch 5/5:  33%|███▎      | 735/2208 [04:26<08:52,  2.77it/s][A
Epoch 5/5:  33%|███▎      | 736/2208 [04:27<08:45,  2.80it/s][A
Epoch 5/5:  33%|███▎      | 737/2208 [04:27<08:54,  2.75it/s][A
Epoch 5/5:  33%|███▎      | 738/2208 [04:27<08:59,  2.72it/s][A
Epoch 5/5:  33%|███▎      | 739/2208 [04:28<09:05,  2.69it/s][A
Epoch 5/5:  34%|███▎      | 740/2208 [04:28<08:55,  2.74it/s][A
Epoch 5/5:  34%|███▎      | 741/2208 [04:28<08:47,  2.78it/s][A
Epoch 5/5:  34%|███▎    

Batch 750: Training accuracy = 0.7812, F1 = 0.7680, Precision = 0.7839, Recall = 0.7812



Epoch 5/5:  34%|███▍      | 752/2208 [04:32<08:49,  2.75it/s][A
Epoch 5/5:  34%|███▍      | 753/2208 [04:33<08:38,  2.80it/s][A
Epoch 5/5:  34%|███▍      | 754/2208 [04:33<08:41,  2.79it/s][A
Epoch 5/5:  34%|███▍      | 755/2208 [04:33<08:37,  2.81it/s][A
Epoch 5/5:  34%|███▍      | 756/2208 [04:34<08:36,  2.81it/s][A
Epoch 5/5:  34%|███▍      | 757/2208 [04:34<08:39,  2.79it/s][A
Epoch 5/5:  34%|███▍      | 758/2208 [04:34<08:33,  2.82it/s][A
Epoch 5/5:  34%|███▍      | 759/2208 [04:35<08:50,  2.73it/s][A
Epoch 5/5:  34%|███▍      | 760/2208 [04:35<08:40,  2.78it/s][A
Epoch 5/5:  34%|███▍      | 761/2208 [04:36<08:48,  2.74it/s][A
Epoch 5/5:  35%|███▍      | 762/2208 [04:36<08:57,  2.69it/s][A
Epoch 5/5:  35%|███▍      | 763/2208 [04:36<09:12,  2.62it/s][A
Epoch 5/5:  35%|███▍      | 764/2208 [04:37<08:55,  2.70it/s][A
Epoch 5/5:  35%|███▍      | 765/2208 [04:37<08:52,  2.71it/s][A
Epoch 5/5:  35%|███▍      | 766/2208 [04:37<08:45,  2.75it/s][A
Epoch 5/5:  35%|███▍    

Batch 775: Training accuracy = 0.8594, F1 = 0.8484, Precision = 0.8464, Recall = 0.8594



Epoch 5/5:  35%|███▌      | 777/2208 [04:41<08:26,  2.82it/s][A
Epoch 5/5:  35%|███▌      | 778/2208 [04:42<08:26,  2.82it/s][A
Epoch 5/5:  35%|███▌      | 779/2208 [04:42<08:21,  2.85it/s][A
Epoch 5/5:  35%|███▌      | 780/2208 [04:42<08:18,  2.87it/s][A
Epoch 5/5:  35%|███▌      | 781/2208 [04:43<08:30,  2.80it/s][A
Epoch 5/5:  35%|███▌      | 782/2208 [04:43<08:27,  2.81it/s][A
Epoch 5/5:  35%|███▌      | 783/2208 [04:44<08:47,  2.70it/s][A
Epoch 5/5:  36%|███▌      | 784/2208 [04:44<08:34,  2.77it/s][A
Epoch 5/5:  36%|███▌      | 785/2208 [04:44<08:27,  2.80it/s][A
Epoch 5/5:  36%|███▌      | 786/2208 [04:45<08:23,  2.82it/s][A
Epoch 5/5:  36%|███▌      | 787/2208 [04:45<08:17,  2.86it/s][A
Epoch 5/5:  36%|███▌      | 788/2208 [04:45<08:35,  2.75it/s][A
Epoch 5/5:  36%|███▌      | 789/2208 [04:46<08:25,  2.81it/s][A
Epoch 5/5:  36%|███▌      | 790/2208 [04:46<08:26,  2.80it/s][A
Epoch 5/5:  36%|███▌      | 791/2208 [04:46<08:36,  2.74it/s][A
Epoch 5/5:  36%|███▌    

Batch 800: Training accuracy = 0.9062, F1 = 0.8946, Precision = 0.8924, Recall = 0.9062



Epoch 5/5:  36%|███▋      | 802/2208 [04:50<08:32,  2.74it/s][A
Epoch 5/5:  36%|███▋      | 803/2208 [04:51<08:40,  2.70it/s][A
Epoch 5/5:  36%|███▋      | 804/2208 [04:51<08:38,  2.71it/s][A
Epoch 5/5:  36%|███▋      | 805/2208 [04:52<08:37,  2.71it/s][A
Epoch 5/5:  37%|███▋      | 806/2208 [04:52<08:34,  2.72it/s][A
Epoch 5/5:  37%|███▋      | 807/2208 [04:52<08:23,  2.78it/s][A
Epoch 5/5:  37%|███▋      | 808/2208 [04:53<08:16,  2.82it/s][A
Epoch 5/5:  37%|███▋      | 809/2208 [04:53<08:26,  2.76it/s][A
Epoch 5/5:  37%|███▋      | 810/2208 [04:53<08:29,  2.74it/s][A
Epoch 5/5:  37%|███▋      | 811/2208 [04:54<08:48,  2.64it/s][A
Epoch 5/5:  37%|███▋      | 812/2208 [04:54<08:48,  2.64it/s][A
Epoch 5/5:  37%|███▋      | 813/2208 [04:55<08:42,  2.67it/s][A
Epoch 5/5:  37%|███▋      | 814/2208 [04:55<08:36,  2.70it/s][A
Epoch 5/5:  37%|███▋      | 815/2208 [04:55<08:24,  2.76it/s][A
Epoch 5/5:  37%|███▋      | 816/2208 [04:56<08:22,  2.77it/s][A
Epoch 5/5:  37%|███▋    

Batch 825: Training accuracy = 0.8906, F1 = 0.8875, Precision = 0.9010, Recall = 0.8906



Epoch 5/5:  37%|███▋      | 827/2208 [05:00<08:07,  2.83it/s][A
Epoch 5/5:  38%|███▊      | 828/2208 [05:00<08:05,  2.84it/s][A
Epoch 5/5:  38%|███▊      | 829/2208 [05:00<08:11,  2.81it/s][A
Epoch 5/5:  38%|███▊      | 830/2208 [05:01<08:04,  2.84it/s][A
Epoch 5/5:  38%|███▊      | 831/2208 [05:01<08:16,  2.77it/s][A
Epoch 5/5:  38%|███▊      | 832/2208 [05:01<08:17,  2.77it/s][A
Epoch 5/5:  38%|███▊      | 833/2208 [05:02<08:09,  2.81it/s][A
Epoch 5/5:  38%|███▊      | 834/2208 [05:02<08:17,  2.76it/s][A
Epoch 5/5:  38%|███▊      | 835/2208 [05:02<08:10,  2.80it/s][A
Epoch 5/5:  38%|███▊      | 836/2208 [05:03<08:16,  2.76it/s][A
Epoch 5/5:  38%|███▊      | 837/2208 [05:03<08:21,  2.74it/s][A
Epoch 5/5:  38%|███▊      | 838/2208 [05:04<08:29,  2.69it/s][A
Epoch 5/5:  38%|███▊      | 839/2208 [05:04<08:35,  2.66it/s][A
Epoch 5/5:  38%|███▊      | 840/2208 [05:04<08:34,  2.66it/s][A
Epoch 5/5:  38%|███▊      | 841/2208 [05:05<08:22,  2.72it/s][A
Epoch 5/5:  38%|███▊    

Batch 850: Training accuracy = 0.8359, F1 = 0.8359, Precision = 0.8503, Recall = 0.8359



Epoch 5/5:  39%|███▊      | 852/2208 [05:09<08:07,  2.78it/s][A
Epoch 5/5:  39%|███▊      | 853/2208 [05:09<08:09,  2.77it/s][A
Epoch 5/5:  39%|███▊      | 854/2208 [05:09<08:11,  2.76it/s][A
Epoch 5/5:  39%|███▊      | 855/2208 [05:10<08:16,  2.73it/s][A
Epoch 5/5:  39%|███▉      | 856/2208 [05:10<08:04,  2.79it/s][A
Epoch 5/5:  39%|███▉      | 857/2208 [05:10<07:58,  2.82it/s][A
Epoch 5/5:  39%|███▉      | 858/2208 [05:11<07:54,  2.85it/s][A
Epoch 5/5:  39%|███▉      | 859/2208 [05:11<07:49,  2.87it/s][A
Epoch 5/5:  39%|███▉      | 860/2208 [05:11<07:53,  2.85it/s][A
Epoch 5/5:  39%|███▉      | 861/2208 [05:12<07:49,  2.87it/s][A
Epoch 5/5:  39%|███▉      | 862/2208 [05:12<07:55,  2.83it/s][A
Epoch 5/5:  39%|███▉      | 863/2208 [05:12<07:50,  2.86it/s][A
Epoch 5/5:  39%|███▉      | 864/2208 [05:13<07:51,  2.85it/s][A
Epoch 5/5:  39%|███▉      | 865/2208 [05:13<07:55,  2.83it/s][A
Epoch 5/5:  39%|███▉      | 866/2208 [05:14<08:08,  2.75it/s][A
Epoch 5/5:  39%|███▉    

Batch 875: Training accuracy = 0.8594, F1 = 0.8456, Precision = 0.8464, Recall = 0.8594



Epoch 5/5:  40%|███▉      | 877/2208 [05:18<07:54,  2.80it/s][A
Epoch 5/5:  40%|███▉      | 878/2208 [05:18<07:54,  2.80it/s][A
Epoch 5/5:  40%|███▉      | 879/2208 [05:18<07:54,  2.80it/s][A
Epoch 5/5:  40%|███▉      | 880/2208 [05:19<08:00,  2.77it/s][A
Epoch 5/5:  40%|███▉      | 881/2208 [05:19<08:07,  2.72it/s][A
Epoch 5/5:  40%|███▉      | 882/2208 [05:19<08:12,  2.69it/s][A
Epoch 5/5:  40%|███▉      | 883/2208 [05:20<08:00,  2.76it/s][A
Epoch 5/5:  40%|████      | 884/2208 [05:20<07:59,  2.76it/s][A
Epoch 5/5:  40%|████      | 885/2208 [05:20<07:50,  2.81it/s][A
Epoch 5/5:  40%|████      | 886/2208 [05:21<07:52,  2.80it/s][A
Epoch 5/5:  40%|████      | 887/2208 [05:21<07:49,  2.82it/s][A
Epoch 5/5:  40%|████      | 888/2208 [05:22<07:42,  2.85it/s][A
Epoch 5/5:  40%|████      | 889/2208 [05:22<07:37,  2.88it/s][A
Epoch 5/5:  40%|████      | 890/2208 [05:22<07:35,  2.89it/s][A
Epoch 5/5:  40%|████      | 891/2208 [05:23<07:36,  2.88it/s][A
Epoch 5/5:  40%|████    

Batch 900: Training accuracy = 0.8594, F1 = 0.8667, Precision = 0.8854, Recall = 0.8594



Epoch 5/5:  41%|████      | 902/2208 [05:26<07:44,  2.81it/s][A
Epoch 5/5:  41%|████      | 903/2208 [05:27<07:37,  2.85it/s][A
Epoch 5/5:  41%|████      | 904/2208 [05:27<07:40,  2.83it/s][A
Epoch 5/5:  41%|████      | 905/2208 [05:28<07:42,  2.82it/s][A
Epoch 5/5:  41%|████      | 906/2208 [05:28<07:42,  2.82it/s][A
Epoch 5/5:  41%|████      | 907/2208 [05:28<07:46,  2.79it/s][A
Epoch 5/5:  41%|████      | 908/2208 [05:29<07:48,  2.78it/s][A
Epoch 5/5:  41%|████      | 909/2208 [05:29<07:55,  2.73it/s][A
Epoch 5/5:  41%|████      | 910/2208 [05:29<08:04,  2.68it/s][A
Epoch 5/5:  41%|████▏     | 911/2208 [05:30<08:05,  2.67it/s][A
Epoch 5/5:  41%|████▏     | 912/2208 [05:30<08:05,  2.67it/s][A
Epoch 5/5:  41%|████▏     | 913/2208 [05:30<07:53,  2.74it/s][A
Epoch 5/5:  41%|████▏     | 914/2208 [05:31<07:46,  2.78it/s][A
Epoch 5/5:  41%|████▏     | 915/2208 [05:31<07:40,  2.81it/s][A
Epoch 5/5:  41%|████▏     | 916/2208 [05:32<07:43,  2.79it/s][A
Epoch 5/5:  42%|████▏   

Batch 925: Training accuracy = 0.8906, F1 = 0.8854, Precision = 0.8906, Recall = 0.8906



Epoch 5/5:  42%|████▏     | 927/2208 [05:35<07:43,  2.77it/s][A
Epoch 5/5:  42%|████▏     | 928/2208 [05:36<07:36,  2.80it/s][A
Epoch 5/5:  42%|████▏     | 929/2208 [05:36<07:34,  2.81it/s][A
Epoch 5/5:  42%|████▏     | 930/2208 [05:37<07:29,  2.84it/s][A
Epoch 5/5:  42%|████▏     | 931/2208 [05:37<07:28,  2.85it/s][A
Epoch 5/5:  42%|████▏     | 932/2208 [05:37<07:22,  2.88it/s][A
Epoch 5/5:  42%|████▏     | 933/2208 [05:38<07:25,  2.86it/s][A
Epoch 5/5:  42%|████▏     | 934/2208 [05:38<07:33,  2.81it/s][A
Epoch 5/5:  42%|████▏     | 935/2208 [05:38<07:46,  2.73it/s][A
Epoch 5/5:  42%|████▏     | 936/2208 [05:39<07:43,  2.75it/s][A
Epoch 5/5:  42%|████▏     | 937/2208 [05:39<07:36,  2.78it/s][A
Epoch 5/5:  42%|████▏     | 938/2208 [05:39<07:39,  2.76it/s][A
Epoch 5/5:  43%|████▎     | 939/2208 [05:40<07:34,  2.79it/s][A
Epoch 5/5:  43%|████▎     | 940/2208 [05:40<07:29,  2.82it/s][A
Epoch 5/5:  43%|████▎     | 941/2208 [05:40<07:34,  2.79it/s][A
Epoch 5/5:  43%|████▎   

Batch 950: Training accuracy = 0.8438, F1 = 0.8349, Precision = 0.8451, Recall = 0.8438



Epoch 5/5:  43%|████▎     | 952/2208 [05:44<07:28,  2.80it/s][A
Epoch 5/5:  43%|████▎     | 953/2208 [05:45<07:31,  2.78it/s][A
Epoch 5/5:  43%|████▎     | 954/2208 [05:45<07:25,  2.81it/s][A
Epoch 5/5:  43%|████▎     | 955/2208 [05:46<07:24,  2.82it/s][A
Epoch 5/5:  43%|████▎     | 956/2208 [05:46<07:23,  2.82it/s][A
Epoch 5/5:  43%|████▎     | 957/2208 [05:46<07:34,  2.75it/s][A
Epoch 5/5:  43%|████▎     | 958/2208 [05:47<07:35,  2.74it/s][A
Epoch 5/5:  43%|████▎     | 959/2208 [05:47<07:46,  2.68it/s][A
Epoch 5/5:  43%|████▎     | 960/2208 [05:47<07:54,  2.63it/s][A
Epoch 5/5:  44%|████▎     | 961/2208 [05:48<07:51,  2.65it/s][A
Epoch 5/5:  44%|████▎     | 962/2208 [05:48<07:36,  2.73it/s][A
Epoch 5/5:  44%|████▎     | 963/2208 [05:49<07:46,  2.67it/s][A
Epoch 5/5:  44%|████▎     | 964/2208 [05:49<07:43,  2.69it/s][A
Epoch 5/5:  44%|████▎     | 965/2208 [05:49<07:42,  2.69it/s][A
Epoch 5/5:  44%|████▍     | 966/2208 [05:50<07:41,  2.69it/s][A
Epoch 5/5:  44%|████▍   

Batch 975: Training accuracy = 0.8750, F1 = 0.8667, Precision = 0.8753, Recall = 0.8750



Epoch 5/5:  44%|████▍     | 977/2208 [05:54<07:18,  2.81it/s][A
Epoch 5/5:  44%|████▍     | 978/2208 [05:54<07:21,  2.79it/s][A
Epoch 5/5:  44%|████▍     | 979/2208 [05:54<07:15,  2.82it/s][A
Epoch 5/5:  44%|████▍     | 980/2208 [05:55<07:23,  2.77it/s][A
Epoch 5/5:  44%|████▍     | 981/2208 [05:55<07:15,  2.81it/s][A
Epoch 5/5:  44%|████▍     | 982/2208 [05:55<07:22,  2.77it/s][A
Epoch 5/5:  45%|████▍     | 983/2208 [05:56<07:18,  2.79it/s][A
Epoch 5/5:  45%|████▍     | 984/2208 [05:56<07:26,  2.74it/s][A
Epoch 5/5:  45%|████▍     | 985/2208 [05:56<07:34,  2.69it/s][A
Epoch 5/5:  45%|████▍     | 986/2208 [05:57<07:43,  2.64it/s][A
Epoch 5/5:  45%|████▍     | 987/2208 [05:57<07:38,  2.66it/s][A
Epoch 5/5:  45%|████▍     | 988/2208 [05:58<07:26,  2.73it/s][A
Epoch 5/5:  45%|████▍     | 989/2208 [05:58<07:19,  2.78it/s][A
Epoch 5/5:  45%|████▍     | 990/2208 [05:58<07:16,  2.79it/s][A
Epoch 5/5:  45%|████▍     | 991/2208 [05:59<07:09,  2.84it/s][A
Epoch 5/5:  45%|████▍   

Batch 1000: Training accuracy = 0.8750, F1 = 0.8591, Precision = 0.8659, Recall = 0.8750



Epoch 5/5:  45%|████▌     | 1002/2208 [06:03<07:25,  2.70it/s][A
Epoch 5/5:  45%|████▌     | 1003/2208 [06:03<07:14,  2.77it/s][A
Epoch 5/5:  45%|████▌     | 1004/2208 [06:03<07:10,  2.80it/s][A
Epoch 5/5:  46%|████▌     | 1005/2208 [06:04<07:16,  2.76it/s][A
Epoch 5/5:  46%|████▌     | 1006/2208 [06:04<07:11,  2.79it/s][A
Epoch 5/5:  46%|████▌     | 1007/2208 [06:04<07:07,  2.81it/s][A
Epoch 5/5:  46%|████▌     | 1008/2208 [06:05<07:07,  2.81it/s][A
Epoch 5/5:  46%|████▌     | 1009/2208 [06:05<07:14,  2.76it/s][A
Epoch 5/5:  46%|████▌     | 1010/2208 [06:06<07:10,  2.78it/s][A
Epoch 5/5:  46%|████▌     | 1011/2208 [06:06<07:16,  2.74it/s][A
Epoch 5/5:  46%|████▌     | 1012/2208 [06:06<07:11,  2.77it/s][A
Epoch 5/5:  46%|████▌     | 1013/2208 [06:07<07:09,  2.78it/s][A
Epoch 5/5:  46%|████▌     | 1014/2208 [06:07<07:07,  2.79it/s][A
Epoch 5/5:  46%|████▌     | 1015/2208 [06:07<07:04,  2.81it/s][A
Epoch 5/5:  46%|████▌     | 1016/2208 [06:08<07:00,  2.84it/s][A
Epoch 5/5

Batch 1025: Training accuracy = 0.8750, F1 = 0.8732, Precision = 0.8841, Recall = 0.8750



Epoch 5/5:  47%|████▋     | 1027/2208 [06:12<07:00,  2.81it/s][A
Epoch 5/5:  47%|████▋     | 1028/2208 [06:12<07:00,  2.81it/s][A
Epoch 5/5:  47%|████▋     | 1029/2208 [06:12<07:06,  2.77it/s][A
Epoch 5/5:  47%|████▋     | 1030/2208 [06:13<07:05,  2.77it/s][A
Epoch 5/5:  47%|████▋     | 1031/2208 [06:13<07:07,  2.75it/s][A
Epoch 5/5:  47%|████▋     | 1032/2208 [06:13<06:59,  2.80it/s][A
Epoch 5/5:  47%|████▋     | 1033/2208 [06:14<06:53,  2.84it/s][A
Epoch 5/5:  47%|████▋     | 1034/2208 [06:14<07:00,  2.79it/s][A
Epoch 5/5:  47%|████▋     | 1035/2208 [06:14<06:56,  2.82it/s][A
Epoch 5/5:  47%|████▋     | 1036/2208 [06:15<07:07,  2.74it/s][A
Epoch 5/5:  47%|████▋     | 1037/2208 [06:15<07:01,  2.78it/s][A
Epoch 5/5:  47%|████▋     | 1038/2208 [06:16<07:05,  2.75it/s][A
Epoch 5/5:  47%|████▋     | 1039/2208 [06:16<07:06,  2.74it/s][A
Epoch 5/5:  47%|████▋     | 1040/2208 [06:16<07:04,  2.75it/s][A
Epoch 5/5:  47%|████▋     | 1041/2208 [06:17<07:09,  2.72it/s][A
Epoch 5/5

Batch 1050: Training accuracy = 0.8594, F1 = 0.8472, Precision = 0.8457, Recall = 0.8594



Epoch 5/5:  48%|████▊     | 1052/2208 [06:21<07:02,  2.74it/s][A
Epoch 5/5:  48%|████▊     | 1053/2208 [06:21<06:57,  2.76it/s][A
Epoch 5/5:  48%|████▊     | 1054/2208 [06:21<07:01,  2.73it/s][A
Epoch 5/5:  48%|████▊     | 1055/2208 [06:22<06:59,  2.75it/s][A
Epoch 5/5:  48%|████▊     | 1056/2208 [06:22<07:03,  2.72it/s][A
Epoch 5/5:  48%|████▊     | 1057/2208 [06:22<07:03,  2.72it/s][A
Epoch 5/5:  48%|████▊     | 1058/2208 [06:23<06:55,  2.77it/s][A
Epoch 5/5:  48%|████▊     | 1059/2208 [06:23<06:50,  2.80it/s][A
Epoch 5/5:  48%|████▊     | 1060/2208 [06:23<06:44,  2.84it/s][A
Epoch 5/5:  48%|████▊     | 1061/2208 [06:24<06:40,  2.86it/s][A
Epoch 5/5:  48%|████▊     | 1062/2208 [06:24<06:46,  2.82it/s][A
Epoch 5/5:  48%|████▊     | 1063/2208 [06:25<06:51,  2.78it/s][A
Epoch 5/5:  48%|████▊     | 1064/2208 [06:25<06:45,  2.82it/s][A
Epoch 5/5:  48%|████▊     | 1065/2208 [06:25<06:39,  2.86it/s][A
Epoch 5/5:  48%|████▊     | 1066/2208 [06:26<06:40,  2.85it/s][A
Epoch 5/5

Batch 1075: Training accuracy = 0.8828, F1 = 0.8750, Precision = 0.8789, Recall = 0.8828



Epoch 5/5:  49%|████▉     | 1077/2208 [06:29<06:50,  2.75it/s][A
Epoch 5/5:  49%|████▉     | 1078/2208 [06:30<07:09,  2.63it/s][A
Epoch 5/5:  49%|████▉     | 1079/2208 [06:30<07:05,  2.65it/s][A
Epoch 5/5:  49%|████▉     | 1080/2208 [06:31<06:57,  2.70it/s][A
Epoch 5/5:  49%|████▉     | 1081/2208 [06:31<06:49,  2.76it/s][A
Epoch 5/5:  49%|████▉     | 1082/2208 [06:31<06:43,  2.79it/s][A
Epoch 5/5:  49%|████▉     | 1083/2208 [06:32<06:41,  2.80it/s][A
Epoch 5/5:  49%|████▉     | 1084/2208 [06:32<06:36,  2.83it/s][A
Epoch 5/5:  49%|████▉     | 1085/2208 [06:32<06:45,  2.77it/s][A
Epoch 5/5:  49%|████▉     | 1086/2208 [06:33<06:45,  2.76it/s][A
Epoch 5/5:  49%|████▉     | 1087/2208 [06:33<06:42,  2.79it/s][A
Epoch 5/5:  49%|████▉     | 1088/2208 [06:33<06:44,  2.77it/s][A
Epoch 5/5:  49%|████▉     | 1089/2208 [06:34<06:50,  2.72it/s][A
Epoch 5/5:  49%|████▉     | 1090/2208 [06:34<06:42,  2.78it/s][A
Epoch 5/5:  49%|████▉     | 1091/2208 [06:35<06:40,  2.79it/s][A
Epoch 5/5

Batch 1100: Training accuracy = 0.8984, F1 = 0.8906, Precision = 0.8997, Recall = 0.8984



Epoch 5/5:  50%|████▉     | 1102/2208 [06:39<06:40,  2.76it/s][A
Epoch 5/5:  50%|████▉     | 1103/2208 [06:39<06:36,  2.79it/s][A
Epoch 5/5:  50%|█████     | 1104/2208 [06:39<06:32,  2.81it/s][A
Epoch 5/5:  50%|█████     | 1105/2208 [06:40<06:30,  2.82it/s][A
Epoch 5/5:  50%|█████     | 1106/2208 [06:40<06:37,  2.77it/s][A
Epoch 5/5:  50%|█████     | 1107/2208 [06:40<06:29,  2.83it/s][A
Epoch 5/5:  50%|█████     | 1108/2208 [06:41<06:31,  2.81it/s][A
Epoch 5/5:  50%|█████     | 1109/2208 [06:41<06:37,  2.76it/s][A
Epoch 5/5:  50%|█████     | 1110/2208 [06:41<06:37,  2.76it/s][A
Epoch 5/5:  50%|█████     | 1111/2208 [06:42<06:33,  2.79it/s][A
Epoch 5/5:  50%|█████     | 1112/2208 [06:42<06:26,  2.84it/s][A
Epoch 5/5:  50%|█████     | 1113/2208 [06:42<06:21,  2.87it/s][A
Epoch 5/5:  50%|█████     | 1114/2208 [06:43<06:17,  2.90it/s][A
Epoch 5/5:  50%|█████     | 1115/2208 [06:43<06:24,  2.84it/s][A
Epoch 5/5:  51%|█████     | 1116/2208 [06:44<06:23,  2.85it/s][A
Epoch 5/5

Batch 1125: Training accuracy = 0.8906, F1 = 0.8953, Precision = 0.9128, Recall = 0.8906



Epoch 5/5:  51%|█████     | 1127/2208 [06:48<06:35,  2.73it/s][A
Epoch 5/5:  51%|█████     | 1128/2208 [06:48<06:27,  2.79it/s][A
Epoch 5/5:  51%|█████     | 1129/2208 [06:48<06:23,  2.81it/s][A
Epoch 5/5:  51%|█████     | 1130/2208 [06:49<06:18,  2.85it/s][A
Epoch 5/5:  51%|█████     | 1131/2208 [06:49<06:13,  2.88it/s][A
Epoch 5/5:  51%|█████▏    | 1132/2208 [06:49<06:15,  2.86it/s][A
Epoch 5/5:  51%|█████▏    | 1133/2208 [06:50<06:18,  2.84it/s][A
Epoch 5/5:  51%|█████▏    | 1134/2208 [06:50<06:29,  2.76it/s][A
Epoch 5/5:  51%|█████▏    | 1135/2208 [06:50<06:22,  2.81it/s][A
Epoch 5/5:  51%|█████▏    | 1136/2208 [06:51<06:16,  2.85it/s][A
Epoch 5/5:  51%|█████▏    | 1137/2208 [06:51<06:11,  2.88it/s][A
Epoch 5/5:  52%|█████▏    | 1138/2208 [06:51<06:19,  2.82it/s][A
Epoch 5/5:  52%|█████▏    | 1139/2208 [06:52<06:17,  2.83it/s][A
Epoch 5/5:  52%|█████▏    | 1140/2208 [06:52<06:12,  2.86it/s][A
Epoch 5/5:  52%|█████▏    | 1141/2208 [06:53<06:19,  2.81it/s][A
Epoch 5/5

Batch 1150: Training accuracy = 0.8750, F1 = 0.8711, Precision = 0.8802, Recall = 0.8750



Epoch 5/5:  52%|█████▏    | 1152/2208 [06:57<06:30,  2.70it/s][A
Epoch 5/5:  52%|█████▏    | 1153/2208 [06:57<06:26,  2.73it/s][A
Epoch 5/5:  52%|█████▏    | 1154/2208 [06:57<06:34,  2.67it/s][A
Epoch 5/5:  52%|█████▏    | 1155/2208 [06:58<06:25,  2.73it/s][A
Epoch 5/5:  52%|█████▏    | 1156/2208 [06:58<06:24,  2.74it/s][A
Epoch 5/5:  52%|█████▏    | 1157/2208 [06:58<06:26,  2.72it/s][A
Epoch 5/5:  52%|█████▏    | 1158/2208 [06:59<06:22,  2.74it/s][A
Epoch 5/5:  52%|█████▏    | 1159/2208 [06:59<06:21,  2.75it/s][A
Epoch 5/5:  53%|█████▎    | 1160/2208 [06:59<06:16,  2.78it/s][A
Epoch 5/5:  53%|█████▎    | 1161/2208 [07:00<06:18,  2.77it/s][A
Epoch 5/5:  53%|█████▎    | 1162/2208 [07:00<06:17,  2.77it/s][A
Epoch 5/5:  53%|█████▎    | 1163/2208 [07:01<06:21,  2.74it/s][A
Epoch 5/5:  53%|█████▎    | 1164/2208 [07:01<06:37,  2.63it/s][A
Epoch 5/5:  53%|█████▎    | 1165/2208 [07:01<06:35,  2.64it/s][A
Epoch 5/5:  53%|█████▎    | 1166/2208 [07:02<06:23,  2.72it/s][A
Epoch 5/5

Batch 1175: Training accuracy = 0.8906, F1 = 0.8901, Precision = 0.8971, Recall = 0.8906



Epoch 5/5:  53%|█████▎    | 1177/2208 [07:06<06:10,  2.78it/s][A
Epoch 5/5:  53%|█████▎    | 1178/2208 [07:06<06:04,  2.83it/s][A
Epoch 5/5:  53%|█████▎    | 1179/2208 [07:06<06:08,  2.79it/s][A
Epoch 5/5:  53%|█████▎    | 1180/2208 [07:07<06:02,  2.83it/s][A
Epoch 5/5:  53%|█████▎    | 1181/2208 [07:07<05:59,  2.85it/s][A
Epoch 5/5:  54%|█████▎    | 1182/2208 [07:07<05:57,  2.87it/s][A
Epoch 5/5:  54%|█████▎    | 1183/2208 [07:08<06:04,  2.81it/s][A
Epoch 5/5:  54%|█████▎    | 1184/2208 [07:08<06:05,  2.80it/s][A
Epoch 5/5:  54%|█████▎    | 1185/2208 [07:08<05:59,  2.84it/s][A
Epoch 5/5:  54%|█████▎    | 1186/2208 [07:09<06:02,  2.82it/s][A
Epoch 5/5:  54%|█████▍    | 1187/2208 [07:09<06:06,  2.79it/s][A
Epoch 5/5:  54%|█████▍    | 1188/2208 [07:10<06:01,  2.82it/s][A
Epoch 5/5:  54%|█████▍    | 1189/2208 [07:10<06:12,  2.74it/s][A
Epoch 5/5:  54%|█████▍    | 1190/2208 [07:10<06:11,  2.74it/s][A
Epoch 5/5:  54%|█████▍    | 1191/2208 [07:11<06:15,  2.71it/s][A
Epoch 5/5

Batch 1200: Training accuracy = 0.8047, F1 = 0.7969, Precision = 0.8008, Recall = 0.8047



Epoch 5/5:  54%|█████▍    | 1202/2208 [07:15<06:08,  2.73it/s][A
Epoch 5/5:  54%|█████▍    | 1203/2208 [07:15<06:09,  2.72it/s][A
Epoch 5/5:  55%|█████▍    | 1204/2208 [07:15<06:01,  2.78it/s][A
Epoch 5/5:  55%|█████▍    | 1205/2208 [07:16<06:02,  2.77it/s][A
Epoch 5/5:  55%|█████▍    | 1206/2208 [07:16<05:58,  2.80it/s][A
Epoch 5/5:  55%|█████▍    | 1207/2208 [07:16<05:55,  2.82it/s][A
Epoch 5/5:  55%|█████▍    | 1208/2208 [07:17<06:00,  2.77it/s][A
Epoch 5/5:  55%|█████▍    | 1209/2208 [07:17<06:06,  2.72it/s][A
Epoch 5/5:  55%|█████▍    | 1210/2208 [07:18<06:02,  2.76it/s][A
Epoch 5/5:  55%|█████▍    | 1211/2208 [07:18<05:54,  2.81it/s][A
Epoch 5/5:  55%|█████▍    | 1212/2208 [07:18<05:51,  2.83it/s][A
Epoch 5/5:  55%|█████▍    | 1213/2208 [07:19<05:53,  2.82it/s][A
Epoch 5/5:  55%|█████▍    | 1214/2208 [07:19<05:47,  2.86it/s][A
Epoch 5/5:  55%|█████▌    | 1215/2208 [07:19<05:49,  2.84it/s][A
Epoch 5/5:  55%|█████▌    | 1216/2208 [07:20<05:45,  2.87it/s][A
Epoch 5/5

Batch 1225: Training accuracy = 0.9062, F1 = 0.8979, Precision = 0.8971, Recall = 0.9062



Epoch 5/5:  56%|█████▌    | 1227/2208 [07:24<06:03,  2.70it/s][A
Epoch 5/5:  56%|█████▌    | 1228/2208 [07:24<05:54,  2.77it/s][A
Epoch 5/5:  56%|█████▌    | 1229/2208 [07:24<05:50,  2.80it/s][A
Epoch 5/5:  56%|█████▌    | 1230/2208 [07:25<05:43,  2.84it/s][A
Epoch 5/5:  56%|█████▌    | 1231/2208 [07:25<05:50,  2.78it/s][A
Epoch 5/5:  56%|█████▌    | 1232/2208 [07:25<05:47,  2.81it/s][A
Epoch 5/5:  56%|█████▌    | 1233/2208 [07:26<05:43,  2.84it/s][A
Epoch 5/5:  56%|█████▌    | 1234/2208 [07:26<05:46,  2.81it/s][A
Epoch 5/5:  56%|█████▌    | 1235/2208 [07:26<05:41,  2.85it/s][A
Epoch 5/5:  56%|█████▌    | 1236/2208 [07:27<05:42,  2.84it/s][A
Epoch 5/5:  56%|█████▌    | 1237/2208 [07:27<05:40,  2.85it/s][A
Epoch 5/5:  56%|█████▌    | 1238/2208 [07:27<05:38,  2.86it/s][A
Epoch 5/5:  56%|█████▌    | 1239/2208 [07:28<05:42,  2.83it/s][A
Epoch 5/5:  56%|█████▌    | 1240/2208 [07:28<05:44,  2.81it/s][A
Epoch 5/5:  56%|█████▌    | 1241/2208 [07:29<05:47,  2.78it/s][A
Epoch 5/5

Batch 1250: Training accuracy = 0.8984, F1 = 0.8849, Precision = 0.8815, Recall = 0.8984



Epoch 5/5:  57%|█████▋    | 1252/2208 [07:33<05:44,  2.77it/s][A
Epoch 5/5:  57%|█████▋    | 1253/2208 [07:33<05:38,  2.82it/s][A
Epoch 5/5:  57%|█████▋    | 1254/2208 [07:33<05:38,  2.82it/s][A
Epoch 5/5:  57%|█████▋    | 1255/2208 [07:34<05:46,  2.75it/s][A
Epoch 5/5:  57%|█████▋    | 1256/2208 [07:34<05:49,  2.73it/s][A
Epoch 5/5:  57%|█████▋    | 1257/2208 [07:34<05:46,  2.74it/s][A
Epoch 5/5:  57%|█████▋    | 1258/2208 [07:35<05:41,  2.78it/s][A
Epoch 5/5:  57%|█████▋    | 1259/2208 [07:35<05:46,  2.74it/s][A
Epoch 5/5:  57%|█████▋    | 1260/2208 [07:35<05:42,  2.76it/s][A
Epoch 5/5:  57%|█████▋    | 1261/2208 [07:36<05:36,  2.81it/s][A
Epoch 5/5:  57%|█████▋    | 1262/2208 [07:36<05:39,  2.79it/s][A
Epoch 5/5:  57%|█████▋    | 1263/2208 [07:37<05:39,  2.79it/s][A
Epoch 5/5:  57%|█████▋    | 1264/2208 [07:37<05:41,  2.76it/s][A
Epoch 5/5:  57%|█████▋    | 1265/2208 [07:37<05:44,  2.74it/s][A
Epoch 5/5:  57%|█████▋    | 1266/2208 [07:38<05:47,  2.71it/s][A
Epoch 5/5

Batch 1275: Training accuracy = 0.8906, F1 = 0.8828, Precision = 0.8867, Recall = 0.8906



Epoch 5/5:  58%|█████▊    | 1277/2208 [07:42<05:33,  2.79it/s][A
Epoch 5/5:  58%|█████▊    | 1278/2208 [07:42<05:30,  2.81it/s][A
Epoch 5/5:  58%|█████▊    | 1279/2208 [07:42<05:26,  2.84it/s][A
Epoch 5/5:  58%|█████▊    | 1280/2208 [07:43<05:37,  2.75it/s][A
Epoch 5/5:  58%|█████▊    | 1281/2208 [07:43<05:36,  2.75it/s][A
Epoch 5/5:  58%|█████▊    | 1282/2208 [07:43<05:42,  2.71it/s][A
Epoch 5/5:  58%|█████▊    | 1283/2208 [07:44<05:40,  2.71it/s][A
Epoch 5/5:  58%|█████▊    | 1284/2208 [07:44<05:46,  2.66it/s][A
Epoch 5/5:  58%|█████▊    | 1285/2208 [07:45<05:49,  2.64it/s][A
Epoch 5/5:  58%|█████▊    | 1286/2208 [07:45<05:50,  2.63it/s][A
Epoch 5/5:  58%|█████▊    | 1287/2208 [07:45<05:38,  2.72it/s][A
Epoch 5/5:  58%|█████▊    | 1288/2208 [07:46<05:40,  2.70it/s][A
Epoch 5/5:  58%|█████▊    | 1289/2208 [07:46<05:38,  2.71it/s][A
Epoch 5/5:  58%|█████▊    | 1290/2208 [07:46<05:33,  2.76it/s][A
Epoch 5/5:  58%|█████▊    | 1291/2208 [07:47<05:31,  2.77it/s][A
Epoch 5/5

Batch 1300: Training accuracy = 0.8438, F1 = 0.8333, Precision = 0.8411, Recall = 0.8438



Epoch 5/5:  59%|█████▉    | 1302/2208 [07:51<05:23,  2.80it/s][A
Epoch 5/5:  59%|█████▉    | 1303/2208 [07:51<05:18,  2.84it/s][A
Epoch 5/5:  59%|█████▉    | 1304/2208 [07:51<05:13,  2.88it/s][A
Epoch 5/5:  59%|█████▉    | 1305/2208 [07:52<05:10,  2.91it/s][A
Epoch 5/5:  59%|█████▉    | 1306/2208 [07:52<05:14,  2.86it/s][A
Epoch 5/5:  59%|█████▉    | 1307/2208 [07:52<05:17,  2.84it/s][A
Epoch 5/5:  59%|█████▉    | 1308/2208 [07:53<05:20,  2.81it/s][A
Epoch 5/5:  59%|█████▉    | 1309/2208 [07:53<05:15,  2.85it/s][A
Epoch 5/5:  59%|█████▉    | 1310/2208 [07:53<05:13,  2.86it/s][A
Epoch 5/5:  59%|█████▉    | 1311/2208 [07:54<05:13,  2.86it/s][A
Epoch 5/5:  59%|█████▉    | 1312/2208 [07:54<05:16,  2.83it/s][A
Epoch 5/5:  59%|█████▉    | 1313/2208 [07:55<05:21,  2.78it/s][A
Epoch 5/5:  60%|█████▉    | 1314/2208 [07:55<05:29,  2.71it/s][A
Epoch 5/5:  60%|█████▉    | 1315/2208 [07:55<05:23,  2.76it/s][A
Epoch 5/5:  60%|█████▉    | 1316/2208 [07:56<05:16,  2.81it/s][A
Epoch 5/5

Batch 1325: Training accuracy = 0.9141, F1 = 0.9089, Precision = 0.9089, Recall = 0.9141



Epoch 5/5:  60%|██████    | 1327/2208 [08:00<05:19,  2.76it/s][A
Epoch 5/5:  60%|██████    | 1328/2208 [08:00<05:24,  2.71it/s][A
Epoch 5/5:  60%|██████    | 1329/2208 [08:00<05:21,  2.73it/s][A
Epoch 5/5:  60%|██████    | 1330/2208 [08:01<05:23,  2.72it/s][A
Epoch 5/5:  60%|██████    | 1331/2208 [08:01<05:17,  2.77it/s][A
Epoch 5/5:  60%|██████    | 1332/2208 [08:01<05:10,  2.82it/s][A
Epoch 5/5:  60%|██████    | 1333/2208 [08:02<05:07,  2.84it/s][A
Epoch 5/5:  60%|██████    | 1334/2208 [08:02<05:09,  2.82it/s][A
Epoch 5/5:  60%|██████    | 1335/2208 [08:03<05:18,  2.74it/s][A
Epoch 5/5:  61%|██████    | 1336/2208 [08:03<05:11,  2.80it/s][A
Epoch 5/5:  61%|██████    | 1337/2208 [08:03<05:06,  2.84it/s][A
Epoch 5/5:  61%|██████    | 1338/2208 [08:04<05:03,  2.87it/s][A
Epoch 5/5:  61%|██████    | 1339/2208 [08:04<05:06,  2.83it/s][A
Epoch 5/5:  61%|██████    | 1340/2208 [08:04<05:10,  2.80it/s][A
Epoch 5/5:  61%|██████    | 1341/2208 [08:05<05:10,  2.79it/s][A
Epoch 5/5

Batch 1350: Training accuracy = 0.8672, F1 = 0.8599, Precision = 0.8672, Recall = 0.8672



Epoch 5/5:  61%|██████    | 1352/2208 [08:09<05:11,  2.75it/s][A
Epoch 5/5:  61%|██████▏   | 1353/2208 [08:09<05:14,  2.72it/s][A
Epoch 5/5:  61%|██████▏   | 1354/2208 [08:09<05:14,  2.71it/s][A
Epoch 5/5:  61%|██████▏   | 1355/2208 [08:10<05:12,  2.73it/s][A
Epoch 5/5:  61%|██████▏   | 1356/2208 [08:10<05:05,  2.79it/s][A
Epoch 5/5:  61%|██████▏   | 1357/2208 [08:10<05:06,  2.78it/s][A
Epoch 5/5:  62%|██████▏   | 1358/2208 [08:11<05:08,  2.76it/s][A
Epoch 5/5:  62%|██████▏   | 1359/2208 [08:11<05:04,  2.79it/s][A
Epoch 5/5:  62%|██████▏   | 1360/2208 [08:11<04:59,  2.83it/s][A
Epoch 5/5:  62%|██████▏   | 1361/2208 [08:12<05:03,  2.79it/s][A
Epoch 5/5:  62%|██████▏   | 1362/2208 [08:12<04:59,  2.83it/s][A
Epoch 5/5:  62%|██████▏   | 1363/2208 [08:13<04:57,  2.84it/s][A
Epoch 5/5:  62%|██████▏   | 1364/2208 [08:13<05:05,  2.76it/s][A
Epoch 5/5:  62%|██████▏   | 1365/2208 [08:13<05:06,  2.75it/s][A
Epoch 5/5:  62%|██████▏   | 1366/2208 [08:14<05:11,  2.70it/s][A
Epoch 5/5

Batch 1375: Training accuracy = 0.8281, F1 = 0.8191, Precision = 0.8394, Recall = 0.8281



Epoch 5/5:  62%|██████▏   | 1377/2208 [08:18<04:53,  2.83it/s][A
Epoch 5/5:  62%|██████▏   | 1378/2208 [08:18<04:55,  2.81it/s][A
Epoch 5/5:  62%|██████▏   | 1379/2208 [08:18<04:52,  2.83it/s][A
Epoch 5/5:  62%|██████▎   | 1380/2208 [08:19<04:51,  2.84it/s][A
Epoch 5/5:  63%|██████▎   | 1381/2208 [08:19<04:56,  2.79it/s][A
Epoch 5/5:  63%|██████▎   | 1382/2208 [08:19<04:53,  2.82it/s][A
Epoch 5/5:  63%|██████▎   | 1383/2208 [08:20<04:53,  2.81it/s][A
Epoch 5/5:  63%|██████▎   | 1384/2208 [08:20<05:00,  2.74it/s][A
Epoch 5/5:  63%|██████▎   | 1385/2208 [08:21<05:04,  2.70it/s][A
Epoch 5/5:  63%|██████▎   | 1386/2208 [08:21<05:03,  2.71it/s][A
Epoch 5/5:  63%|██████▎   | 1387/2208 [08:21<04:56,  2.77it/s][A
Epoch 5/5:  63%|██████▎   | 1388/2208 [08:22<05:02,  2.71it/s][A
Epoch 5/5:  63%|██████▎   | 1389/2208 [08:22<04:54,  2.78it/s][A
Epoch 5/5:  63%|██████▎   | 1390/2208 [08:22<04:49,  2.83it/s][A
Epoch 5/5:  63%|██████▎   | 1391/2208 [08:23<04:45,  2.86it/s][A
Epoch 5/5

Batch 1400: Training accuracy = 0.8672, F1 = 0.8526, Precision = 0.8529, Recall = 0.8672



Epoch 5/5:  63%|██████▎   | 1402/2208 [08:27<04:51,  2.77it/s][A
Epoch 5/5:  64%|██████▎   | 1403/2208 [08:27<04:52,  2.75it/s][A
Epoch 5/5:  64%|██████▎   | 1404/2208 [08:27<04:51,  2.76it/s][A
Epoch 5/5:  64%|██████▎   | 1405/2208 [08:28<04:50,  2.76it/s][A
Epoch 5/5:  64%|██████▎   | 1406/2208 [08:28<04:52,  2.74it/s][A
Epoch 5/5:  64%|██████▎   | 1407/2208 [08:28<04:46,  2.80it/s][A
Epoch 5/5:  64%|██████▍   | 1408/2208 [08:29<04:48,  2.77it/s][A
Epoch 5/5:  64%|██████▍   | 1409/2208 [08:29<04:45,  2.80it/s][A
Epoch 5/5:  64%|██████▍   | 1410/2208 [08:30<04:59,  2.67it/s][A
Epoch 5/5:  64%|██████▍   | 1411/2208 [08:30<04:50,  2.75it/s][A
Epoch 5/5:  64%|██████▍   | 1412/2208 [08:30<04:46,  2.78it/s][A
Epoch 5/5:  64%|██████▍   | 1413/2208 [08:31<04:40,  2.83it/s][A
Epoch 5/5:  64%|██████▍   | 1414/2208 [08:31<04:45,  2.78it/s][A
Epoch 5/5:  64%|██████▍   | 1415/2208 [08:31<04:44,  2.79it/s][A
Epoch 5/5:  64%|██████▍   | 1416/2208 [08:32<04:44,  2.79it/s][A
Epoch 5/5

Batch 1425: Training accuracy = 0.8516, F1 = 0.8424, Precision = 0.8411, Recall = 0.8516



Epoch 5/5:  65%|██████▍   | 1427/2208 [08:36<04:38,  2.80it/s][A
Epoch 5/5:  65%|██████▍   | 1428/2208 [08:36<04:42,  2.77it/s][A
Epoch 5/5:  65%|██████▍   | 1429/2208 [08:36<04:41,  2.76it/s][A
Epoch 5/5:  65%|██████▍   | 1430/2208 [08:37<04:43,  2.74it/s][A
Epoch 5/5:  65%|██████▍   | 1431/2208 [08:37<04:45,  2.73it/s][A
Epoch 5/5:  65%|██████▍   | 1432/2208 [08:37<04:45,  2.72it/s][A
Epoch 5/5:  65%|██████▍   | 1433/2208 [08:38<04:38,  2.78it/s][A
Epoch 5/5:  65%|██████▍   | 1434/2208 [08:38<04:33,  2.83it/s][A
Epoch 5/5:  65%|██████▍   | 1435/2208 [08:38<04:31,  2.85it/s][A
Epoch 5/5:  65%|██████▌   | 1436/2208 [08:39<04:29,  2.86it/s][A
Epoch 5/5:  65%|██████▌   | 1437/2208 [08:39<04:27,  2.89it/s][A
Epoch 5/5:  65%|██████▌   | 1438/2208 [08:39<04:25,  2.90it/s][A
Epoch 5/5:  65%|██████▌   | 1439/2208 [08:40<04:23,  2.91it/s][A
Epoch 5/5:  65%|██████▌   | 1440/2208 [08:40<04:22,  2.92it/s][A
Epoch 5/5:  65%|██████▌   | 1441/2208 [08:40<04:27,  2.87it/s][A
Epoch 5/5

Batch 1450: Training accuracy = 0.8672, F1 = 0.8576, Precision = 0.8607, Recall = 0.8672



Epoch 5/5:  66%|██████▌   | 1452/2208 [08:45<04:52,  2.59it/s][A
Epoch 5/5:  66%|██████▌   | 1453/2208 [08:45<04:47,  2.63it/s][A
Epoch 5/5:  66%|██████▌   | 1454/2208 [08:45<04:37,  2.72it/s][A
Epoch 5/5:  66%|██████▌   | 1455/2208 [08:46<04:33,  2.75it/s][A
Epoch 5/5:  66%|██████▌   | 1456/2208 [08:46<04:28,  2.80it/s][A
Epoch 5/5:  66%|██████▌   | 1457/2208 [08:46<04:31,  2.77it/s][A
Epoch 5/5:  66%|██████▌   | 1458/2208 [08:47<04:30,  2.77it/s][A
Epoch 5/5:  66%|██████▌   | 1459/2208 [08:47<04:31,  2.75it/s][A
Epoch 5/5:  66%|██████▌   | 1460/2208 [08:47<04:33,  2.74it/s][A
Epoch 5/5:  66%|██████▌   | 1461/2208 [08:48<04:28,  2.78it/s][A
Epoch 5/5:  66%|██████▌   | 1462/2208 [08:48<04:29,  2.77it/s][A
Epoch 5/5:  66%|██████▋   | 1463/2208 [08:48<04:27,  2.79it/s][A
Epoch 5/5:  66%|██████▋   | 1464/2208 [08:49<04:28,  2.77it/s][A
Epoch 5/5:  66%|██████▋   | 1465/2208 [08:49<04:24,  2.81it/s][A
Epoch 5/5:  66%|██████▋   | 1466/2208 [08:50<04:29,  2.75it/s][A
Epoch 5/5

Batch 1475: Training accuracy = 0.8359, F1 = 0.8424, Precision = 0.8776, Recall = 0.8359



Epoch 5/5:  67%|██████▋   | 1477/2208 [08:53<04:16,  2.85it/s][A
Epoch 5/5:  67%|██████▋   | 1478/2208 [08:54<04:13,  2.88it/s][A
Epoch 5/5:  67%|██████▋   | 1479/2208 [08:54<04:20,  2.80it/s][A
Epoch 5/5:  67%|██████▋   | 1480/2208 [08:54<04:16,  2.84it/s][A
Epoch 5/5:  67%|██████▋   | 1481/2208 [08:55<04:15,  2.84it/s][A
Epoch 5/5:  67%|██████▋   | 1482/2208 [08:55<04:15,  2.85it/s][A
Epoch 5/5:  67%|██████▋   | 1483/2208 [08:56<04:15,  2.84it/s][A
Epoch 5/5:  67%|██████▋   | 1484/2208 [08:56<04:18,  2.80it/s][A
Epoch 5/5:  67%|██████▋   | 1485/2208 [08:56<04:20,  2.77it/s][A
Epoch 5/5:  67%|██████▋   | 1486/2208 [08:57<04:23,  2.74it/s][A
Epoch 5/5:  67%|██████▋   | 1487/2208 [08:57<04:25,  2.71it/s][A
Epoch 5/5:  67%|██████▋   | 1488/2208 [08:57<04:26,  2.70it/s][A
Epoch 5/5:  67%|██████▋   | 1489/2208 [08:58<04:26,  2.70it/s][A
Epoch 5/5:  67%|██████▋   | 1490/2208 [08:58<04:27,  2.68it/s][A
Epoch 5/5:  68%|██████▊   | 1491/2208 [08:59<04:28,  2.67it/s][A
Epoch 5/5

Batch 1500: Training accuracy = 0.8984, F1 = 0.8880, Precision = 0.8867, Recall = 0.8984



Epoch 5/5:  68%|██████▊   | 1502/2208 [09:02<04:06,  2.87it/s][A
Epoch 5/5:  68%|██████▊   | 1503/2208 [09:03<04:04,  2.89it/s][A
Epoch 5/5:  68%|██████▊   | 1504/2208 [09:03<04:09,  2.83it/s][A
Epoch 5/5:  68%|██████▊   | 1505/2208 [09:04<04:10,  2.81it/s][A
Epoch 5/5:  68%|██████▊   | 1506/2208 [09:04<04:08,  2.82it/s][A
Epoch 5/5:  68%|██████▊   | 1507/2208 [09:04<04:05,  2.86it/s][A
Epoch 5/5:  68%|██████▊   | 1508/2208 [09:05<04:03,  2.87it/s][A
Epoch 5/5:  68%|██████▊   | 1509/2208 [09:05<04:07,  2.82it/s][A
Epoch 5/5:  68%|██████▊   | 1510/2208 [09:05<04:10,  2.79it/s][A
Epoch 5/5:  68%|██████▊   | 1511/2208 [09:06<04:05,  2.84it/s][A
Epoch 5/5:  68%|██████▊   | 1512/2208 [09:06<04:08,  2.80it/s][A
Epoch 5/5:  69%|██████▊   | 1513/2208 [09:06<04:15,  2.72it/s][A
Epoch 5/5:  69%|██████▊   | 1514/2208 [09:07<04:09,  2.78it/s][A
Epoch 5/5:  69%|██████▊   | 1515/2208 [09:07<04:06,  2.81it/s][A
Epoch 5/5:  69%|██████▊   | 1516/2208 [09:07<04:07,  2.80it/s][A
Epoch 5/5

Batch 1525: Training accuracy = 0.8750, F1 = 0.8646, Precision = 0.8711, Recall = 0.8750



Epoch 5/5:  69%|██████▉   | 1527/2208 [09:11<04:08,  2.74it/s][A
Epoch 5/5:  69%|██████▉   | 1528/2208 [09:12<04:02,  2.80it/s][A
Epoch 5/5:  69%|██████▉   | 1529/2208 [09:12<04:02,  2.79it/s][A
Epoch 5/5:  69%|██████▉   | 1530/2208 [09:12<04:00,  2.82it/s][A
Epoch 5/5:  69%|██████▉   | 1531/2208 [09:13<03:56,  2.86it/s][A
Epoch 5/5:  69%|██████▉   | 1532/2208 [09:13<03:54,  2.89it/s][A
Epoch 5/5:  69%|██████▉   | 1533/2208 [09:13<04:02,  2.78it/s][A
Epoch 5/5:  69%|██████▉   | 1534/2208 [09:14<04:04,  2.76it/s][A
Epoch 5/5:  70%|██████▉   | 1535/2208 [09:14<03:59,  2.81it/s][A
Epoch 5/5:  70%|██████▉   | 1536/2208 [09:15<03:59,  2.81it/s][A
Epoch 5/5:  70%|██████▉   | 1537/2208 [09:15<03:56,  2.84it/s][A
Epoch 5/5:  70%|██████▉   | 1538/2208 [09:15<03:53,  2.87it/s][A
Epoch 5/5:  70%|██████▉   | 1539/2208 [09:16<03:51,  2.88it/s][A
Epoch 5/5:  70%|██████▉   | 1540/2208 [09:16<03:53,  2.86it/s][A
Epoch 5/5:  70%|██████▉   | 1541/2208 [09:16<03:52,  2.87it/s][A
Epoch 5/5

Batch 1550: Training accuracy = 0.9141, F1 = 0.9036, Precision = 0.8984, Recall = 0.9141



Epoch 5/5:  70%|███████   | 1552/2208 [09:20<03:56,  2.77it/s][A
Epoch 5/5:  70%|███████   | 1553/2208 [09:21<03:52,  2.81it/s][A
Epoch 5/5:  70%|███████   | 1554/2208 [09:21<03:52,  2.81it/s][A
Epoch 5/5:  70%|███████   | 1555/2208 [09:21<03:51,  2.82it/s][A
Epoch 5/5:  70%|███████   | 1556/2208 [09:22<03:50,  2.82it/s][A
Epoch 5/5:  71%|███████   | 1557/2208 [09:22<03:47,  2.86it/s][A
Epoch 5/5:  71%|███████   | 1558/2208 [09:22<03:49,  2.84it/s][A
Epoch 5/5:  71%|███████   | 1559/2208 [09:23<03:50,  2.82it/s][A
Epoch 5/5:  71%|███████   | 1560/2208 [09:23<03:49,  2.83it/s][A
Epoch 5/5:  71%|███████   | 1561/2208 [09:23<03:46,  2.86it/s][A
Epoch 5/5:  71%|███████   | 1562/2208 [09:24<03:51,  2.79it/s][A
Epoch 5/5:  71%|███████   | 1563/2208 [09:24<03:53,  2.76it/s][A
Epoch 5/5:  71%|███████   | 1564/2208 [09:24<03:49,  2.80it/s][A
Epoch 5/5:  71%|███████   | 1565/2208 [09:25<03:49,  2.80it/s][A
Epoch 5/5:  71%|███████   | 1566/2208 [09:25<03:53,  2.76it/s][A
Epoch 5/5

Batch 1575: Training accuracy = 0.8906, F1 = 0.8880, Precision = 0.8932, Recall = 0.8906



Epoch 5/5:  71%|███████▏  | 1577/2208 [09:29<03:50,  2.74it/s][A
Epoch 5/5:  71%|███████▏  | 1578/2208 [09:30<03:45,  2.80it/s][A
Epoch 5/5:  72%|███████▏  | 1579/2208 [09:30<03:51,  2.72it/s][A
Epoch 5/5:  72%|███████▏  | 1580/2208 [09:30<03:49,  2.74it/s][A
Epoch 5/5:  72%|███████▏  | 1581/2208 [09:31<03:46,  2.77it/s][A
Epoch 5/5:  72%|███████▏  | 1582/2208 [09:31<03:43,  2.80it/s][A
Epoch 5/5:  72%|███████▏  | 1583/2208 [09:31<03:39,  2.85it/s][A
Epoch 5/5:  72%|███████▏  | 1584/2208 [09:32<03:37,  2.86it/s][A
Epoch 5/5:  72%|███████▏  | 1585/2208 [09:32<03:35,  2.89it/s][A
Epoch 5/5:  72%|███████▏  | 1586/2208 [09:32<03:34,  2.91it/s][A
Epoch 5/5:  72%|███████▏  | 1587/2208 [09:33<03:37,  2.86it/s][A
Epoch 5/5:  72%|███████▏  | 1588/2208 [09:33<03:35,  2.88it/s][A
Epoch 5/5:  72%|███████▏  | 1589/2208 [09:33<03:36,  2.86it/s][A
Epoch 5/5:  72%|███████▏  | 1590/2208 [09:34<03:37,  2.84it/s][A
Epoch 5/5:  72%|███████▏  | 1591/2208 [09:34<03:35,  2.87it/s][A
Epoch 5/5

Batch 1600: Training accuracy = 0.8281, F1 = 0.8161, Precision = 0.8199, Recall = 0.8281



Epoch 5/5:  73%|███████▎  | 1602/2208 [09:38<03:35,  2.82it/s][A
Epoch 5/5:  73%|███████▎  | 1603/2208 [09:38<03:38,  2.77it/s][A
Epoch 5/5:  73%|███████▎  | 1604/2208 [09:39<03:35,  2.80it/s][A
Epoch 5/5:  73%|███████▎  | 1605/2208 [09:39<03:35,  2.80it/s][A
Epoch 5/5:  73%|███████▎  | 1606/2208 [09:40<03:36,  2.78it/s][A
Epoch 5/5:  73%|███████▎  | 1607/2208 [09:40<03:41,  2.71it/s][A
Epoch 5/5:  73%|███████▎  | 1608/2208 [09:40<03:41,  2.71it/s][A
Epoch 5/5:  73%|███████▎  | 1609/2208 [09:41<03:37,  2.76it/s][A
Epoch 5/5:  73%|███████▎  | 1610/2208 [09:41<03:39,  2.73it/s][A
Epoch 5/5:  73%|███████▎  | 1611/2208 [09:41<03:39,  2.71it/s][A
Epoch 5/5:  73%|███████▎  | 1612/2208 [09:42<03:39,  2.71it/s][A
Epoch 5/5:  73%|███████▎  | 1613/2208 [09:42<03:36,  2.75it/s][A
Epoch 5/5:  73%|███████▎  | 1614/2208 [09:42<03:34,  2.77it/s][A
Epoch 5/5:  73%|███████▎  | 1615/2208 [09:43<03:33,  2.78it/s][A
Epoch 5/5:  73%|███████▎  | 1616/2208 [09:43<03:34,  2.75it/s][A
Epoch 5/5

Batch 1625: Training accuracy = 0.8594, F1 = 0.8547, Precision = 0.8639, Recall = 0.8594



Epoch 5/5:  74%|███████▎  | 1627/2208 [09:47<03:29,  2.78it/s][A
Epoch 5/5:  74%|███████▎  | 1628/2208 [09:47<03:27,  2.79it/s][A
Epoch 5/5:  74%|███████▍  | 1629/2208 [09:48<03:32,  2.73it/s][A
Epoch 5/5:  74%|███████▍  | 1630/2208 [09:48<03:32,  2.72it/s][A
Epoch 5/5:  74%|███████▍  | 1631/2208 [09:49<03:31,  2.73it/s][A
Epoch 5/5:  74%|███████▍  | 1632/2208 [09:49<03:26,  2.79it/s][A
Epoch 5/5:  74%|███████▍  | 1633/2208 [09:49<03:24,  2.81it/s][A
Epoch 5/5:  74%|███████▍  | 1634/2208 [09:50<03:23,  2.81it/s][A
Epoch 5/5:  74%|███████▍  | 1635/2208 [09:50<03:20,  2.85it/s][A
Epoch 5/5:  74%|███████▍  | 1636/2208 [09:50<03:22,  2.83it/s][A
Epoch 5/5:  74%|███████▍  | 1637/2208 [09:51<03:20,  2.85it/s][A
Epoch 5/5:  74%|███████▍  | 1638/2208 [09:51<03:19,  2.86it/s][A
Epoch 5/5:  74%|███████▍  | 1639/2208 [09:51<03:17,  2.87it/s][A
Epoch 5/5:  74%|███████▍  | 1640/2208 [09:52<03:18,  2.86it/s][A
Epoch 5/5:  74%|███████▍  | 1641/2208 [09:52<03:22,  2.81it/s][A
Epoch 5/5

Batch 1650: Training accuracy = 0.8438, F1 = 0.8242, Precision = 0.8242, Recall = 0.8438



Epoch 5/5:  75%|███████▍  | 1652/2208 [09:56<03:28,  2.66it/s][A
Epoch 5/5:  75%|███████▍  | 1653/2208 [09:56<03:25,  2.70it/s][A
Epoch 5/5:  75%|███████▍  | 1654/2208 [09:57<03:25,  2.69it/s][A
Epoch 5/5:  75%|███████▍  | 1655/2208 [09:57<03:19,  2.77it/s][A
Epoch 5/5:  75%|███████▌  | 1656/2208 [09:58<03:27,  2.66it/s][A
Epoch 5/5:  75%|███████▌  | 1657/2208 [09:58<03:27,  2.66it/s][A
Epoch 5/5:  75%|███████▌  | 1658/2208 [09:58<03:25,  2.67it/s][A
Epoch 5/5:  75%|███████▌  | 1659/2208 [09:59<03:22,  2.71it/s][A
Epoch 5/5:  75%|███████▌  | 1660/2208 [09:59<03:22,  2.70it/s][A
Epoch 5/5:  75%|███████▌  | 1661/2208 [09:59<03:23,  2.69it/s][A
Epoch 5/5:  75%|███████▌  | 1662/2208 [10:00<03:19,  2.74it/s][A
Epoch 5/5:  75%|███████▌  | 1663/2208 [10:00<03:14,  2.80it/s][A
Epoch 5/5:  75%|███████▌  | 1664/2208 [10:00<03:14,  2.80it/s][A
Epoch 5/5:  75%|███████▌  | 1665/2208 [10:01<03:11,  2.84it/s][A
Epoch 5/5:  75%|███████▌  | 1666/2208 [10:01<03:11,  2.83it/s][A
Epoch 5/5

Batch 1675: Training accuracy = 0.8906, F1 = 0.8893, Precision = 0.9036, Recall = 0.8906



Epoch 5/5:  76%|███████▌  | 1677/2208 [10:05<03:07,  2.83it/s][A
Epoch 5/5:  76%|███████▌  | 1678/2208 [10:05<03:05,  2.86it/s][A
Epoch 5/5:  76%|███████▌  | 1679/2208 [10:06<03:07,  2.82it/s][A
Epoch 5/5:  76%|███████▌  | 1680/2208 [10:06<03:04,  2.85it/s][A
Epoch 5/5:  76%|███████▌  | 1681/2208 [10:06<03:06,  2.83it/s][A
Epoch 5/5:  76%|███████▌  | 1682/2208 [10:07<03:12,  2.73it/s][A
Epoch 5/5:  76%|███████▌  | 1683/2208 [10:07<03:07,  2.79it/s][A
Epoch 5/5:  76%|███████▋  | 1684/2208 [10:08<03:08,  2.78it/s][A
Epoch 5/5:  76%|███████▋  | 1685/2208 [10:08<03:05,  2.82it/s][A
Epoch 5/5:  76%|███████▋  | 1686/2208 [10:08<03:10,  2.74it/s][A
Epoch 5/5:  76%|███████▋  | 1687/2208 [10:09<03:06,  2.79it/s][A
Epoch 5/5:  76%|███████▋  | 1688/2208 [10:09<03:05,  2.80it/s][A
Epoch 5/5:  76%|███████▋  | 1689/2208 [10:09<03:03,  2.83it/s][A
Epoch 5/5:  77%|███████▋  | 1690/2208 [10:10<03:04,  2.81it/s][A
Epoch 5/5:  77%|███████▋  | 1691/2208 [10:10<03:08,  2.75it/s][A
Epoch 5/5

Batch 1700: Training accuracy = 0.8750, F1 = 0.8765, Precision = 0.8887, Recall = 0.8750



Epoch 5/5:  77%|███████▋  | 1702/2208 [10:14<02:58,  2.83it/s][A
Epoch 5/5:  77%|███████▋  | 1703/2208 [10:14<03:00,  2.80it/s][A
Epoch 5/5:  77%|███████▋  | 1704/2208 [10:15<03:01,  2.78it/s][A
Epoch 5/5:  77%|███████▋  | 1705/2208 [10:15<03:06,  2.70it/s][A
Epoch 5/5:  77%|███████▋  | 1706/2208 [10:15<03:02,  2.76it/s][A
Epoch 5/5:  77%|███████▋  | 1707/2208 [10:16<02:57,  2.82it/s][A
Epoch 5/5:  77%|███████▋  | 1708/2208 [10:16<02:58,  2.80it/s][A
Epoch 5/5:  77%|███████▋  | 1709/2208 [10:17<02:59,  2.78it/s][A
Epoch 5/5:  77%|███████▋  | 1710/2208 [10:17<02:59,  2.78it/s][A
Epoch 5/5:  77%|███████▋  | 1711/2208 [10:17<02:55,  2.83it/s][A
Epoch 5/5:  78%|███████▊  | 1712/2208 [10:18<02:53,  2.86it/s][A
Epoch 5/5:  78%|███████▊  | 1713/2208 [10:18<02:55,  2.81it/s][A
Epoch 5/5:  78%|███████▊  | 1714/2208 [10:18<03:00,  2.73it/s][A
Epoch 5/5:  78%|███████▊  | 1715/2208 [10:19<02:56,  2.79it/s][A
Epoch 5/5:  78%|███████▊  | 1716/2208 [10:19<02:56,  2.79it/s][A
Epoch 5/5

Batch 1725: Training accuracy = 0.8828, F1 = 0.8659, Precision = 0.8659, Recall = 0.8828



Epoch 5/5:  78%|███████▊  | 1727/2208 [10:23<02:58,  2.69it/s][A
Epoch 5/5:  78%|███████▊  | 1728/2208 [10:23<02:59,  2.67it/s][A
Epoch 5/5:  78%|███████▊  | 1729/2208 [10:24<02:58,  2.68it/s][A
Epoch 5/5:  78%|███████▊  | 1730/2208 [10:24<02:55,  2.72it/s][A
Epoch 5/5:  78%|███████▊  | 1731/2208 [10:25<02:53,  2.75it/s][A
Epoch 5/5:  78%|███████▊  | 1732/2208 [10:25<02:59,  2.65it/s][A
Epoch 5/5:  78%|███████▊  | 1733/2208 [10:25<03:03,  2.59it/s][A
Epoch 5/5:  79%|███████▊  | 1734/2208 [10:26<02:59,  2.64it/s][A
Epoch 5/5:  79%|███████▊  | 1735/2208 [10:26<02:54,  2.71it/s][A
Epoch 5/5:  79%|███████▊  | 1736/2208 [10:26<02:52,  2.73it/s][A
Epoch 5/5:  79%|███████▊  | 1737/2208 [10:27<02:53,  2.72it/s][A
Epoch 5/5:  79%|███████▊  | 1738/2208 [10:27<02:54,  2.69it/s][A
Epoch 5/5:  79%|███████▉  | 1739/2208 [10:28<02:53,  2.70it/s][A
Epoch 5/5:  79%|███████▉  | 1740/2208 [10:28<02:53,  2.70it/s][A
Epoch 5/5:  79%|███████▉  | 1741/2208 [10:28<02:48,  2.77it/s][A
Epoch 5/5

Batch 1750: Training accuracy = 0.9062, F1 = 0.8951, Precision = 0.9021, Recall = 0.9062



Epoch 5/5:  79%|███████▉  | 1752/2208 [10:32<02:45,  2.76it/s][A
Epoch 5/5:  79%|███████▉  | 1753/2208 [10:33<02:45,  2.74it/s][A
Epoch 5/5:  79%|███████▉  | 1754/2208 [10:33<02:46,  2.73it/s][A
Epoch 5/5:  79%|███████▉  | 1755/2208 [10:33<02:44,  2.76it/s][A
Epoch 5/5:  80%|███████▉  | 1756/2208 [10:34<02:40,  2.82it/s][A
Epoch 5/5:  80%|███████▉  | 1757/2208 [10:34<02:37,  2.85it/s][A
Epoch 5/5:  80%|███████▉  | 1758/2208 [10:34<02:37,  2.86it/s][A
Epoch 5/5:  80%|███████▉  | 1759/2208 [10:35<02:35,  2.88it/s][A
Epoch 5/5:  80%|███████▉  | 1760/2208 [10:35<02:36,  2.86it/s][A
Epoch 5/5:  80%|███████▉  | 1761/2208 [10:35<02:38,  2.81it/s][A
Epoch 5/5:  80%|███████▉  | 1762/2208 [10:36<02:36,  2.85it/s][A
Epoch 5/5:  80%|███████▉  | 1763/2208 [10:36<02:36,  2.85it/s][A
Epoch 5/5:  80%|███████▉  | 1764/2208 [10:36<02:34,  2.88it/s][A
Epoch 5/5:  80%|███████▉  | 1765/2208 [10:37<02:32,  2.90it/s][A
Epoch 5/5:  80%|███████▉  | 1766/2208 [10:37<02:36,  2.82it/s][A
Epoch 5/5

Batch 1775: Training accuracy = 0.8828, F1 = 0.8792, Precision = 0.8841, Recall = 0.8828



Epoch 5/5:  80%|████████  | 1777/2208 [10:41<02:42,  2.65it/s][A
Epoch 5/5:  81%|████████  | 1778/2208 [10:42<02:43,  2.64it/s][A
Epoch 5/5:  81%|████████  | 1779/2208 [10:42<02:41,  2.66it/s][A
Epoch 5/5:  81%|████████  | 1780/2208 [10:42<02:41,  2.65it/s][A
Epoch 5/5:  81%|████████  | 1781/2208 [10:43<02:39,  2.68it/s][A
Epoch 5/5:  81%|████████  | 1782/2208 [10:43<02:35,  2.74it/s][A
Epoch 5/5:  81%|████████  | 1783/2208 [10:43<02:37,  2.70it/s][A
Epoch 5/5:  81%|████████  | 1784/2208 [10:44<02:37,  2.69it/s][A
Epoch 5/5:  81%|████████  | 1785/2208 [10:44<02:35,  2.73it/s][A
Epoch 5/5:  81%|████████  | 1786/2208 [10:44<02:32,  2.77it/s][A
Epoch 5/5:  81%|████████  | 1787/2208 [10:45<02:30,  2.80it/s][A
Epoch 5/5:  81%|████████  | 1788/2208 [10:45<02:31,  2.77it/s][A
Epoch 5/5:  81%|████████  | 1789/2208 [10:45<02:28,  2.82it/s][A
Epoch 5/5:  81%|████████  | 1790/2208 [10:46<02:27,  2.83it/s][A
Epoch 5/5:  81%|████████  | 1791/2208 [10:46<02:28,  2.81it/s][A
Epoch 5/5

Batch 1800: Training accuracy = 0.8594, F1 = 0.8612, Precision = 0.8867, Recall = 0.8594



Epoch 5/5:  82%|████████▏ | 1802/2208 [10:50<02:28,  2.73it/s][A
Epoch 5/5:  82%|████████▏ | 1803/2208 [10:50<02:24,  2.80it/s][A
Epoch 5/5:  82%|████████▏ | 1804/2208 [10:51<02:22,  2.83it/s][A
Epoch 5/5:  82%|████████▏ | 1805/2208 [10:51<02:21,  2.86it/s][A
Epoch 5/5:  82%|████████▏ | 1806/2208 [10:52<02:21,  2.85it/s][A
Epoch 5/5:  82%|████████▏ | 1807/2208 [10:52<02:19,  2.87it/s][A
Epoch 5/5:  82%|████████▏ | 1808/2208 [10:52<02:22,  2.81it/s][A
Epoch 5/5:  82%|████████▏ | 1809/2208 [10:53<02:23,  2.77it/s][A
Epoch 5/5:  82%|████████▏ | 1810/2208 [10:53<02:25,  2.74it/s][A
Epoch 5/5:  82%|████████▏ | 1811/2208 [10:53<02:23,  2.76it/s][A
Epoch 5/5:  82%|████████▏ | 1812/2208 [10:54<02:28,  2.67it/s][A
Epoch 5/5:  82%|████████▏ | 1813/2208 [10:54<02:25,  2.72it/s][A
Epoch 5/5:  82%|████████▏ | 1814/2208 [10:54<02:25,  2.71it/s][A
Epoch 5/5:  82%|████████▏ | 1815/2208 [10:55<02:22,  2.75it/s][A
Epoch 5/5:  82%|████████▏ | 1816/2208 [10:55<02:23,  2.73it/s][A
Epoch 5/5

Batch 1825: Training accuracy = 0.8906, F1 = 0.8815, Precision = 0.8815, Recall = 0.8906



Epoch 5/5:  83%|████████▎ | 1827/2208 [10:59<02:14,  2.84it/s][A
Epoch 5/5:  83%|████████▎ | 1828/2208 [10:59<02:15,  2.80it/s][A
Epoch 5/5:  83%|████████▎ | 1829/2208 [11:00<02:16,  2.78it/s][A
Epoch 5/5:  83%|████████▎ | 1830/2208 [11:00<02:18,  2.73it/s][A
Epoch 5/5:  83%|████████▎ | 1831/2208 [11:00<02:15,  2.78it/s][A
Epoch 5/5:  83%|████████▎ | 1832/2208 [11:01<02:16,  2.75it/s][A
Epoch 5/5:  83%|████████▎ | 1833/2208 [11:01<02:13,  2.80it/s][A
Epoch 5/5:  83%|████████▎ | 1834/2208 [11:02<02:12,  2.82it/s][A
Epoch 5/5:  83%|████████▎ | 1835/2208 [11:02<02:14,  2.77it/s][A
Epoch 5/5:  83%|████████▎ | 1836/2208 [11:02<02:11,  2.82it/s][A
Epoch 5/5:  83%|████████▎ | 1837/2208 [11:03<02:09,  2.86it/s][A
Epoch 5/5:  83%|████████▎ | 1838/2208 [11:03<02:12,  2.78it/s][A
Epoch 5/5:  83%|████████▎ | 1839/2208 [11:03<02:12,  2.79it/s][A
Epoch 5/5:  83%|████████▎ | 1840/2208 [11:04<02:13,  2.76it/s][A
Epoch 5/5:  83%|████████▎ | 1841/2208 [11:04<02:16,  2.70it/s][A
Epoch 5/5

Batch 1850: Training accuracy = 0.8906, F1 = 0.8745, Precision = 0.8659, Recall = 0.8906



Epoch 5/5:  84%|████████▍ | 1852/2208 [11:08<02:13,  2.66it/s][A
Epoch 5/5:  84%|████████▍ | 1853/2208 [11:08<02:10,  2.72it/s][A
Epoch 5/5:  84%|████████▍ | 1854/2208 [11:09<02:15,  2.61it/s][A
Epoch 5/5:  84%|████████▍ | 1855/2208 [11:09<02:16,  2.59it/s][A
Epoch 5/5:  84%|████████▍ | 1856/2208 [11:10<02:14,  2.63it/s][A
Epoch 5/5:  84%|████████▍ | 1857/2208 [11:10<02:09,  2.71it/s][A
Epoch 5/5:  84%|████████▍ | 1858/2208 [11:10<02:07,  2.74it/s][A
Epoch 5/5:  84%|████████▍ | 1859/2208 [11:11<02:07,  2.73it/s][A
Epoch 5/5:  84%|████████▍ | 1860/2208 [11:11<02:05,  2.76it/s][A
Epoch 5/5:  84%|████████▍ | 1861/2208 [11:11<02:07,  2.72it/s][A
Epoch 5/5:  84%|████████▍ | 1862/2208 [11:12<02:07,  2.71it/s][A
Epoch 5/5:  84%|████████▍ | 1863/2208 [11:12<02:07,  2.70it/s][A
Epoch 5/5:  84%|████████▍ | 1864/2208 [11:13<02:06,  2.71it/s][A
Epoch 5/5:  84%|████████▍ | 1865/2208 [11:13<02:08,  2.67it/s][A
Epoch 5/5:  85%|████████▍ | 1866/2208 [11:13<02:09,  2.65it/s][A
Epoch 5/5

Batch 1875: Training accuracy = 0.8359, F1 = 0.8197, Precision = 0.8259, Recall = 0.8359



Epoch 5/5:  85%|████████▌ | 1877/2208 [11:17<01:58,  2.79it/s][A
Epoch 5/5:  85%|████████▌ | 1878/2208 [11:18<01:57,  2.80it/s][A
Epoch 5/5:  85%|████████▌ | 1879/2208 [11:18<01:59,  2.76it/s][A
Epoch 5/5:  85%|████████▌ | 1880/2208 [11:18<01:58,  2.76it/s][A
Epoch 5/5:  85%|████████▌ | 1881/2208 [11:19<01:56,  2.82it/s][A
Epoch 5/5:  85%|████████▌ | 1882/2208 [11:19<01:55,  2.81it/s][A
Epoch 5/5:  85%|████████▌ | 1883/2208 [11:19<01:56,  2.80it/s][A
Epoch 5/5:  85%|████████▌ | 1884/2208 [11:20<01:59,  2.71it/s][A
Epoch 5/5:  85%|████████▌ | 1885/2208 [11:20<01:58,  2.73it/s][A
Epoch 5/5:  85%|████████▌ | 1886/2208 [11:20<01:56,  2.76it/s][A
Epoch 5/5:  85%|████████▌ | 1887/2208 [11:21<01:56,  2.76it/s][A
Epoch 5/5:  86%|████████▌ | 1888/2208 [11:21<01:54,  2.80it/s][A
Epoch 5/5:  86%|████████▌ | 1889/2208 [11:22<01:57,  2.72it/s][A
Epoch 5/5:  86%|████████▌ | 1890/2208 [11:22<02:00,  2.63it/s][A
Epoch 5/5:  86%|████████▌ | 1891/2208 [11:22<02:02,  2.58it/s][A
Epoch 5/5

Batch 1900: Training accuracy = 0.8750, F1 = 0.8542, Precision = 0.8522, Recall = 0.8750



Epoch 5/5:  86%|████████▌ | 1902/2208 [11:26<01:52,  2.71it/s][A
Epoch 5/5:  86%|████████▌ | 1903/2208 [11:27<01:52,  2.70it/s][A
Epoch 5/5:  86%|████████▌ | 1904/2208 [11:27<01:51,  2.73it/s][A
Epoch 5/5:  86%|████████▋ | 1905/2208 [11:28<01:51,  2.72it/s][A
Epoch 5/5:  86%|████████▋ | 1906/2208 [11:28<01:52,  2.68it/s][A
Epoch 5/5:  86%|████████▋ | 1907/2208 [11:28<01:51,  2.70it/s][A
Epoch 5/5:  86%|████████▋ | 1908/2208 [11:29<01:49,  2.73it/s][A
Epoch 5/5:  86%|████████▋ | 1909/2208 [11:29<01:48,  2.76it/s][A
Epoch 5/5:  87%|████████▋ | 1910/2208 [11:29<01:47,  2.78it/s][A
Epoch 5/5:  87%|████████▋ | 1911/2208 [11:30<01:46,  2.79it/s][A
Epoch 5/5:  87%|████████▋ | 1912/2208 [11:30<01:47,  2.75it/s][A
Epoch 5/5:  87%|████████▋ | 1913/2208 [11:30<01:47,  2.76it/s][A
Epoch 5/5:  87%|████████▋ | 1914/2208 [11:31<01:45,  2.80it/s][A
Epoch 5/5:  87%|████████▋ | 1915/2208 [11:31<01:47,  2.74it/s][A
Epoch 5/5:  87%|████████▋ | 1916/2208 [11:32<01:45,  2.77it/s][A
Epoch 5/5

Batch 1925: Training accuracy = 0.8438, F1 = 0.8328, Precision = 0.8424, Recall = 0.8438



Epoch 5/5:  87%|████████▋ | 1927/2208 [11:35<01:40,  2.79it/s][A
Epoch 5/5:  87%|████████▋ | 1928/2208 [11:36<01:42,  2.72it/s][A
Epoch 5/5:  87%|████████▋ | 1929/2208 [11:36<01:40,  2.77it/s][A
Epoch 5/5:  87%|████████▋ | 1930/2208 [11:37<01:40,  2.77it/s][A
Epoch 5/5:  87%|████████▋ | 1931/2208 [11:37<01:41,  2.74it/s][A
Epoch 5/5:  88%|████████▊ | 1932/2208 [11:37<01:40,  2.74it/s][A
Epoch 5/5:  88%|████████▊ | 1933/2208 [11:38<01:38,  2.78it/s][A
Epoch 5/5:  88%|████████▊ | 1934/2208 [11:38<01:38,  2.79it/s][A
Epoch 5/5:  88%|████████▊ | 1935/2208 [11:38<01:38,  2.77it/s][A
Epoch 5/5:  88%|████████▊ | 1936/2208 [11:39<01:38,  2.77it/s][A
Epoch 5/5:  88%|████████▊ | 1937/2208 [11:39<01:36,  2.79it/s][A
Epoch 5/5:  88%|████████▊ | 1938/2208 [11:39<01:35,  2.84it/s][A
Epoch 5/5:  88%|████████▊ | 1939/2208 [11:40<01:36,  2.78it/s][A
Epoch 5/5:  88%|████████▊ | 1940/2208 [11:40<01:36,  2.79it/s][A
Epoch 5/5:  88%|████████▊ | 1941/2208 [11:41<01:33,  2.84it/s][A
Epoch 5/5

Batch 1950: Training accuracy = 0.7812, F1 = 0.7819, Precision = 0.8006, Recall = 0.7812



Epoch 5/5:  88%|████████▊ | 1952/2208 [11:44<01:31,  2.78it/s][A
Epoch 5/5:  88%|████████▊ | 1953/2208 [11:45<01:34,  2.70it/s][A
Epoch 5/5:  88%|████████▊ | 1954/2208 [11:45<01:33,  2.71it/s][A
Epoch 5/5:  89%|████████▊ | 1955/2208 [11:46<01:33,  2.70it/s][A
Epoch 5/5:  89%|████████▊ | 1956/2208 [11:46<01:31,  2.76it/s][A
Epoch 5/5:  89%|████████▊ | 1957/2208 [11:46<01:29,  2.81it/s][A
Epoch 5/5:  89%|████████▊ | 1958/2208 [11:47<01:28,  2.82it/s][A
Epoch 5/5:  89%|████████▊ | 1959/2208 [11:47<01:29,  2.78it/s][A
Epoch 5/5:  89%|████████▉ | 1960/2208 [11:47<01:28,  2.82it/s][A
Epoch 5/5:  89%|████████▉ | 1961/2208 [11:48<01:28,  2.80it/s][A
Epoch 5/5:  89%|████████▉ | 1962/2208 [11:48<01:28,  2.79it/s][A
Epoch 5/5:  89%|████████▉ | 1963/2208 [11:48<01:27,  2.79it/s][A
Epoch 5/5:  89%|████████▉ | 1964/2208 [11:49<01:28,  2.77it/s][A
Epoch 5/5:  89%|████████▉ | 1965/2208 [11:49<01:26,  2.81it/s][A
Epoch 5/5:  89%|████████▉ | 1966/2208 [11:50<01:27,  2.77it/s][A
Epoch 5/5

Batch 1975: Training accuracy = 0.8594, F1 = 0.8393, Precision = 0.8333, Recall = 0.8594



Epoch 5/5:  90%|████████▉ | 1977/2208 [11:53<01:25,  2.70it/s][A
Epoch 5/5:  90%|████████▉ | 1978/2208 [11:54<01:25,  2.68it/s][A
Epoch 5/5:  90%|████████▉ | 1979/2208 [11:54<01:25,  2.68it/s][A
Epoch 5/5:  90%|████████▉ | 1980/2208 [11:55<01:24,  2.69it/s][A
Epoch 5/5:  90%|████████▉ | 1981/2208 [11:55<01:24,  2.68it/s][A
Epoch 5/5:  90%|████████▉ | 1982/2208 [11:55<01:24,  2.68it/s][A
Epoch 5/5:  90%|████████▉ | 1983/2208 [11:56<01:22,  2.72it/s][A
Epoch 5/5:  90%|████████▉ | 1984/2208 [11:56<01:22,  2.72it/s][A
Epoch 5/5:  90%|████████▉ | 1985/2208 [11:56<01:20,  2.77it/s][A
Epoch 5/5:  90%|████████▉ | 1986/2208 [11:57<01:18,  2.82it/s][A
Epoch 5/5:  90%|████████▉ | 1987/2208 [11:57<01:17,  2.85it/s][A
Epoch 5/5:  90%|█████████ | 1988/2208 [11:57<01:16,  2.86it/s][A
Epoch 5/5:  90%|█████████ | 1989/2208 [11:58<01:17,  2.83it/s][A
Epoch 5/5:  90%|█████████ | 1990/2208 [11:58<01:16,  2.86it/s][A
Epoch 5/5:  90%|█████████ | 1991/2208 [11:59<01:16,  2.83it/s][A
Epoch 5/5

Batch 2000: Training accuracy = 0.8594, F1 = 0.8500, Precision = 0.8451, Recall = 0.8594



Epoch 5/5:  91%|█████████ | 2002/2208 [12:02<01:13,  2.82it/s][A
Epoch 5/5:  91%|█████████ | 2003/2208 [12:03<01:13,  2.78it/s][A
Epoch 5/5:  91%|█████████ | 2004/2208 [12:03<01:13,  2.79it/s][A
Epoch 5/5:  91%|█████████ | 2005/2208 [12:03<01:13,  2.77it/s][A
Epoch 5/5:  91%|█████████ | 2006/2208 [12:04<01:13,  2.73it/s][A
Epoch 5/5:  91%|█████████ | 2007/2208 [12:04<01:12,  2.79it/s][A
Epoch 5/5:  91%|█████████ | 2008/2208 [12:05<01:12,  2.78it/s][A
Epoch 5/5:  91%|█████████ | 2009/2208 [12:05<01:12,  2.74it/s][A
Epoch 5/5:  91%|█████████ | 2010/2208 [12:05<01:11,  2.79it/s][A
Epoch 5/5:  91%|█████████ | 2011/2208 [12:06<01:11,  2.76it/s][A
Epoch 5/5:  91%|█████████ | 2012/2208 [12:06<01:11,  2.73it/s][A
Epoch 5/5:  91%|█████████ | 2013/2208 [12:06<01:10,  2.78it/s][A
Epoch 5/5:  91%|█████████ | 2014/2208 [12:07<01:08,  2.83it/s][A
Epoch 5/5:  91%|█████████▏| 2015/2208 [12:07<01:07,  2.84it/s][A
Epoch 5/5:  91%|█████████▏| 2016/2208 [12:07<01:10,  2.73it/s][A
Epoch 5/5

Batch 2025: Training accuracy = 0.8516, F1 = 0.8469, Precision = 0.8633, Recall = 0.8516



Epoch 5/5:  92%|█████████▏| 2027/2208 [12:12<01:06,  2.71it/s][A
Epoch 5/5:  92%|█████████▏| 2028/2208 [12:12<01:04,  2.77it/s][A
Epoch 5/5:  92%|█████████▏| 2029/2208 [12:12<01:03,  2.81it/s][A
Epoch 5/5:  92%|█████████▏| 2030/2208 [12:13<01:02,  2.85it/s][A
Epoch 5/5:  92%|█████████▏| 2031/2208 [12:13<01:02,  2.85it/s][A
Epoch 5/5:  92%|█████████▏| 2032/2208 [12:13<01:01,  2.88it/s][A
Epoch 5/5:  92%|█████████▏| 2033/2208 [12:14<01:01,  2.86it/s][A
Epoch 5/5:  92%|█████████▏| 2034/2208 [12:14<01:00,  2.86it/s][A
Epoch 5/5:  92%|█████████▏| 2035/2208 [12:14<01:02,  2.79it/s][A
Epoch 5/5:  92%|█████████▏| 2036/2208 [12:15<01:01,  2.81it/s][A
Epoch 5/5:  92%|█████████▏| 2037/2208 [12:15<01:00,  2.81it/s][A
Epoch 5/5:  92%|█████████▏| 2038/2208 [12:15<01:01,  2.78it/s][A
Epoch 5/5:  92%|█████████▏| 2039/2208 [12:16<01:01,  2.75it/s][A
Epoch 5/5:  92%|█████████▏| 2040/2208 [12:16<01:00,  2.77it/s][A
Epoch 5/5:  92%|█████████▏| 2041/2208 [12:17<00:59,  2.82it/s][A
Epoch 5/5

Batch 2050: Training accuracy = 0.8750, F1 = 0.8709, Precision = 0.8812, Recall = 0.8750



Epoch 5/5:  93%|█████████▎| 2052/2208 [12:21<00:58,  2.69it/s][A
Epoch 5/5:  93%|█████████▎| 2053/2208 [12:21<00:57,  2.70it/s][A
Epoch 5/5:  93%|█████████▎| 2054/2208 [12:21<00:56,  2.74it/s][A
Epoch 5/5:  93%|█████████▎| 2055/2208 [12:22<00:55,  2.74it/s][A
Epoch 5/5:  93%|█████████▎| 2056/2208 [12:22<00:54,  2.79it/s][A
Epoch 5/5:  93%|█████████▎| 2057/2208 [12:22<00:54,  2.76it/s][A
Epoch 5/5:  93%|█████████▎| 2058/2208 [12:23<00:55,  2.73it/s][A
Epoch 5/5:  93%|█████████▎| 2059/2208 [12:23<00:53,  2.77it/s][A
Epoch 5/5:  93%|█████████▎| 2060/2208 [12:23<00:52,  2.80it/s][A
Epoch 5/5:  93%|█████████▎| 2061/2208 [12:24<00:52,  2.82it/s][A
Epoch 5/5:  93%|█████████▎| 2062/2208 [12:24<00:51,  2.83it/s][A
Epoch 5/5:  93%|█████████▎| 2063/2208 [12:25<00:51,  2.83it/s][A
Epoch 5/5:  93%|█████████▎| 2064/2208 [12:25<00:51,  2.81it/s][A
Epoch 5/5:  94%|█████████▎| 2065/2208 [12:25<00:51,  2.77it/s][A
Epoch 5/5:  94%|█████████▎| 2066/2208 [12:26<00:50,  2.81it/s][A
Epoch 5/5

Batch 2075: Training accuracy = 0.8828, F1 = 0.8737, Precision = 0.8815, Recall = 0.8828



Epoch 5/5:  94%|█████████▍| 2077/2208 [12:30<00:46,  2.81it/s][A
Epoch 5/5:  94%|█████████▍| 2078/2208 [12:30<00:45,  2.83it/s][A
Epoch 5/5:  94%|█████████▍| 2079/2208 [12:30<00:45,  2.86it/s][A
Epoch 5/5:  94%|█████████▍| 2080/2208 [12:31<00:45,  2.84it/s][A
Epoch 5/5:  94%|█████████▍| 2081/2208 [12:31<00:46,  2.75it/s][A
Epoch 5/5:  94%|█████████▍| 2082/2208 [12:31<00:45,  2.77it/s][A
Epoch 5/5:  94%|█████████▍| 2083/2208 [12:32<00:44,  2.81it/s][A
Epoch 5/5:  94%|█████████▍| 2084/2208 [12:32<00:44,  2.80it/s][A
Epoch 5/5:  94%|█████████▍| 2085/2208 [12:32<00:44,  2.79it/s][A
Epoch 5/5:  94%|█████████▍| 2086/2208 [12:33<00:43,  2.80it/s][A
Epoch 5/5:  95%|█████████▍| 2087/2208 [12:33<00:43,  2.81it/s][A
Epoch 5/5:  95%|█████████▍| 2088/2208 [12:33<00:42,  2.82it/s][A
Epoch 5/5:  95%|█████████▍| 2089/2208 [12:34<00:42,  2.82it/s][A
Epoch 5/5:  95%|█████████▍| 2090/2208 [12:34<00:41,  2.82it/s][A
Epoch 5/5:  95%|█████████▍| 2091/2208 [12:35<00:41,  2.82it/s][A
Epoch 5/5

Batch 2100: Training accuracy = 0.8906, F1 = 0.8938, Precision = 0.9062, Recall = 0.8906



Epoch 5/5:  95%|█████████▌| 2102/2208 [12:39<00:38,  2.78it/s][A
Epoch 5/5:  95%|█████████▌| 2103/2208 [12:39<00:37,  2.79it/s][A
Epoch 5/5:  95%|█████████▌| 2104/2208 [12:39<00:37,  2.76it/s][A
Epoch 5/5:  95%|█████████▌| 2105/2208 [12:40<00:37,  2.75it/s][A
Epoch 5/5:  95%|█████████▌| 2106/2208 [12:40<00:36,  2.80it/s][A
Epoch 5/5:  95%|█████████▌| 2107/2208 [12:40<00:36,  2.77it/s][A
Epoch 5/5:  95%|█████████▌| 2108/2208 [12:41<00:36,  2.77it/s][A
Epoch 5/5:  96%|█████████▌| 2109/2208 [12:41<00:35,  2.78it/s][A
Epoch 5/5:  96%|█████████▌| 2110/2208 [12:41<00:34,  2.82it/s][A
Epoch 5/5:  96%|█████████▌| 2111/2208 [12:42<00:33,  2.86it/s][A
Epoch 5/5:  96%|█████████▌| 2112/2208 [12:42<00:33,  2.89it/s][A
Epoch 5/5:  96%|█████████▌| 2113/2208 [12:42<00:32,  2.90it/s][A
Epoch 5/5:  96%|█████████▌| 2114/2208 [12:43<00:32,  2.86it/s][A
Epoch 5/5:  96%|█████████▌| 2115/2208 [12:43<00:33,  2.80it/s][A
Epoch 5/5:  96%|█████████▌| 2116/2208 [12:44<00:32,  2.84it/s][A
Epoch 5/5

Batch 2125: Training accuracy = 0.8750, F1 = 0.8555, Precision = 0.8503, Recall = 0.8750



Epoch 5/5:  96%|█████████▋| 2127/2208 [12:47<00:28,  2.81it/s][A
Epoch 5/5:  96%|█████████▋| 2128/2208 [12:48<00:28,  2.84it/s][A
Epoch 5/5:  96%|█████████▋| 2129/2208 [12:48<00:28,  2.82it/s][A
Epoch 5/5:  96%|█████████▋| 2130/2208 [12:48<00:27,  2.86it/s][A
Epoch 5/5:  97%|█████████▋| 2131/2208 [12:49<00:26,  2.88it/s][A
Epoch 5/5:  97%|█████████▋| 2132/2208 [12:49<00:26,  2.88it/s][A
Epoch 5/5:  97%|█████████▋| 2133/2208 [12:50<00:26,  2.84it/s][A
Epoch 5/5:  97%|█████████▋| 2134/2208 [12:50<00:26,  2.84it/s][A
Epoch 5/5:  97%|█████████▋| 2135/2208 [12:50<00:26,  2.79it/s][A
Epoch 5/5:  97%|█████████▋| 2136/2208 [12:51<00:25,  2.78it/s][A
Epoch 5/5:  97%|█████████▋| 2137/2208 [12:51<00:25,  2.73it/s][A
Epoch 5/5:  97%|█████████▋| 2138/2208 [12:51<00:25,  2.79it/s][A
Epoch 5/5:  97%|█████████▋| 2139/2208 [12:52<00:24,  2.82it/s][A
Epoch 5/5:  97%|█████████▋| 2140/2208 [12:52<00:24,  2.78it/s][A
Epoch 5/5:  97%|█████████▋| 2141/2208 [12:52<00:23,  2.80it/s][A
Epoch 5/5

Batch 2150: Training accuracy = 0.9062, F1 = 0.9062, Precision = 0.9141, Recall = 0.9062



Epoch 5/5:  97%|█████████▋| 2152/2208 [12:56<00:19,  2.80it/s][A
Epoch 5/5:  98%|█████████▊| 2153/2208 [12:57<00:19,  2.84it/s][A
Epoch 5/5:  98%|█████████▊| 2154/2208 [12:57<00:18,  2.87it/s][A
Epoch 5/5:  98%|█████████▊| 2155/2208 [12:57<00:18,  2.89it/s][A
Epoch 5/5:  98%|█████████▊| 2156/2208 [12:58<00:18,  2.82it/s][A
Epoch 5/5:  98%|█████████▊| 2157/2208 [12:58<00:17,  2.86it/s][A
Epoch 5/5:  98%|█████████▊| 2158/2208 [12:59<00:17,  2.78it/s][A
Epoch 5/5:  98%|█████████▊| 2159/2208 [12:59<00:17,  2.77it/s][A
Epoch 5/5:  98%|█████████▊| 2160/2208 [12:59<00:17,  2.69it/s][A
Epoch 5/5:  98%|█████████▊| 2161/2208 [13:00<00:17,  2.75it/s][A
Epoch 5/5:  98%|█████████▊| 2162/2208 [13:00<00:16,  2.78it/s][A
Epoch 5/5:  98%|█████████▊| 2163/2208 [13:00<00:16,  2.81it/s][A
Epoch 5/5:  98%|█████████▊| 2164/2208 [13:01<00:15,  2.83it/s][A
Epoch 5/5:  98%|█████████▊| 2165/2208 [13:01<00:15,  2.82it/s][A
Epoch 5/5:  98%|█████████▊| 2166/2208 [13:01<00:15,  2.80it/s][A
Epoch 5/5

Batch 2175: Training accuracy = 0.8203, F1 = 0.8302, Precision = 0.8581, Recall = 0.8203



Epoch 5/5:  99%|█████████▊| 2177/2208 [13:05<00:11,  2.68it/s][A
Epoch 5/5:  99%|█████████▊| 2178/2208 [13:06<00:11,  2.71it/s][A
Epoch 5/5:  99%|█████████▊| 2179/2208 [13:06<00:10,  2.66it/s][A
Epoch 5/5:  99%|█████████▊| 2180/2208 [13:07<00:10,  2.70it/s][A
Epoch 5/5:  99%|█████████▉| 2181/2208 [13:07<00:10,  2.68it/s][A
Epoch 5/5:  99%|█████████▉| 2182/2208 [13:07<00:09,  2.71it/s][A
Epoch 5/5:  99%|█████████▉| 2183/2208 [13:08<00:09,  2.72it/s][A
Epoch 5/5:  99%|█████████▉| 2184/2208 [13:08<00:08,  2.76it/s][A
Epoch 5/5:  99%|█████████▉| 2185/2208 [13:08<00:08,  2.82it/s][A
Epoch 5/5:  99%|█████████▉| 2186/2208 [13:09<00:07,  2.80it/s][A
Epoch 5/5:  99%|█████████▉| 2187/2208 [13:09<00:07,  2.84it/s][A
Epoch 5/5:  99%|█████████▉| 2188/2208 [13:09<00:07,  2.76it/s][A
Epoch 5/5:  99%|█████████▉| 2189/2208 [13:10<00:07,  2.70it/s][A
Epoch 5/5:  99%|█████████▉| 2190/2208 [13:10<00:06,  2.77it/s][A
Epoch 5/5:  99%|█████████▉| 2191/2208 [13:10<00:06,  2.82it/s][A
Epoch 5/5

Batch 2200: Training accuracy = 0.8594, F1 = 0.8531, Precision = 0.8607, Recall = 0.8594



Epoch 5/5: 100%|█████████▉| 2202/2208 [13:14<00:02,  2.84it/s][A
Epoch 5/5: 100%|█████████▉| 2203/2208 [13:15<00:01,  2.88it/s][A
Epoch 5/5: 100%|█████████▉| 2204/2208 [13:15<00:01,  2.90it/s][A
Epoch 5/5: 100%|█████████▉| 2205/2208 [13:15<00:01,  2.92it/s][A
Epoch 5/5: 100%|█████████▉| 2206/2208 [13:16<00:00,  2.93it/s][A
Epoch 5/5: 100%|█████████▉| 2207/2208 [13:16<00:00,  2.94it/s][A
Epoch 5/5: 100%|██████████| 2208/2208 [13:16<00:00,  2.95it/s][A
                                                              [A


Epoch 5 training accuracy: 0.87%
Epoch 5 training F1 score: 0.8763
Epoch 5 training precision: 0.8891
Epoch 5 training recall: 0.8687

Starting validation...



Validation:   0%|          | 0/552 [00:00<?, ?it/s][A
Validation:   0%|          | 1/552 [00:01<16:11,  1.76s/it][A
Validation:   1%|          | 3/552 [00:01<04:35,  2.00it/s][A
Validation:   1%|          | 5/552 [00:02<02:36,  3.49it/s][A
Validation:   2%|▏         | 9/552 [00:02<01:23,  6.51it/s][A
Validation:   2%|▏         | 11/552 [00:02<01:17,  7.00it/s][A
Validation:   2%|▏         | 13/552 [00:02<01:09,  7.71it/s][A
Validation:   3%|▎         | 15/552 [00:02<01:00,  8.89it/s][A
Validation:   3%|▎         | 17/552 [00:03<01:03,  8.38it/s][A
Validation:   4%|▎         | 20/552 [00:03<00:50, 10.48it/s][A
Validation:   4%|▍         | 22/552 [00:03<00:55,  9.49it/s][A
Validation:   4%|▍         | 24/552 [00:03<00:49, 10.64it/s][A
Validation:   5%|▍         | 26/552 [00:03<00:50, 10.36it/s][A
Validation:   5%|▌         | 29/552 [00:04<00:40, 12.90it/s][A
Validation:   6%|▌         | 31/552 [00:04<00:44, 11.68it/s][A
Validation:   6%|▌         | 33/552 [00:04<00:47, 10

Validation accuracy: 0.76%
Validation F1 score: 0.7667
Validation precision: 0.8320
Validation recall: 0.7563

Starting testing...




Test accuracy: 0.76%
Test F1 score: 0.7679
Test precision: 0.8331
Test recall: 0.7580
[neptune] [info   ] Shutting down background jobs, please wait a moment...
[neptune] [info   ] Done!
[neptune] [info   ] Waiting for the remaining 4 operations to synchronize with Neptune. Do not kill this process.
[neptune] [info   ] All 4 operations synced, thanks for waiting!
[neptune] [info   ] Explore the metadata in the Neptune app: https://app.neptune.ai/muguryalcin/TKPR221/e/TKPR-191/metadata


## Saving the Model

In [None]:
from joblib import dump, load

# Persist the model object `sgd_clf` (defined in an earlier cell) to Google
# Drive, using the current `run_name` as the file name so each run gets its
# own artifact.
print("Saving the model...")
model_save_path = f'/content/drive/MyDrive/TKPR221/models/{run_name}.joblib'
# joblib.dump does not create missing directories; make sure the target folder
# exists so a long training run is not lost to a FileNotFoundError at save time.
Path(model_save_path).parent.mkdir(parents=True, exist_ok=True)
dump(sgd_clf, model_save_path)
print("Saved the model to", model_save_path)

# References
Throughout this notebook, AI tools such as ChatGPT were used mainly for debugging purposes. Some parts were also edited with these tools, but the code was mainly written by us.