## Imports

In [1]:
import os

from mmaction.datasets import build_dataset, build_dataloader
from mmaction.models import build_model
from mmcv import Config
from mmaction.datasets import Scrambmix
import torch.nn.functional as F
import numpy as np

  from .autonotebook import tqdm as notebook_tqdm


In [2]:
def precision_score(y_true, y_pred):
    """Calculates precision score.

    Args:
        y_true: True labels.
        y_pred: Predicted labels.

    Returns:
        Precision score.
    """

    tp = sum(y_true[i] == y_pred[i] for i in range(len(y_true)) if y_pred[i] == 1)
    fp = sum(y_true[i] != y_pred[i] for i in range(len(y_true)) if y_pred[i] == 1)
    precision = tp / (tp + fp) if tp + fp != 0 else 0
    return precision

def recall_score(y_true, y_pred):
    """Calculates recall score.

    Args:
        y_true: True labels.
        y_pred: Predicted labels.

    Returns:
        Recall score.
    """

    tp = sum(y_true[i] == y_pred[i] for i in range(len(y_true)) if y_pred[i] == 1)
    fn = sum(y_true[i] == 1 and y_pred[i] != 1 for i in range(len(y_true)))
    recall = tp / (tp + fn) if tp + fn != 0 else 0
    return recall

def f1_score(y_true, y_pred):
    """Calculates F1 score.

    Args:
        y_true: True labels.
        y_pred: Predicted labels.

    Returns:
        F1 score.
    """

    p = precision_score(y_true, y_pred)
    r = recall_score(y_true, y_pred)
    return 2 * p * r / (p + r) if p + r != 0 else 0

def weighted_f1_score(y_true, y_pred):
    """Calculates the weighted F1 score, assuming equal class weights.

    Args:
        y_true: True labels.
        y_pred: Predicted labels.

    Returns:
        Weighted F1 score.
    """

    num_classes = len(set(y_true))
    f1_scores = []
    for i in range(num_classes):
        class_mask = [1 if y == i else 0 for y in y_true]
        class_f1 = f1_score(class_mask, [1 if y == i else 0 for y in y_pred])
        f1_scores.append(class_f1)
    return sum(f1_scores) / num_classes

def accuracy_score(y_true, y_pred):
    """Calculates the accuracy score.
    
    Args:
    y_true: True labels.
    y_pred: Predicted labels.
    
    Returns:
    Accuracy score.
    """
    
    correct_predictions = sum(np.array(y_true) == np.array(y_pred))
    total_predictions = len(y_true)
    accuracy = correct_predictions / total_predictions

    return accuracy

## Loading batches

In [3]:
cfg = Config.fromfile('./mixup.py')

In [4]:
os.chdir('../../..')

In [5]:
cfg.data.train

{'type': 'RawframeDataset',
 'ann_file': 'data/hmdb51/annotation_train.txt',
 'data_prefix': 'data/hmdb51/rawframes',
 'pipeline': [{'type': 'SampleFrames',
   'clip_len': 32,
   'frame_interval': 2,
   'num_clips': 1},
  {'type': 'RawFrameDecode'},
  {'type': 'Resize', 'scale': (-1, 256)},
  {'type': 'RandomResizedCrop'},
  {'type': 'Resize', 'scale': (224, 224), 'keep_ratio': False},
  {'type': 'Flip', 'flip_ratio': 0.5},
  {'type': 'Normalize',
   'mean': [123.675, 116.28, 103.53],
   'std': [58.395, 57.12, 57.375],
   'to_bgr': False},
  {'type': 'FormatShape', 'input_format': 'NCTHW'},
  {'type': 'Collect', 'keys': ['imgs', 'label'], 'meta_keys': []},
  {'type': 'ToTensor', 'keys': ['imgs', 'label']}]}

In [6]:
train_dataset = build_dataset(cfg=cfg.data.train)
train_loader = build_dataloader(
        train_dataset,
        videos_per_gpu=8,
        workers_per_gpu=4,
        persistent_workers=False,
        num_gpus=1,
        dist=False)

val_dataset = build_dataset(cfg=cfg.data.val)
val_loader = build_dataloader(
        val_dataset,
        videos_per_gpu=1,
        workers_per_gpu=4,
        persistent_workers=False,
        num_gpus=1,
        dist=False)

## Learning Hyperparameters

In [7]:
import optuna
import torch.nn as nn
import torch.optim as optim
import torch
import logging
import numpy as np
from sklearn.metrics import accuracy_score

# Best parameters from previous study
best_params = {
    'dropout_ratio': 0.6795542149013333,
    'lr': 7.886714129990479e-06,
    'max_norm': 41,
    'with_pool2': True,
    'bottleneck_mode': 'ir',
    'norm_eval': False,
    'bn_frozen': False
}

# Configure logging
logging.basicConfig(filename='optuna_training_scrambmix_hmdb.log', 
                    filemode='w', 
                    format='%(asctime)s - %(levelname)s - %(message)s', 
                    level=logging.INFO)

# Define device
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# Database file path for saving study
db_file = "sqlite:///optuna_study_scrambmix_hmdb.db"

sampler = optuna.samplers.TPESampler(seed=42)

# Set up study with the option to minimize validation loss
study = optuna.create_study(
    sampler=sampler,
    direction="maximize",
    study_name="scrambmix_hmdb", 
    storage=db_file,
    load_if_exists=True
)

def objective(trial):
    print("Starting a new trial...")

    # Hyperparameters to tune
    alpha = trial.suggest_float("alpha", 0.1, 10)  
    print(f"Trial {trial.number}: alpha = {alpha}")

    # Set hyperparameters
    dropout_ratio = best_params['dropout_ratio']
    lr = best_params['lr']
    max_norm = best_params['max_norm']

    # Backbone parameters
    cfg.model.backbone.with_pool2 = best_params['with_pool2']
    cfg.model.backbone.bottleneck_mode = best_params['bottleneck_mode']
    cfg.model.backbone.norm_eval = best_params['norm_eval']
    cfg.model.backbone.bn_frozen = best_params['bn_frozen']

    # Fixed pretrained URL
    cfg.model.backbone.pretrained = 'https://download.openmmlab.com/mmaction/recognition/csn/ircsn_from_scratch_r50_ig65m_20210617-ce545a37.pth'

    # Adjust config parameters
    cfg.model.cls_head.dropout_ratio = dropout_ratio

    # Initialize model, criterion, optimizer, scheduler
    print("Building the model...")
    model = build_model(cfg.model, train_cfg=None, test_cfg=cfg.get('test_cfg')).to(device)
    
    optimizer = optim.Adam(
        model.parameters(),
        lr=lr,
        weight_decay=0.00001
    )

    print("Model built successfully!")
    
    # Early stopping parameters
    total_epochs = 60
    eval_interval = 1
    best_val_accuracy = 0

    # scrambmix Blending instance
    scrambmix = Scrambmix(num_classes=cfg.model.cls_head.num_classes, alpha=alpha, num_frames=32)

    print("Starting training...")
    for epoch in range(total_epochs):

        # Training loop
        model.train()
        epoch_loss = 0
        for batch_idx, data in enumerate(train_loader):
            inputs, labels = data['imgs'].to(device), data['label'].to(device)

            # Convert labels to one-hot encoding
            labels_one_hot = F.one_hot(labels, num_classes=cfg.model.cls_head.num_classes).float()

            # Apply scrambmix
            mixed_inputs, mixed_labels = scrambmix.do_blending(inputs, labels_one_hot)

            optimizer.zero_grad()
            outputs = model(mixed_inputs, mixed_labels, return_loss=True)
            loss = outputs['loss_cls']

            loss.backward()
            torch.nn.utils.clip_grad_norm_(model.parameters(), max_norm)
            optimizer.step()

            epoch_loss += loss.item()
            if batch_idx % 10 == 0:
                print(f"Epoch [{epoch + 1}/{total_epochs}], Batch [{batch_idx}/{len(train_loader)}], Loss: {loss.item():.4f}")

        logging.info(f"Epoch [{epoch + 1}/{total_epochs}], Train Loss: {epoch_loss / len(train_loader):.4f}")
        print(f"Epoch [{epoch + 1}/{total_epochs}], Average Train Loss: {epoch_loss / len(train_loader):.4f}")

        # Validation loop (every `eval_interval` epochs)
        if (epoch + 1) % eval_interval == 0:
            model.eval()
            total_val_loss = 0
            all_preds = []
            all_labels = []
            with torch.no_grad():
                for val_data in val_loader:
                    val_inputs, val_labels = val_data['imgs'].to(device), val_data['label'].to(device)

                    val_results = model(val_inputs, return_loss=False)
                    val_loss = model(val_inputs, val_labels, return_loss=True)['loss_cls']

                    total_val_loss += val_loss.item()

                    # Collect predictions and true labels
                    predictions = np.argmax(val_results, axis=1)
                    true_labels = val_labels.cpu().numpy()

                    all_preds.extend(predictions)
                    all_labels.extend(true_labels)

            val_accuracy = accuracy_score(all_labels, all_preds)

            print(f"Epoch [{epoch + 1}/{total_epochs}], Validation Accuracy: {val_accuracy:.4f}, Validation Loss: {total_val_loss / len(val_loader):.4f}")
            logging.info(f"Epoch [{epoch + 1}/{total_epochs}], Validation Accuracy: {val_accuracy:.4f}")

            # Report validation loss to Optuna
            trial.report(val_accuracy, epoch)

            # Check if validation accuracy improved
            if val_accuracy > best_val_accuracy:
                best_val_accuracy = val_accuracy

            # Prune unpromising trials
            if trial.should_prune():
                print("Trial pruned due to lack of improvement.")
                raise optuna.exceptions.TrialPruned()

    return best_val_accuracy

# Run Optuna Study
print("Starting Optuna study...")
study.optimize(objective, n_trials=10)

print(f"Best hyperparameters: {study.best_params}")
print(f"Best validation accuracy: {study.best_value:.4f}")
logging.info("Best hyperparameters: %s", study.best_params)
logging.info("Best validation accuracy: %f", study.best_value)


[I 2024-12-13 03:54:04,464] Using an existing study with name 'scrambmix_hmdb' instead of creating a new one.


Starting Optuna study...
Starting a new trial...
Trial 1: alpha = 3.807947176588889
Building the model...


2024-12-13 03:54:04,852 - mmaction - INFO - load model from: https://download.openmmlab.com/mmaction/recognition/csn/ircsn_from_scratch_r50_ig65m_20210617-ce545a37.pth
2024-12-13 03:54:04,853 - mmaction - INFO - load checkpoint from http path: https://download.openmmlab.com/mmaction/recognition/csn/ircsn_from_scratch_r50_ig65m_20210617-ce545a37.pth


Model built successfully!
Starting training...


  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [1/60], Batch [0/447], Loss: 3.9516
Epoch [1/60], Batch [10/447], Loss: 4.0507
Epoch [1/60], Batch [20/447], Loss: 4.0422
Epoch [1/60], Batch [30/447], Loss: 3.9478
Epoch [1/60], Batch [40/447], Loss: 3.9287
Epoch [1/60], Batch [50/447], Loss: 3.9314
Epoch [1/60], Batch [60/447], Loss: 3.8720
Epoch [1/60], Batch [70/447], Loss: 3.9550
Epoch [1/60], Batch [80/447], Loss: 3.9013
Epoch [1/60], Batch [90/447], Loss: 3.9084
Epoch [1/60], Batch [100/447], Loss: 3.9606
Epoch [1/60], Batch [110/447], Loss: 3.9949
Epoch [1/60], Batch [120/447], Loss: 3.9674
Epoch [1/60], Batch [130/447], Loss: 3.9998
Epoch [1/60], Batch [140/447], Loss: 3.9940
Epoch [1/60], Batch [150/447], Loss: 3.9695
Epoch [1/60], Batch [160/447], Loss: 3.9730
Epoch [1/60], Batch [170/447], Loss: 4.0480
Epoch [1/60], Batch [180/447], Loss: 3.9665
Epoch [1/60], Batch [190/447], Loss: 3.9591
Epoch [1/60], Batch [200/447], Loss: 3.9503
Epoch [1/60], Batch [210/447], Loss: 3.9549
Epoch [1/60], Batch [220/447], Loss: 4.0153

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [2/60], Batch [0/447], Loss: 3.9850
Epoch [2/60], Batch [10/447], Loss: 3.9549
Epoch [2/60], Batch [20/447], Loss: 3.9081
Epoch [2/60], Batch [30/447], Loss: 3.9350
Epoch [2/60], Batch [40/447], Loss: 3.8993
Epoch [2/60], Batch [50/447], Loss: 3.7988
Epoch [2/60], Batch [60/447], Loss: 3.9571
Epoch [2/60], Batch [70/447], Loss: 3.9171
Epoch [2/60], Batch [80/447], Loss: 3.8712
Epoch [2/60], Batch [90/447], Loss: 3.9051
Epoch [2/60], Batch [100/447], Loss: 3.9190
Epoch [2/60], Batch [110/447], Loss: 3.8300
Epoch [2/60], Batch [120/447], Loss: 3.9062
Epoch [2/60], Batch [130/447], Loss: 3.9765
Epoch [2/60], Batch [140/447], Loss: 4.0149
Epoch [2/60], Batch [150/447], Loss: 3.8801
Epoch [2/60], Batch [160/447], Loss: 3.8692
Epoch [2/60], Batch [170/447], Loss: 3.7721
Epoch [2/60], Batch [180/447], Loss: 3.8278
Epoch [2/60], Batch [190/447], Loss: 3.8652
Epoch [2/60], Batch [200/447], Loss: 3.8363
Epoch [2/60], Batch [210/447], Loss: 3.8394
Epoch [2/60], Batch [220/447], Loss: 3.8838

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [3/60], Batch [0/447], Loss: 3.6746
Epoch [3/60], Batch [10/447], Loss: 3.8264
Epoch [3/60], Batch [20/447], Loss: 3.6565
Epoch [3/60], Batch [30/447], Loss: 3.7154
Epoch [3/60], Batch [40/447], Loss: 3.7079
Epoch [3/60], Batch [50/447], Loss: 3.9414
Epoch [3/60], Batch [60/447], Loss: 3.7184
Epoch [3/60], Batch [70/447], Loss: 3.7409
Epoch [3/60], Batch [80/447], Loss: 3.8455
Epoch [3/60], Batch [90/447], Loss: 3.5747
Epoch [3/60], Batch [100/447], Loss: 3.7251
Epoch [3/60], Batch [110/447], Loss: 3.9496
Epoch [3/60], Batch [120/447], Loss: 3.8169
Epoch [3/60], Batch [130/447], Loss: 3.7040
Epoch [3/60], Batch [140/447], Loss: 3.9275
Epoch [3/60], Batch [150/447], Loss: 3.8315
Epoch [3/60], Batch [160/447], Loss: 3.5701
Epoch [3/60], Batch [170/447], Loss: 3.5582
Epoch [3/60], Batch [180/447], Loss: 3.7096
Epoch [3/60], Batch [190/447], Loss: 3.8178
Epoch [3/60], Batch [200/447], Loss: 3.7717
Epoch [3/60], Batch [210/447], Loss: 3.5815
Epoch [3/60], Batch [220/447], Loss: 3.8178

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [4/60], Batch [0/447], Loss: 3.7462
Epoch [4/60], Batch [10/447], Loss: 3.7784
Epoch [4/60], Batch [20/447], Loss: 3.6694
Epoch [4/60], Batch [30/447], Loss: 3.7726
Epoch [4/60], Batch [40/447], Loss: 3.4985
Epoch [4/60], Batch [50/447], Loss: 3.7205
Epoch [4/60], Batch [60/447], Loss: 3.7056
Epoch [4/60], Batch [70/447], Loss: 3.6760
Epoch [4/60], Batch [80/447], Loss: 3.8889
Epoch [4/60], Batch [90/447], Loss: 3.6395
Epoch [4/60], Batch [100/447], Loss: 3.6145
Epoch [4/60], Batch [110/447], Loss: 3.8417
Epoch [4/60], Batch [120/447], Loss: 3.9060
Epoch [4/60], Batch [130/447], Loss: 3.4171
Epoch [4/60], Batch [140/447], Loss: 3.4632
Epoch [4/60], Batch [150/447], Loss: 3.8546
Epoch [4/60], Batch [160/447], Loss: 3.7785
Epoch [4/60], Batch [170/447], Loss: 3.3896
Epoch [4/60], Batch [180/447], Loss: 3.6928
Epoch [4/60], Batch [190/447], Loss: 3.7238
Epoch [4/60], Batch [200/447], Loss: 3.7053
Epoch [4/60], Batch [210/447], Loss: 3.6635
Epoch [4/60], Batch [220/447], Loss: 3.2716

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [5/60], Batch [0/447], Loss: 3.8072
Epoch [5/60], Batch [10/447], Loss: 3.4682
Epoch [5/60], Batch [20/447], Loss: 3.4356
Epoch [5/60], Batch [30/447], Loss: 3.7515
Epoch [5/60], Batch [40/447], Loss: 3.4063
Epoch [5/60], Batch [50/447], Loss: 3.5281
Epoch [5/60], Batch [60/447], Loss: 3.8363
Epoch [5/60], Batch [70/447], Loss: 3.7732
Epoch [5/60], Batch [80/447], Loss: 3.5706
Epoch [5/60], Batch [90/447], Loss: 3.5827
Epoch [5/60], Batch [100/447], Loss: 3.6294
Epoch [5/60], Batch [110/447], Loss: 3.3253
Epoch [5/60], Batch [120/447], Loss: 3.7004
Epoch [5/60], Batch [130/447], Loss: 3.5897
Epoch [5/60], Batch [140/447], Loss: 3.7357
Epoch [5/60], Batch [150/447], Loss: 3.4894
Epoch [5/60], Batch [160/447], Loss: 3.3128
Epoch [5/60], Batch [170/447], Loss: 3.4569
Epoch [5/60], Batch [180/447], Loss: 3.4503
Epoch [5/60], Batch [190/447], Loss: 3.5293
Epoch [5/60], Batch [200/447], Loss: 3.4992
Epoch [5/60], Batch [210/447], Loss: 3.5985
Epoch [5/60], Batch [220/447], Loss: 3.6852

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [6/60], Batch [0/447], Loss: 3.3606
Epoch [6/60], Batch [10/447], Loss: 3.3337
Epoch [6/60], Batch [20/447], Loss: 3.5667
Epoch [6/60], Batch [30/447], Loss: 3.5029
Epoch [6/60], Batch [40/447], Loss: 3.5424
Epoch [6/60], Batch [50/447], Loss: 3.4174
Epoch [6/60], Batch [60/447], Loss: 3.9023
Epoch [6/60], Batch [70/447], Loss: 3.4894
Epoch [6/60], Batch [80/447], Loss: 3.2886
Epoch [6/60], Batch [90/447], Loss: 3.5584
Epoch [6/60], Batch [100/447], Loss: 3.6016
Epoch [6/60], Batch [110/447], Loss: 3.4284
Epoch [6/60], Batch [120/447], Loss: 3.7673
Epoch [6/60], Batch [130/447], Loss: 3.3787
Epoch [6/60], Batch [140/447], Loss: 3.6277
Epoch [6/60], Batch [150/447], Loss: 3.4106
Epoch [6/60], Batch [160/447], Loss: 3.5868
Epoch [6/60], Batch [170/447], Loss: 3.6666
Epoch [6/60], Batch [180/447], Loss: 3.5109
Epoch [6/60], Batch [190/447], Loss: 3.4867
Epoch [6/60], Batch [200/447], Loss: 3.4771
Epoch [6/60], Batch [210/447], Loss: 3.8096
Epoch [6/60], Batch [220/447], Loss: 3.5793

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [7/60], Batch [0/447], Loss: 3.5891
Epoch [7/60], Batch [10/447], Loss: 3.2141
Epoch [7/60], Batch [20/447], Loss: 3.3770
Epoch [7/60], Batch [30/447], Loss: 3.2662
Epoch [7/60], Batch [40/447], Loss: 3.5188
Epoch [7/60], Batch [50/447], Loss: 3.7900
Epoch [7/60], Batch [60/447], Loss: 3.3975
Epoch [7/60], Batch [70/447], Loss: 3.7078
Epoch [7/60], Batch [80/447], Loss: 3.2850
Epoch [7/60], Batch [90/447], Loss: 3.5493
Epoch [7/60], Batch [100/447], Loss: 3.4076
Epoch [7/60], Batch [110/447], Loss: 3.6017
Epoch [7/60], Batch [120/447], Loss: 3.5069
Epoch [7/60], Batch [130/447], Loss: 3.7286
Epoch [7/60], Batch [140/447], Loss: 3.4940
Epoch [7/60], Batch [150/447], Loss: 2.9273
Epoch [7/60], Batch [160/447], Loss: 3.6105
Epoch [7/60], Batch [170/447], Loss: 3.5019
Epoch [7/60], Batch [180/447], Loss: 3.1439
Epoch [7/60], Batch [190/447], Loss: 3.3345
Epoch [7/60], Batch [200/447], Loss: 3.5479
Epoch [7/60], Batch [210/447], Loss: 3.6580
Epoch [7/60], Batch [220/447], Loss: 3.5353

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [8/60], Batch [0/447], Loss: 3.3947
Epoch [8/60], Batch [10/447], Loss: 3.3593
Epoch [8/60], Batch [20/447], Loss: 3.2014
Epoch [8/60], Batch [30/447], Loss: 3.1771
Epoch [8/60], Batch [40/447], Loss: 3.4146
Epoch [8/60], Batch [50/447], Loss: 3.0646
Epoch [8/60], Batch [60/447], Loss: 3.6510
Epoch [8/60], Batch [70/447], Loss: 2.5694
Epoch [8/60], Batch [80/447], Loss: 3.1642
Epoch [8/60], Batch [90/447], Loss: 3.5648
Epoch [8/60], Batch [100/447], Loss: 3.4147
Epoch [8/60], Batch [110/447], Loss: 3.3863
Epoch [8/60], Batch [120/447], Loss: 3.2707
Epoch [8/60], Batch [130/447], Loss: 3.6407
Epoch [8/60], Batch [140/447], Loss: 3.4408
Epoch [8/60], Batch [150/447], Loss: 3.3075
Epoch [8/60], Batch [160/447], Loss: 3.0674
Epoch [8/60], Batch [170/447], Loss: 3.5743
Epoch [8/60], Batch [180/447], Loss: 3.3996
Epoch [8/60], Batch [190/447], Loss: 3.4541
Epoch [8/60], Batch [200/447], Loss: 3.1216
Epoch [8/60], Batch [210/447], Loss: 3.2692
Epoch [8/60], Batch [220/447], Loss: 3.3512

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [9/60], Batch [0/447], Loss: 2.9655
Epoch [9/60], Batch [10/447], Loss: 3.2771
Epoch [9/60], Batch [20/447], Loss: 3.2954
Epoch [9/60], Batch [30/447], Loss: 3.4814
Epoch [9/60], Batch [40/447], Loss: 3.4035
Epoch [9/60], Batch [50/447], Loss: 3.7159
Epoch [9/60], Batch [60/447], Loss: 3.7189
Epoch [9/60], Batch [70/447], Loss: 3.0055
Epoch [9/60], Batch [80/447], Loss: 2.7940
Epoch [9/60], Batch [90/447], Loss: 3.8437
Epoch [9/60], Batch [100/447], Loss: 3.3180
Epoch [9/60], Batch [110/447], Loss: 3.4931
Epoch [9/60], Batch [120/447], Loss: 3.1275
Epoch [9/60], Batch [130/447], Loss: 3.2574
Epoch [9/60], Batch [140/447], Loss: 3.2497
Epoch [9/60], Batch [150/447], Loss: 3.3027
Epoch [9/60], Batch [160/447], Loss: 2.8460
Epoch [9/60], Batch [170/447], Loss: 3.4366
Epoch [9/60], Batch [180/447], Loss: 3.4104
Epoch [9/60], Batch [190/447], Loss: 3.2764
Epoch [9/60], Batch [200/447], Loss: 3.2898
Epoch [9/60], Batch [210/447], Loss: 2.9183
Epoch [9/60], Batch [220/447], Loss: 3.4603

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [10/60], Batch [0/447], Loss: 3.3382
Epoch [10/60], Batch [10/447], Loss: 3.2741
Epoch [10/60], Batch [20/447], Loss: 3.2300
Epoch [10/60], Batch [30/447], Loss: 3.1059
Epoch [10/60], Batch [40/447], Loss: 3.0840
Epoch [10/60], Batch [50/447], Loss: 3.2795
Epoch [10/60], Batch [60/447], Loss: 2.7524
Epoch [10/60], Batch [70/447], Loss: 2.6152
Epoch [10/60], Batch [80/447], Loss: 3.3215
Epoch [10/60], Batch [90/447], Loss: 3.2870
Epoch [10/60], Batch [100/447], Loss: 3.3418
Epoch [10/60], Batch [110/447], Loss: 3.0650
Epoch [10/60], Batch [120/447], Loss: 3.5654
Epoch [10/60], Batch [130/447], Loss: 3.2390
Epoch [10/60], Batch [140/447], Loss: 3.1785
Epoch [10/60], Batch [150/447], Loss: 3.0776
Epoch [10/60], Batch [160/447], Loss: 2.9281
Epoch [10/60], Batch [170/447], Loss: 3.1273
Epoch [10/60], Batch [180/447], Loss: 2.8765
Epoch [10/60], Batch [190/447], Loss: 3.3046
Epoch [10/60], Batch [200/447], Loss: 2.9861
Epoch [10/60], Batch [210/447], Loss: 3.5226
Epoch [10/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [11/60], Batch [0/447], Loss: 3.2427
Epoch [11/60], Batch [10/447], Loss: 3.0766
Epoch [11/60], Batch [20/447], Loss: 2.9437
Epoch [11/60], Batch [30/447], Loss: 3.4229
Epoch [11/60], Batch [40/447], Loss: 3.2477
Epoch [11/60], Batch [50/447], Loss: 3.1600
Epoch [11/60], Batch [60/447], Loss: 3.2784
Epoch [11/60], Batch [70/447], Loss: 3.1449
Epoch [11/60], Batch [80/447], Loss: 2.7408
Epoch [11/60], Batch [90/447], Loss: 3.1378
Epoch [11/60], Batch [100/447], Loss: 2.9858
Epoch [11/60], Batch [110/447], Loss: 3.1207
Epoch [11/60], Batch [120/447], Loss: 3.2365
Epoch [11/60], Batch [130/447], Loss: 2.5455
Epoch [11/60], Batch [140/447], Loss: 3.3973
Epoch [11/60], Batch [150/447], Loss: 3.1037
Epoch [11/60], Batch [160/447], Loss: 3.2707
Epoch [11/60], Batch [170/447], Loss: 3.4528
Epoch [11/60], Batch [180/447], Loss: 2.8587
Epoch [11/60], Batch [190/447], Loss: 2.4216
Epoch [11/60], Batch [200/447], Loss: 3.2086
Epoch [11/60], Batch [210/447], Loss: 2.9079
Epoch [11/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [12/60], Batch [0/447], Loss: 3.0681
Epoch [12/60], Batch [10/447], Loss: 3.2435
Epoch [12/60], Batch [20/447], Loss: 3.0143
Epoch [12/60], Batch [30/447], Loss: 3.0857
Epoch [12/60], Batch [40/447], Loss: 3.3036
Epoch [12/60], Batch [50/447], Loss: 3.0940
Epoch [12/60], Batch [60/447], Loss: 3.0167
Epoch [12/60], Batch [70/447], Loss: 3.4704
Epoch [12/60], Batch [80/447], Loss: 3.1527
Epoch [12/60], Batch [90/447], Loss: 2.9135
Epoch [12/60], Batch [100/447], Loss: 2.7240
Epoch [12/60], Batch [110/447], Loss: 3.2142
Epoch [12/60], Batch [120/447], Loss: 2.7167
Epoch [12/60], Batch [130/447], Loss: 2.8843
Epoch [12/60], Batch [140/447], Loss: 3.3883
Epoch [12/60], Batch [150/447], Loss: 3.3315
Epoch [12/60], Batch [160/447], Loss: 2.8007
Epoch [12/60], Batch [170/447], Loss: 3.1363
Epoch [12/60], Batch [180/447], Loss: 3.4537
Epoch [12/60], Batch [190/447], Loss: 3.0768
Epoch [12/60], Batch [200/447], Loss: 2.7809
Epoch [12/60], Batch [210/447], Loss: 3.2310
Epoch [12/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [13/60], Batch [0/447], Loss: 2.9982
Epoch [13/60], Batch [10/447], Loss: 2.5151
Epoch [13/60], Batch [20/447], Loss: 3.2317
Epoch [13/60], Batch [30/447], Loss: 2.9504
Epoch [13/60], Batch [40/447], Loss: 3.2509
Epoch [13/60], Batch [50/447], Loss: 3.0036
Epoch [13/60], Batch [60/447], Loss: 3.0926
Epoch [13/60], Batch [70/447], Loss: 3.3416
Epoch [13/60], Batch [80/447], Loss: 3.3076
Epoch [13/60], Batch [90/447], Loss: 3.2841
Epoch [13/60], Batch [100/447], Loss: 3.5089
Epoch [13/60], Batch [110/447], Loss: 2.6568
Epoch [13/60], Batch [120/447], Loss: 3.1361
Epoch [13/60], Batch [130/447], Loss: 3.3052
Epoch [13/60], Batch [140/447], Loss: 3.2736
Epoch [13/60], Batch [150/447], Loss: 3.3113
Epoch [13/60], Batch [160/447], Loss: 3.4453
Epoch [13/60], Batch [170/447], Loss: 2.7965
Epoch [13/60], Batch [180/447], Loss: 2.8720
Epoch [13/60], Batch [190/447], Loss: 3.3188
Epoch [13/60], Batch [200/447], Loss: 2.7551
Epoch [13/60], Batch [210/447], Loss: 3.3613
Epoch [13/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [14/60], Batch [0/447], Loss: 2.7110
Epoch [14/60], Batch [10/447], Loss: 3.1576
Epoch [14/60], Batch [20/447], Loss: 2.6942
Epoch [14/60], Batch [30/447], Loss: 3.1210
Epoch [14/60], Batch [40/447], Loss: 3.1158
Epoch [14/60], Batch [50/447], Loss: 3.0807
Epoch [14/60], Batch [60/447], Loss: 2.7743
Epoch [14/60], Batch [70/447], Loss: 3.1502
Epoch [14/60], Batch [80/447], Loss: 3.3144
Epoch [14/60], Batch [90/447], Loss: 3.2875
Epoch [14/60], Batch [100/447], Loss: 3.1871
Epoch [14/60], Batch [110/447], Loss: 2.7368
Epoch [14/60], Batch [120/447], Loss: 3.0681
Epoch [14/60], Batch [130/447], Loss: 2.7931
Epoch [14/60], Batch [140/447], Loss: 3.7769
Epoch [14/60], Batch [150/447], Loss: 2.6473
Epoch [14/60], Batch [160/447], Loss: 3.0526
Epoch [14/60], Batch [170/447], Loss: 3.3837
Epoch [14/60], Batch [180/447], Loss: 3.3849
Epoch [14/60], Batch [190/447], Loss: 3.2420
Epoch [14/60], Batch [200/447], Loss: 2.9691
Epoch [14/60], Batch [210/447], Loss: 3.0052
Epoch [14/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [15/60], Batch [0/447], Loss: 2.7606
Epoch [15/60], Batch [10/447], Loss: 3.3092
Epoch [15/60], Batch [20/447], Loss: 3.4481
Epoch [15/60], Batch [30/447], Loss: 2.9063
Epoch [15/60], Batch [40/447], Loss: 3.3166
Epoch [15/60], Batch [50/447], Loss: 3.2960
Epoch [15/60], Batch [60/447], Loss: 2.8366
Epoch [15/60], Batch [70/447], Loss: 3.4785
Epoch [15/60], Batch [80/447], Loss: 1.6960
Epoch [15/60], Batch [90/447], Loss: 2.9709
Epoch [15/60], Batch [100/447], Loss: 2.2686
Epoch [15/60], Batch [110/447], Loss: 2.9361
Epoch [15/60], Batch [120/447], Loss: 2.5394
Epoch [15/60], Batch [130/447], Loss: 2.9208
Epoch [15/60], Batch [140/447], Loss: 2.9647
Epoch [15/60], Batch [150/447], Loss: 3.0469
Epoch [15/60], Batch [160/447], Loss: 3.2379
Epoch [15/60], Batch [170/447], Loss: 3.1779
Epoch [15/60], Batch [180/447], Loss: 3.2481
Epoch [15/60], Batch [190/447], Loss: 2.8751
Epoch [15/60], Batch [200/447], Loss: 3.2948
Epoch [15/60], Batch [210/447], Loss: 3.0152
Epoch [15/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [16/60], Batch [0/447], Loss: 2.7990
Epoch [16/60], Batch [10/447], Loss: 2.6625
Epoch [16/60], Batch [20/447], Loss: 3.3460
Epoch [16/60], Batch [30/447], Loss: 3.0895
Epoch [16/60], Batch [40/447], Loss: 2.2112
Epoch [16/60], Batch [50/447], Loss: 2.7225
Epoch [16/60], Batch [60/447], Loss: 2.9143
Epoch [16/60], Batch [70/447], Loss: 3.1978
Epoch [16/60], Batch [80/447], Loss: 3.3312
Epoch [16/60], Batch [90/447], Loss: 2.6936
Epoch [16/60], Batch [100/447], Loss: 2.5368
Epoch [16/60], Batch [110/447], Loss: 2.6472
Epoch [16/60], Batch [120/447], Loss: 3.1149
Epoch [16/60], Batch [130/447], Loss: 3.0907
Epoch [16/60], Batch [140/447], Loss: 2.8424
Epoch [16/60], Batch [150/447], Loss: 3.3341
Epoch [16/60], Batch [160/447], Loss: 2.9771
Epoch [16/60], Batch [170/447], Loss: 3.1716
Epoch [16/60], Batch [180/447], Loss: 3.1059
Epoch [16/60], Batch [190/447], Loss: 2.9897
Epoch [16/60], Batch [200/447], Loss: 2.9620
Epoch [16/60], Batch [210/447], Loss: 3.0027
Epoch [16/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [17/60], Batch [0/447], Loss: 2.7886
Epoch [17/60], Batch [10/447], Loss: 2.4790
Epoch [17/60], Batch [20/447], Loss: 2.8396
Epoch [17/60], Batch [30/447], Loss: 2.8517
Epoch [17/60], Batch [40/447], Loss: 3.3373
Epoch [17/60], Batch [50/447], Loss: 3.0485
Epoch [17/60], Batch [60/447], Loss: 2.8833
Epoch [17/60], Batch [70/447], Loss: 2.6744
Epoch [17/60], Batch [80/447], Loss: 3.1902
Epoch [17/60], Batch [90/447], Loss: 2.9343
Epoch [17/60], Batch [100/447], Loss: 2.5779
Epoch [17/60], Batch [110/447], Loss: 2.8803
Epoch [17/60], Batch [120/447], Loss: 2.9251
Epoch [17/60], Batch [130/447], Loss: 2.9724
Epoch [17/60], Batch [140/447], Loss: 2.8099
Epoch [17/60], Batch [150/447], Loss: 3.0719
Epoch [17/60], Batch [160/447], Loss: 3.2512
Epoch [17/60], Batch [170/447], Loss: 3.1265
Epoch [17/60], Batch [180/447], Loss: 2.8149
Epoch [17/60], Batch [190/447], Loss: 2.7773
Epoch [17/60], Batch [200/447], Loss: 2.7522
Epoch [17/60], Batch [210/447], Loss: 3.3372
Epoch [17/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [18/60], Batch [0/447], Loss: 2.6783
Epoch [18/60], Batch [10/447], Loss: 3.1623
Epoch [18/60], Batch [20/447], Loss: 2.6904
Epoch [18/60], Batch [30/447], Loss: 3.2205
Epoch [18/60], Batch [40/447], Loss: 2.6489
Epoch [18/60], Batch [50/447], Loss: 2.7369
Epoch [18/60], Batch [60/447], Loss: 2.5414
Epoch [18/60], Batch [70/447], Loss: 3.1744
Epoch [18/60], Batch [80/447], Loss: 2.9823
Epoch [18/60], Batch [90/447], Loss: 2.5019
Epoch [18/60], Batch [100/447], Loss: 2.4473
Epoch [18/60], Batch [110/447], Loss: 2.3566
Epoch [18/60], Batch [120/447], Loss: 2.9809
Epoch [18/60], Batch [130/447], Loss: 2.6709
Epoch [18/60], Batch [140/447], Loss: 2.8685
Epoch [18/60], Batch [150/447], Loss: 3.2359
Epoch [18/60], Batch [160/447], Loss: 2.8486
Epoch [18/60], Batch [170/447], Loss: 3.1144
Epoch [18/60], Batch [180/447], Loss: 2.7471
Epoch [18/60], Batch [190/447], Loss: 2.6110
Epoch [18/60], Batch [200/447], Loss: 2.6666
Epoch [18/60], Batch [210/447], Loss: 2.5843
Epoch [18/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [19/60], Batch [0/447], Loss: 3.0875
Epoch [19/60], Batch [10/447], Loss: 3.1448
Epoch [19/60], Batch [20/447], Loss: 2.3935
Epoch [19/60], Batch [30/447], Loss: 3.0780
Epoch [19/60], Batch [40/447], Loss: 3.2826
Epoch [19/60], Batch [50/447], Loss: 3.1049
Epoch [19/60], Batch [60/447], Loss: 2.4565
Epoch [19/60], Batch [70/447], Loss: 2.9078
Epoch [19/60], Batch [80/447], Loss: 3.0169
Epoch [19/60], Batch [90/447], Loss: 2.8811
Epoch [19/60], Batch [100/447], Loss: 2.5028
Epoch [19/60], Batch [110/447], Loss: 2.6467
Epoch [19/60], Batch [120/447], Loss: 2.7739
Epoch [19/60], Batch [130/447], Loss: 2.8245
Epoch [19/60], Batch [140/447], Loss: 2.8527
Epoch [19/60], Batch [150/447], Loss: 3.7490
Epoch [19/60], Batch [160/447], Loss: 2.1021
Epoch [19/60], Batch [170/447], Loss: 2.8010
Epoch [19/60], Batch [180/447], Loss: 3.0723
Epoch [19/60], Batch [190/447], Loss: 3.0607
Epoch [19/60], Batch [200/447], Loss: 3.3618
Epoch [19/60], Batch [210/447], Loss: 2.5629
Epoch [19/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [20/60], Batch [0/447], Loss: 3.1284
Epoch [20/60], Batch [10/447], Loss: 2.7001
Epoch [20/60], Batch [20/447], Loss: 2.7325
Epoch [20/60], Batch [30/447], Loss: 2.7733
Epoch [20/60], Batch [40/447], Loss: 2.8177
Epoch [20/60], Batch [50/447], Loss: 2.7735
Epoch [20/60], Batch [60/447], Loss: 2.9782
Epoch [20/60], Batch [70/447], Loss: 2.6663
Epoch [20/60], Batch [80/447], Loss: 2.8781
Epoch [20/60], Batch [90/447], Loss: 3.2062
Epoch [20/60], Batch [100/447], Loss: 3.2380
Epoch [20/60], Batch [110/447], Loss: 2.4253
Epoch [20/60], Batch [120/447], Loss: 2.6370
Epoch [20/60], Batch [130/447], Loss: 2.6729
Epoch [20/60], Batch [140/447], Loss: 2.5855
Epoch [20/60], Batch [150/447], Loss: 2.5960
Epoch [20/60], Batch [160/447], Loss: 3.2488
Epoch [20/60], Batch [170/447], Loss: 2.7720
Epoch [20/60], Batch [180/447], Loss: 2.7408
Epoch [20/60], Batch [190/447], Loss: 2.8028
Epoch [20/60], Batch [200/447], Loss: 2.5130
Epoch [20/60], Batch [210/447], Loss: 2.7675
Epoch [20/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [21/60], Batch [0/447], Loss: 2.8830
Epoch [21/60], Batch [10/447], Loss: 2.9554
Epoch [21/60], Batch [20/447], Loss: 3.1114
Epoch [21/60], Batch [30/447], Loss: 2.0496
Epoch [21/60], Batch [40/447], Loss: 2.5615
Epoch [21/60], Batch [50/447], Loss: 2.2697
Epoch [21/60], Batch [60/447], Loss: 2.2303
Epoch [21/60], Batch [70/447], Loss: 2.7802
Epoch [21/60], Batch [80/447], Loss: 2.3436
Epoch [21/60], Batch [90/447], Loss: 2.3559
Epoch [21/60], Batch [100/447], Loss: 2.9020
Epoch [21/60], Batch [110/447], Loss: 2.8426
Epoch [21/60], Batch [120/447], Loss: 2.9373
Epoch [21/60], Batch [130/447], Loss: 2.6373
Epoch [21/60], Batch [140/447], Loss: 3.0001
Epoch [21/60], Batch [150/447], Loss: 2.8426
Epoch [21/60], Batch [160/447], Loss: 2.5271
Epoch [21/60], Batch [170/447], Loss: 2.6700
Epoch [21/60], Batch [180/447], Loss: 2.5660
Epoch [21/60], Batch [190/447], Loss: 2.9138
Epoch [21/60], Batch [200/447], Loss: 2.3594
Epoch [21/60], Batch [210/447], Loss: 2.3032
Epoch [21/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [22/60], Batch [0/447], Loss: 3.0352
Epoch [22/60], Batch [10/447], Loss: 2.8407
Epoch [22/60], Batch [20/447], Loss: 2.3351
Epoch [22/60], Batch [30/447], Loss: 3.0342
Epoch [22/60], Batch [40/447], Loss: 3.0375
Epoch [22/60], Batch [50/447], Loss: 3.0186
Epoch [22/60], Batch [60/447], Loss: 2.6901
Epoch [22/60], Batch [70/447], Loss: 2.3850
Epoch [22/60], Batch [80/447], Loss: 1.9012
Epoch [22/60], Batch [90/447], Loss: 2.6921
Epoch [22/60], Batch [100/447], Loss: 2.9987
Epoch [22/60], Batch [110/447], Loss: 3.0913
Epoch [22/60], Batch [120/447], Loss: 2.5925
Epoch [22/60], Batch [130/447], Loss: 2.3084
Epoch [22/60], Batch [140/447], Loss: 2.0993
Epoch [22/60], Batch [150/447], Loss: 2.9325
Epoch [22/60], Batch [160/447], Loss: 3.0376
Epoch [22/60], Batch [170/447], Loss: 2.9505
Epoch [22/60], Batch [180/447], Loss: 2.8217
Epoch [22/60], Batch [190/447], Loss: 2.7389
Epoch [22/60], Batch [200/447], Loss: 2.4035
Epoch [22/60], Batch [210/447], Loss: 2.3541
Epoch [22/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [23/60], Batch [0/447], Loss: 3.1523
Epoch [23/60], Batch [10/447], Loss: 2.8101
Epoch [23/60], Batch [20/447], Loss: 2.5082
Epoch [23/60], Batch [30/447], Loss: 2.0145
Epoch [23/60], Batch [40/447], Loss: 3.2044
Epoch [23/60], Batch [50/447], Loss: 2.7201
Epoch [23/60], Batch [60/447], Loss: 2.7386
Epoch [23/60], Batch [70/447], Loss: 3.2237
Epoch [23/60], Batch [80/447], Loss: 2.9278
Epoch [23/60], Batch [90/447], Loss: 2.7330
Epoch [23/60], Batch [100/447], Loss: 2.8961
Epoch [23/60], Batch [110/447], Loss: 3.1267
Epoch [23/60], Batch [120/447], Loss: 2.3490
Epoch [23/60], Batch [130/447], Loss: 3.0572
Epoch [23/60], Batch [140/447], Loss: 2.9143
Epoch [23/60], Batch [150/447], Loss: 2.3163
Epoch [23/60], Batch [160/447], Loss: 2.2747
Epoch [23/60], Batch [170/447], Loss: 2.5982
Epoch [23/60], Batch [180/447], Loss: 2.9736
Epoch [23/60], Batch [190/447], Loss: 2.4592
Epoch [23/60], Batch [200/447], Loss: 2.1796
Epoch [23/60], Batch [210/447], Loss: 2.7711
Epoch [23/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [24/60], Batch [0/447], Loss: 2.6724
Epoch [24/60], Batch [10/447], Loss: 2.7783
Epoch [24/60], Batch [20/447], Loss: 2.8574
Epoch [24/60], Batch [30/447], Loss: 2.2569
Epoch [24/60], Batch [40/447], Loss: 2.2835
Epoch [24/60], Batch [50/447], Loss: 2.5523
Epoch [24/60], Batch [60/447], Loss: 2.8062
Epoch [24/60], Batch [70/447], Loss: 2.2304
Epoch [24/60], Batch [80/447], Loss: 2.8960
Epoch [24/60], Batch [90/447], Loss: 2.7848
Epoch [24/60], Batch [100/447], Loss: 2.0634
Epoch [24/60], Batch [110/447], Loss: 2.6460
Epoch [24/60], Batch [120/447], Loss: 2.5223
Epoch [24/60], Batch [130/447], Loss: 2.7933
Epoch [24/60], Batch [140/447], Loss: 2.1508
Epoch [24/60], Batch [150/447], Loss: 2.8360
Epoch [24/60], Batch [160/447], Loss: 2.1057
Epoch [24/60], Batch [170/447], Loss: 2.7084
Epoch [24/60], Batch [180/447], Loss: 2.6956
Epoch [24/60], Batch [190/447], Loss: 1.6226
Epoch [24/60], Batch [200/447], Loss: 2.0703
Epoch [24/60], Batch [210/447], Loss: 3.0079
Epoch [24/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [25/60], Batch [0/447], Loss: 2.2047
Epoch [25/60], Batch [10/447], Loss: 2.1030
Epoch [25/60], Batch [20/447], Loss: 2.5180
Epoch [25/60], Batch [30/447], Loss: 2.5985
Epoch [25/60], Batch [40/447], Loss: 2.6972
Epoch [25/60], Batch [50/447], Loss: 2.7947
Epoch [25/60], Batch [60/447], Loss: 2.7519
Epoch [25/60], Batch [70/447], Loss: 1.8719
Epoch [25/60], Batch [80/447], Loss: 2.6991
Epoch [25/60], Batch [90/447], Loss: 2.4637
Epoch [25/60], Batch [100/447], Loss: 3.3224
Epoch [25/60], Batch [110/447], Loss: 3.0468
Epoch [25/60], Batch [120/447], Loss: 2.4607
Epoch [25/60], Batch [130/447], Loss: 2.4476
Epoch [25/60], Batch [140/447], Loss: 2.3785
Epoch [25/60], Batch [150/447], Loss: 2.3554
Epoch [25/60], Batch [160/447], Loss: 2.3166
Epoch [25/60], Batch [170/447], Loss: 2.4405
Epoch [25/60], Batch [180/447], Loss: 2.4450
Epoch [25/60], Batch [190/447], Loss: 3.0413
Epoch [25/60], Batch [200/447], Loss: 2.4816
Epoch [25/60], Batch [210/447], Loss: 2.4009
Epoch [25/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [26/60], Batch [0/447], Loss: 2.7114
Epoch [26/60], Batch [10/447], Loss: 2.9130
Epoch [26/60], Batch [20/447], Loss: 2.8538
Epoch [26/60], Batch [30/447], Loss: 2.4134
Epoch [26/60], Batch [40/447], Loss: 2.7722
Epoch [26/60], Batch [50/447], Loss: 2.4164
Epoch [26/60], Batch [60/447], Loss: 2.6552
Epoch [26/60], Batch [70/447], Loss: 2.9774
Epoch [26/60], Batch [80/447], Loss: 2.6945
Epoch [26/60], Batch [90/447], Loss: 2.8045
Epoch [26/60], Batch [100/447], Loss: 2.6905
Epoch [26/60], Batch [110/447], Loss: 2.9375
Epoch [26/60], Batch [120/447], Loss: 2.3551
Epoch [26/60], Batch [130/447], Loss: 2.2379
Epoch [26/60], Batch [140/447], Loss: 2.9750
Epoch [26/60], Batch [150/447], Loss: 2.8916
Epoch [26/60], Batch [160/447], Loss: 2.4053
Epoch [26/60], Batch [170/447], Loss: 2.1512
Epoch [26/60], Batch [180/447], Loss: 2.9918
Epoch [26/60], Batch [190/447], Loss: 2.9695
Epoch [26/60], Batch [200/447], Loss: 2.8793
Epoch [26/60], Batch [210/447], Loss: 2.9887
Epoch [26/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [27/60], Batch [0/447], Loss: 2.8533
Epoch [27/60], Batch [10/447], Loss: 2.3979
Epoch [27/60], Batch [20/447], Loss: 2.6925
Epoch [27/60], Batch [30/447], Loss: 3.0281
Epoch [27/60], Batch [40/447], Loss: 2.7315
Epoch [27/60], Batch [50/447], Loss: 2.7588
Epoch [27/60], Batch [60/447], Loss: 2.4208
Epoch [27/60], Batch [70/447], Loss: 2.5974
Epoch [27/60], Batch [80/447], Loss: 2.9017
Epoch [27/60], Batch [90/447], Loss: 1.9124
Epoch [27/60], Batch [100/447], Loss: 2.0091
Epoch [27/60], Batch [110/447], Loss: 2.4029
Epoch [27/60], Batch [120/447], Loss: 2.6159
Epoch [27/60], Batch [130/447], Loss: 2.5700
Epoch [27/60], Batch [140/447], Loss: 2.2932
Epoch [27/60], Batch [150/447], Loss: 3.1245
Epoch [27/60], Batch [160/447], Loss: 2.5771
Epoch [27/60], Batch [170/447], Loss: 2.6007
Epoch [27/60], Batch [180/447], Loss: 2.1732
Epoch [27/60], Batch [190/447], Loss: 3.0084
Epoch [27/60], Batch [200/447], Loss: 2.8911
Epoch [27/60], Batch [210/447], Loss: 2.3587
Epoch [27/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [28/60], Batch [0/447], Loss: 3.0897
Epoch [28/60], Batch [10/447], Loss: 2.1244
Epoch [28/60], Batch [20/447], Loss: 2.7589
Epoch [28/60], Batch [30/447], Loss: 2.6488
Epoch [28/60], Batch [40/447], Loss: 2.9059
Epoch [28/60], Batch [50/447], Loss: 2.5214
Epoch [28/60], Batch [60/447], Loss: 2.1002
Epoch [28/60], Batch [70/447], Loss: 2.9062
Epoch [28/60], Batch [80/447], Loss: 2.4081
Epoch [28/60], Batch [90/447], Loss: 1.7031
Epoch [28/60], Batch [100/447], Loss: 2.5171
Epoch [28/60], Batch [110/447], Loss: 2.9459
Epoch [28/60], Batch [120/447], Loss: 3.1318
Epoch [28/60], Batch [130/447], Loss: 2.2507
Epoch [28/60], Batch [140/447], Loss: 2.0312
Epoch [28/60], Batch [150/447], Loss: 2.2053
Epoch [28/60], Batch [160/447], Loss: 2.5445
Epoch [28/60], Batch [170/447], Loss: 2.6694
Epoch [28/60], Batch [180/447], Loss: 2.6750
Epoch [28/60], Batch [190/447], Loss: 2.4506
Epoch [28/60], Batch [200/447], Loss: 3.0750
Epoch [28/60], Batch [210/447], Loss: 2.7538
Epoch [28/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [29/60], Batch [0/447], Loss: 2.7377
Epoch [29/60], Batch [10/447], Loss: 2.0249
Epoch [29/60], Batch [20/447], Loss: 2.6245
Epoch [29/60], Batch [30/447], Loss: 2.8694
Epoch [29/60], Batch [40/447], Loss: 2.1010
Epoch [29/60], Batch [50/447], Loss: 2.1283
Epoch [29/60], Batch [60/447], Loss: 2.5582
Epoch [29/60], Batch [70/447], Loss: 2.5209
Epoch [29/60], Batch [80/447], Loss: 2.0518
Epoch [29/60], Batch [90/447], Loss: 2.6515
Epoch [29/60], Batch [100/447], Loss: 3.0409
Epoch [29/60], Batch [110/447], Loss: 2.7798
Epoch [29/60], Batch [120/447], Loss: 2.9257
Epoch [29/60], Batch [130/447], Loss: 2.6120
Epoch [29/60], Batch [140/447], Loss: 2.7111
Epoch [29/60], Batch [150/447], Loss: 2.5927
Epoch [29/60], Batch [160/447], Loss: 2.6038
Epoch [29/60], Batch [170/447], Loss: 2.2551
Epoch [29/60], Batch [180/447], Loss: 1.3851
Epoch [29/60], Batch [190/447], Loss: 2.5711
Epoch [29/60], Batch [200/447], Loss: 2.7550
Epoch [29/60], Batch [210/447], Loss: 2.2540
Epoch [29/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [30/60], Batch [0/447], Loss: 2.4545
Epoch [30/60], Batch [10/447], Loss: 2.3211
Epoch [30/60], Batch [20/447], Loss: 2.3782
Epoch [30/60], Batch [30/447], Loss: 2.8150
Epoch [30/60], Batch [40/447], Loss: 2.6375
Epoch [30/60], Batch [50/447], Loss: 2.9893
Epoch [30/60], Batch [60/447], Loss: 2.1273
Epoch [30/60], Batch [70/447], Loss: 2.2457
Epoch [30/60], Batch [80/447], Loss: 2.1304
Epoch [30/60], Batch [90/447], Loss: 2.3079
Epoch [30/60], Batch [100/447], Loss: 2.6596
Epoch [30/60], Batch [110/447], Loss: 2.4968
Epoch [30/60], Batch [120/447], Loss: 2.6730
Epoch [30/60], Batch [130/447], Loss: 2.5881
Epoch [30/60], Batch [140/447], Loss: 2.3850
Epoch [30/60], Batch [150/447], Loss: 2.1524
Epoch [30/60], Batch [160/447], Loss: 2.1138
Epoch [30/60], Batch [170/447], Loss: 2.7033
Epoch [30/60], Batch [180/447], Loss: 2.5196
Epoch [30/60], Batch [190/447], Loss: 2.6200
Epoch [30/60], Batch [200/447], Loss: 2.4813
Epoch [30/60], Batch [210/447], Loss: 2.7767
Epoch [30/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [31/60], Batch [0/447], Loss: 2.7957
Epoch [31/60], Batch [10/447], Loss: 2.7568
Epoch [31/60], Batch [20/447], Loss: 2.4537
Epoch [31/60], Batch [30/447], Loss: 2.5973
Epoch [31/60], Batch [40/447], Loss: 2.2121
Epoch [31/60], Batch [50/447], Loss: 2.3639
Epoch [31/60], Batch [60/447], Loss: 2.1132
Epoch [31/60], Batch [70/447], Loss: 2.0688
Epoch [31/60], Batch [80/447], Loss: 2.7029
Epoch [31/60], Batch [90/447], Loss: 2.5145
Epoch [31/60], Batch [100/447], Loss: 2.8761
Epoch [31/60], Batch [110/447], Loss: 2.3096
Epoch [31/60], Batch [120/447], Loss: 2.4968
Epoch [31/60], Batch [130/447], Loss: 2.6722
Epoch [31/60], Batch [140/447], Loss: 2.9424
Epoch [31/60], Batch [150/447], Loss: 2.3617
Epoch [31/60], Batch [160/447], Loss: 2.9971
Epoch [31/60], Batch [170/447], Loss: 2.7930
Epoch [31/60], Batch [180/447], Loss: 2.6348
Epoch [31/60], Batch [190/447], Loss: 2.8864
Epoch [31/60], Batch [200/447], Loss: 2.6822
Epoch [31/60], Batch [210/447], Loss: 2.4669
Epoch [31/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [32/60], Batch [0/447], Loss: 2.0323
Epoch [32/60], Batch [10/447], Loss: 2.5510
Epoch [32/60], Batch [20/447], Loss: 2.6071
Epoch [32/60], Batch [30/447], Loss: 2.5947
Epoch [32/60], Batch [40/447], Loss: 2.4710
Epoch [32/60], Batch [50/447], Loss: 2.0557
Epoch [32/60], Batch [60/447], Loss: 2.9669
Epoch [32/60], Batch [70/447], Loss: 2.5132
Epoch [32/60], Batch [80/447], Loss: 2.5379
Epoch [32/60], Batch [90/447], Loss: 2.5760
Epoch [32/60], Batch [100/447], Loss: 3.0882
Epoch [32/60], Batch [110/447], Loss: 2.4650
Epoch [32/60], Batch [120/447], Loss: 2.4816
Epoch [32/60], Batch [130/447], Loss: 2.8930
Epoch [32/60], Batch [140/447], Loss: 2.4402
Epoch [32/60], Batch [150/447], Loss: 1.8823
Epoch [32/60], Batch [160/447], Loss: 2.2464
Epoch [32/60], Batch [170/447], Loss: 2.3013
Epoch [32/60], Batch [180/447], Loss: 1.8315
Epoch [32/60], Batch [190/447], Loss: 2.4714
Epoch [32/60], Batch [200/447], Loss: 2.6305
Epoch [32/60], Batch [210/447], Loss: 1.6216
Epoch [32/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [33/60], Batch [0/447], Loss: 1.9280
Epoch [33/60], Batch [10/447], Loss: 2.1081
Epoch [33/60], Batch [20/447], Loss: 2.1103
Epoch [33/60], Batch [30/447], Loss: 2.8656
Epoch [33/60], Batch [40/447], Loss: 2.1113
Epoch [33/60], Batch [50/447], Loss: 2.7538
Epoch [33/60], Batch [60/447], Loss: 2.6602
Epoch [33/60], Batch [70/447], Loss: 2.1795
Epoch [33/60], Batch [80/447], Loss: 2.7715
Epoch [33/60], Batch [90/447], Loss: 2.2475
Epoch [33/60], Batch [100/447], Loss: 2.5727
Epoch [33/60], Batch [110/447], Loss: 2.0174
Epoch [33/60], Batch [120/447], Loss: 2.1162
Epoch [33/60], Batch [130/447], Loss: 2.6847
Epoch [33/60], Batch [140/447], Loss: 3.0370
Epoch [33/60], Batch [150/447], Loss: 2.2858
Epoch [33/60], Batch [160/447], Loss: 2.7187
Epoch [33/60], Batch [170/447], Loss: 2.3900
Epoch [33/60], Batch [180/447], Loss: 1.8209
Epoch [33/60], Batch [190/447], Loss: 2.5995
Epoch [33/60], Batch [200/447], Loss: 2.8080
Epoch [33/60], Batch [210/447], Loss: 2.3728
Epoch [33/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [34/60], Batch [0/447], Loss: 2.5173
Epoch [34/60], Batch [10/447], Loss: 2.4735
Epoch [34/60], Batch [20/447], Loss: 2.4327
Epoch [34/60], Batch [30/447], Loss: 3.0189
Epoch [34/60], Batch [40/447], Loss: 2.5926
Epoch [34/60], Batch [50/447], Loss: 1.9309
Epoch [34/60], Batch [60/447], Loss: 2.2225
Epoch [34/60], Batch [70/447], Loss: 2.7572
Epoch [34/60], Batch [80/447], Loss: 2.2560
Epoch [34/60], Batch [90/447], Loss: 2.3741
Epoch [34/60], Batch [100/447], Loss: 2.3608
Epoch [34/60], Batch [110/447], Loss: 2.5058
Epoch [34/60], Batch [120/447], Loss: 2.3589
Epoch [34/60], Batch [130/447], Loss: 2.8639
Epoch [34/60], Batch [140/447], Loss: 2.3934
Epoch [34/60], Batch [150/447], Loss: 2.5270
Epoch [34/60], Batch [160/447], Loss: 2.2935
Epoch [34/60], Batch [170/447], Loss: 2.3878
Epoch [34/60], Batch [180/447], Loss: 2.8514
Epoch [34/60], Batch [190/447], Loss: 3.1633
Epoch [34/60], Batch [200/447], Loss: 3.3446
Epoch [34/60], Batch [210/447], Loss: 1.5736
Epoch [34/60], Batch 

[I 2024-12-13 05:19:12,634] Trial 1 pruned. 


Epoch [34/60], Validation Accuracy: 0.7065, Validation Loss: 1.0630
No improvement in validation accuracy for 5 epoch(s).
Early stopping at epoch 34.
Trial early stopped due to lack of improvement.
Starting a new trial...
Trial 2: alpha = 9.51207163345817
Building the model...


2024-12-13 05:19:12,975 - mmaction - INFO - load model from: https://download.openmmlab.com/mmaction/recognition/csn/ircsn_from_scratch_r50_ig65m_20210617-ce545a37.pth
2024-12-13 05:19:12,976 - mmaction - INFO - load checkpoint from http path: https://download.openmmlab.com/mmaction/recognition/csn/ircsn_from_scratch_r50_ig65m_20210617-ce545a37.pth


Model built successfully!
Starting training...


  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [1/60], Batch [0/447], Loss: 3.9044
Epoch [1/60], Batch [10/447], Loss: 4.0235
Epoch [1/60], Batch [20/447], Loss: 3.9149
Epoch [1/60], Batch [30/447], Loss: 3.9200
Epoch [1/60], Batch [40/447], Loss: 3.9618
Epoch [1/60], Batch [50/447], Loss: 3.9674
Epoch [1/60], Batch [60/447], Loss: 3.9275
Epoch [1/60], Batch [70/447], Loss: 3.9969
Epoch [1/60], Batch [80/447], Loss: 3.9918
Epoch [1/60], Batch [90/447], Loss: 4.0231
Epoch [1/60], Batch [100/447], Loss: 3.9924
Epoch [1/60], Batch [110/447], Loss: 3.9644
Epoch [1/60], Batch [120/447], Loss: 3.9879
Epoch [1/60], Batch [130/447], Loss: 3.8981
Epoch [1/60], Batch [140/447], Loss: 3.9029
Epoch [1/60], Batch [150/447], Loss: 4.0187
Epoch [1/60], Batch [160/447], Loss: 4.0556
Epoch [1/60], Batch [170/447], Loss: 3.9025
Epoch [1/60], Batch [180/447], Loss: 3.9553
Epoch [1/60], Batch [190/447], Loss: 3.9837
Epoch [1/60], Batch [200/447], Loss: 3.9733
Epoch [1/60], Batch [210/447], Loss: 3.9768
Epoch [1/60], Batch [220/447], Loss: 3.9963

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [2/60], Batch [0/447], Loss: 3.9529
Epoch [2/60], Batch [10/447], Loss: 3.8847
Epoch [2/60], Batch [20/447], Loss: 3.9070
Epoch [2/60], Batch [30/447], Loss: 3.8893
Epoch [2/60], Batch [40/447], Loss: 3.8440
Epoch [2/60], Batch [50/447], Loss: 3.8988
Epoch [2/60], Batch [60/447], Loss: 3.9737
Epoch [2/60], Batch [70/447], Loss: 3.9696
Epoch [2/60], Batch [80/447], Loss: 3.7464
Epoch [2/60], Batch [90/447], Loss: 3.8479
Epoch [2/60], Batch [100/447], Loss: 3.9531
Epoch [2/60], Batch [110/447], Loss: 3.8562
Epoch [2/60], Batch [120/447], Loss: 3.8219
Epoch [2/60], Batch [130/447], Loss: 3.7372
Epoch [2/60], Batch [140/447], Loss: 3.7390
Epoch [2/60], Batch [150/447], Loss: 3.6257
Epoch [2/60], Batch [160/447], Loss: 3.9873
Epoch [2/60], Batch [170/447], Loss: 3.6258
Epoch [2/60], Batch [180/447], Loss: 3.8039
Epoch [2/60], Batch [190/447], Loss: 3.7294
Epoch [2/60], Batch [200/447], Loss: 3.7891
Epoch [2/60], Batch [210/447], Loss: 3.6809
Epoch [2/60], Batch [220/447], Loss: 3.6298

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [3/60], Batch [0/447], Loss: 3.9228
Epoch [3/60], Batch [10/447], Loss: 3.8095
Epoch [3/60], Batch [20/447], Loss: 3.8536
Epoch [3/60], Batch [30/447], Loss: 3.4458
Epoch [3/60], Batch [40/447], Loss: 3.5439
Epoch [3/60], Batch [50/447], Loss: 3.9945
Epoch [3/60], Batch [60/447], Loss: 3.5277
Epoch [3/60], Batch [70/447], Loss: 3.7779
Epoch [3/60], Batch [80/447], Loss: 3.5835
Epoch [3/60], Batch [90/447], Loss: 3.9038
Epoch [3/60], Batch [100/447], Loss: 3.5456
Epoch [3/60], Batch [110/447], Loss: 3.8249
Epoch [3/60], Batch [120/447], Loss: 3.6696
Epoch [3/60], Batch [130/447], Loss: 3.7815
Epoch [3/60], Batch [140/447], Loss: 3.7689
Epoch [3/60], Batch [150/447], Loss: 3.8447
Epoch [3/60], Batch [160/447], Loss: 3.6694
Epoch [3/60], Batch [170/447], Loss: 3.8187
Epoch [3/60], Batch [180/447], Loss: 3.5936
Epoch [3/60], Batch [190/447], Loss: 3.8898
Epoch [3/60], Batch [200/447], Loss: 3.6898
Epoch [3/60], Batch [210/447], Loss: 3.7822
Epoch [3/60], Batch [220/447], Loss: 3.8368

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [4/60], Batch [0/447], Loss: 3.6494
Epoch [4/60], Batch [10/447], Loss: 3.5574
Epoch [4/60], Batch [20/447], Loss: 3.7604
Epoch [4/60], Batch [30/447], Loss: 3.8097
Epoch [4/60], Batch [40/447], Loss: 3.5159
Epoch [4/60], Batch [50/447], Loss: 3.7861
Epoch [4/60], Batch [60/447], Loss: 3.4266
Epoch [4/60], Batch [70/447], Loss: 3.5920
Epoch [4/60], Batch [80/447], Loss: 3.2657
Epoch [4/60], Batch [90/447], Loss: 3.7354
Epoch [4/60], Batch [100/447], Loss: 3.8007
Epoch [4/60], Batch [110/447], Loss: 3.7860
Epoch [4/60], Batch [120/447], Loss: 3.6252
Epoch [4/60], Batch [130/447], Loss: 3.6412
Epoch [4/60], Batch [140/447], Loss: 3.7515
Epoch [4/60], Batch [150/447], Loss: 3.6059
Epoch [4/60], Batch [160/447], Loss: 3.7388
Epoch [4/60], Batch [170/447], Loss: 3.5229
Epoch [4/60], Batch [180/447], Loss: 3.4978
Epoch [4/60], Batch [190/447], Loss: 3.1617
Epoch [4/60], Batch [200/447], Loss: 3.7107
Epoch [4/60], Batch [210/447], Loss: 3.7431
Epoch [4/60], Batch [220/447], Loss: 3.6796

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [5/60], Batch [0/447], Loss: 3.4884
Epoch [5/60], Batch [10/447], Loss: 3.4895
Epoch [5/60], Batch [20/447], Loss: 3.7385
Epoch [5/60], Batch [30/447], Loss: 3.8392
Epoch [5/60], Batch [40/447], Loss: 3.5093
Epoch [5/60], Batch [50/447], Loss: 3.6488
Epoch [5/60], Batch [60/447], Loss: 3.6551
Epoch [5/60], Batch [70/447], Loss: 3.6853
Epoch [5/60], Batch [80/447], Loss: 3.4556
Epoch [5/60], Batch [90/447], Loss: 3.5884
Epoch [5/60], Batch [100/447], Loss: 3.6040
Epoch [5/60], Batch [110/447], Loss: 3.8405
Epoch [5/60], Batch [120/447], Loss: 3.5802
Epoch [5/60], Batch [130/447], Loss: 3.6668
Epoch [5/60], Batch [140/447], Loss: 3.3104
Epoch [5/60], Batch [150/447], Loss: 3.3501
Epoch [5/60], Batch [160/447], Loss: 3.5118
Epoch [5/60], Batch [170/447], Loss: 3.3689
Epoch [5/60], Batch [180/447], Loss: 3.4601
Epoch [5/60], Batch [190/447], Loss: 3.6423
Epoch [5/60], Batch [200/447], Loss: 3.6512
Epoch [5/60], Batch [210/447], Loss: 3.7485
Epoch [5/60], Batch [220/447], Loss: 3.7664

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [6/60], Batch [0/447], Loss: 3.5619
Epoch [6/60], Batch [10/447], Loss: 3.3994
Epoch [6/60], Batch [20/447], Loss: 3.5698
Epoch [6/60], Batch [30/447], Loss: 3.6781
Epoch [6/60], Batch [40/447], Loss: 3.1058
Epoch [6/60], Batch [50/447], Loss: 3.5399
Epoch [6/60], Batch [60/447], Loss: 3.3920
Epoch [6/60], Batch [70/447], Loss: 3.4841
Epoch [6/60], Batch [80/447], Loss: 2.9951
Epoch [6/60], Batch [90/447], Loss: 3.7426
Epoch [6/60], Batch [100/447], Loss: 3.6085
Epoch [6/60], Batch [110/447], Loss: 3.7494
Epoch [6/60], Batch [120/447], Loss: 3.2701
Epoch [6/60], Batch [130/447], Loss: 3.5619
Epoch [6/60], Batch [140/447], Loss: 3.3659
Epoch [6/60], Batch [150/447], Loss: 3.3423
Epoch [6/60], Batch [160/447], Loss: 3.6693
Epoch [6/60], Batch [170/447], Loss: 3.5407
Epoch [6/60], Batch [180/447], Loss: 3.6057
Epoch [6/60], Batch [190/447], Loss: 3.5852
Epoch [6/60], Batch [200/447], Loss: 3.5935
Epoch [6/60], Batch [210/447], Loss: 3.5034
Epoch [6/60], Batch [220/447], Loss: 3.4897

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [7/60], Batch [0/447], Loss: 3.2117
Epoch [7/60], Batch [10/447], Loss: 3.1759
Epoch [7/60], Batch [20/447], Loss: 3.4589
Epoch [7/60], Batch [30/447], Loss: 3.5256
Epoch [7/60], Batch [40/447], Loss: 3.6177
Epoch [7/60], Batch [50/447], Loss: 3.4923
Epoch [7/60], Batch [60/447], Loss: 3.4567
Epoch [7/60], Batch [70/447], Loss: 3.1770
Epoch [7/60], Batch [80/447], Loss: 3.1764
Epoch [7/60], Batch [90/447], Loss: 2.9410
Epoch [7/60], Batch [100/447], Loss: 2.9909
Epoch [7/60], Batch [110/447], Loss: 3.3608
Epoch [7/60], Batch [120/447], Loss: 3.2729
Epoch [7/60], Batch [130/447], Loss: 3.3861
Epoch [7/60], Batch [140/447], Loss: 3.6582
Epoch [7/60], Batch [150/447], Loss: 3.3052
Epoch [7/60], Batch [160/447], Loss: 3.4983
Epoch [7/60], Batch [170/447], Loss: 3.0692
Epoch [7/60], Batch [180/447], Loss: 3.5157
Epoch [7/60], Batch [190/447], Loss: 3.7506
Epoch [7/60], Batch [200/447], Loss: 3.5354
Epoch [7/60], Batch [210/447], Loss: 3.8401
Epoch [7/60], Batch [220/447], Loss: 3.4609

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [8/60], Batch [0/447], Loss: 3.3100
Epoch [8/60], Batch [10/447], Loss: 3.3331
Epoch [8/60], Batch [20/447], Loss: 3.3375
Epoch [8/60], Batch [30/447], Loss: 2.8186
Epoch [8/60], Batch [40/447], Loss: 3.3902
Epoch [8/60], Batch [50/447], Loss: 3.3400
Epoch [8/60], Batch [60/447], Loss: 3.2312
Epoch [8/60], Batch [70/447], Loss: 3.1549
Epoch [8/60], Batch [80/447], Loss: 3.6499
Epoch [8/60], Batch [90/447], Loss: 3.1801
Epoch [8/60], Batch [100/447], Loss: 3.3746
Epoch [8/60], Batch [110/447], Loss: 3.3539
Epoch [8/60], Batch [120/447], Loss: 3.5238
Epoch [8/60], Batch [130/447], Loss: 3.3527
Epoch [8/60], Batch [140/447], Loss: 3.2490
Epoch [8/60], Batch [150/447], Loss: 3.1363
Epoch [8/60], Batch [160/447], Loss: 2.8836
Epoch [8/60], Batch [170/447], Loss: 3.3578
Epoch [8/60], Batch [180/447], Loss: 3.2434
Epoch [8/60], Batch [190/447], Loss: 3.3852
Epoch [8/60], Batch [200/447], Loss: 3.5993
Epoch [8/60], Batch [210/447], Loss: 3.0461
Epoch [8/60], Batch [220/447], Loss: 3.5025

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [9/60], Batch [0/447], Loss: 3.4388
Epoch [9/60], Batch [10/447], Loss: 3.1822
Epoch [9/60], Batch [20/447], Loss: 3.0097
Epoch [9/60], Batch [30/447], Loss: 3.3174
Epoch [9/60], Batch [40/447], Loss: 3.6837
Epoch [9/60], Batch [50/447], Loss: 3.4138
Epoch [9/60], Batch [60/447], Loss: 3.2854
Epoch [9/60], Batch [70/447], Loss: 3.5476
Epoch [9/60], Batch [80/447], Loss: 3.5405
Epoch [9/60], Batch [90/447], Loss: 3.3155
Epoch [9/60], Batch [100/447], Loss: 3.4252
Epoch [9/60], Batch [110/447], Loss: 3.4898
Epoch [9/60], Batch [120/447], Loss: 3.1771
Epoch [9/60], Batch [130/447], Loss: 3.2207
Epoch [9/60], Batch [140/447], Loss: 3.3727
Epoch [9/60], Batch [150/447], Loss: 2.9445
Epoch [9/60], Batch [160/447], Loss: 3.1035
Epoch [9/60], Batch [170/447], Loss: 3.2705
Epoch [9/60], Batch [180/447], Loss: 3.1956
Epoch [9/60], Batch [190/447], Loss: 3.3927
Epoch [9/60], Batch [200/447], Loss: 3.5092
Epoch [9/60], Batch [210/447], Loss: 3.3499
Epoch [9/60], Batch [220/447], Loss: 2.8557

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [10/60], Batch [0/447], Loss: 3.5740
Epoch [10/60], Batch [10/447], Loss: 3.6522
Epoch [10/60], Batch [20/447], Loss: 2.7347
Epoch [10/60], Batch [30/447], Loss: 3.1405
Epoch [10/60], Batch [40/447], Loss: 3.0538
Epoch [10/60], Batch [50/447], Loss: 3.2533
Epoch [10/60], Batch [60/447], Loss: 3.1348
Epoch [10/60], Batch [70/447], Loss: 3.2445
Epoch [10/60], Batch [80/447], Loss: 2.8989
Epoch [10/60], Batch [90/447], Loss: 3.4014
Epoch [10/60], Batch [100/447], Loss: 3.3580
Epoch [10/60], Batch [110/447], Loss: 3.0051
Epoch [10/60], Batch [120/447], Loss: 3.1547
Epoch [10/60], Batch [130/447], Loss: 3.6995
Epoch [10/60], Batch [140/447], Loss: 3.4130
Epoch [10/60], Batch [150/447], Loss: 3.1522
Epoch [10/60], Batch [160/447], Loss: 3.0599
Epoch [10/60], Batch [170/447], Loss: 2.9898
Epoch [10/60], Batch [180/447], Loss: 3.4374
Epoch [10/60], Batch [190/447], Loss: 2.8501
Epoch [10/60], Batch [200/447], Loss: 3.3591
Epoch [10/60], Batch [210/447], Loss: 3.3322
Epoch [10/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [11/60], Batch [0/447], Loss: 3.2913
Epoch [11/60], Batch [10/447], Loss: 3.1628
Epoch [11/60], Batch [20/447], Loss: 3.1967
Epoch [11/60], Batch [30/447], Loss: 2.8967
Epoch [11/60], Batch [40/447], Loss: 3.2808
Epoch [11/60], Batch [50/447], Loss: 3.4537
Epoch [11/60], Batch [60/447], Loss: 3.0043
Epoch [11/60], Batch [70/447], Loss: 2.8296
Epoch [11/60], Batch [80/447], Loss: 3.0058
Epoch [11/60], Batch [90/447], Loss: 3.3328
Epoch [11/60], Batch [100/447], Loss: 3.4886
Epoch [11/60], Batch [110/447], Loss: 3.1755
Epoch [11/60], Batch [120/447], Loss: 2.9012
Epoch [11/60], Batch [130/447], Loss: 2.8189
Epoch [11/60], Batch [140/447], Loss: 2.9339
Epoch [11/60], Batch [150/447], Loss: 2.9170
Epoch [11/60], Batch [160/447], Loss: 2.7851
Epoch [11/60], Batch [170/447], Loss: 3.1170
Epoch [11/60], Batch [180/447], Loss: 3.3544
Epoch [11/60], Batch [190/447], Loss: 3.4038
Epoch [11/60], Batch [200/447], Loss: 3.0195
Epoch [11/60], Batch [210/447], Loss: 2.5937
Epoch [11/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [12/60], Batch [0/447], Loss: 3.1305
Epoch [12/60], Batch [10/447], Loss: 3.2571
Epoch [12/60], Batch [20/447], Loss: 3.2562
Epoch [12/60], Batch [30/447], Loss: 3.2556
Epoch [12/60], Batch [40/447], Loss: 2.3092
Epoch [12/60], Batch [50/447], Loss: 2.8549
Epoch [12/60], Batch [60/447], Loss: 3.4699
Epoch [12/60], Batch [70/447], Loss: 2.7427
Epoch [12/60], Batch [80/447], Loss: 3.6149
Epoch [12/60], Batch [90/447], Loss: 3.3037
Epoch [12/60], Batch [100/447], Loss: 2.7043
Epoch [12/60], Batch [110/447], Loss: 2.8950
Epoch [12/60], Batch [120/447], Loss: 2.9197
Epoch [12/60], Batch [130/447], Loss: 3.4682
Epoch [12/60], Batch [140/447], Loss: 2.8884
Epoch [12/60], Batch [150/447], Loss: 2.8917
Epoch [12/60], Batch [160/447], Loss: 2.5918
Epoch [12/60], Batch [170/447], Loss: 3.3621
Epoch [12/60], Batch [180/447], Loss: 3.6061
Epoch [12/60], Batch [190/447], Loss: 3.2141
Epoch [12/60], Batch [200/447], Loss: 3.1781
Epoch [12/60], Batch [210/447], Loss: 2.5670
Epoch [12/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [13/60], Batch [0/447], Loss: 2.9409
Epoch [13/60], Batch [10/447], Loss: 3.0078
Epoch [13/60], Batch [20/447], Loss: 2.8945
Epoch [13/60], Batch [30/447], Loss: 3.1241
Epoch [13/60], Batch [40/447], Loss: 3.3597
Epoch [13/60], Batch [50/447], Loss: 3.1602
Epoch [13/60], Batch [60/447], Loss: 3.2381
Epoch [13/60], Batch [70/447], Loss: 2.9883
Epoch [13/60], Batch [80/447], Loss: 3.2510
Epoch [13/60], Batch [90/447], Loss: 2.8726
Epoch [13/60], Batch [100/447], Loss: 3.7649
Epoch [13/60], Batch [110/447], Loss: 2.4579
Epoch [13/60], Batch [120/447], Loss: 2.9411
Epoch [13/60], Batch [130/447], Loss: 3.2315
Epoch [13/60], Batch [140/447], Loss: 3.3625
Epoch [13/60], Batch [150/447], Loss: 2.5418
Epoch [13/60], Batch [160/447], Loss: 3.1394
Epoch [13/60], Batch [170/447], Loss: 3.5315
Epoch [13/60], Batch [180/447], Loss: 2.8929
Epoch [13/60], Batch [190/447], Loss: 3.1785
Epoch [13/60], Batch [200/447], Loss: 3.2470
Epoch [13/60], Batch [210/447], Loss: 2.7544
Epoch [13/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [14/60], Batch [0/447], Loss: 2.6532
Epoch [14/60], Batch [10/447], Loss: 2.5555
Epoch [14/60], Batch [20/447], Loss: 3.0196
Epoch [14/60], Batch [30/447], Loss: 2.3100
Epoch [14/60], Batch [40/447], Loss: 3.0028
Epoch [14/60], Batch [50/447], Loss: 2.6415
Epoch [14/60], Batch [60/447], Loss: 3.4866
Epoch [14/60], Batch [70/447], Loss: 3.0893
Epoch [14/60], Batch [80/447], Loss: 3.0699
Epoch [14/60], Batch [90/447], Loss: 3.0008
Epoch [14/60], Batch [100/447], Loss: 2.8008
Epoch [14/60], Batch [110/447], Loss: 2.6695
Epoch [14/60], Batch [120/447], Loss: 3.0403
Epoch [14/60], Batch [130/447], Loss: 3.0414
Epoch [14/60], Batch [140/447], Loss: 3.2540
Epoch [14/60], Batch [150/447], Loss: 3.0145
Epoch [14/60], Batch [160/447], Loss: 2.7940
Epoch [14/60], Batch [170/447], Loss: 3.0961
Epoch [14/60], Batch [180/447], Loss: 2.7718
Epoch [14/60], Batch [190/447], Loss: 2.4489
Epoch [14/60], Batch [200/447], Loss: 3.1297
Epoch [14/60], Batch [210/447], Loss: 2.9418
Epoch [14/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [15/60], Batch [0/447], Loss: 3.1952
Epoch [15/60], Batch [10/447], Loss: 2.6709
Epoch [15/60], Batch [20/447], Loss: 2.9835
Epoch [15/60], Batch [30/447], Loss: 3.0297
Epoch [15/60], Batch [40/447], Loss: 2.7407
Epoch [15/60], Batch [50/447], Loss: 3.0780
Epoch [15/60], Batch [60/447], Loss: 2.8941
Epoch [15/60], Batch [70/447], Loss: 2.8460
Epoch [15/60], Batch [80/447], Loss: 3.0316
Epoch [15/60], Batch [90/447], Loss: 3.0642
Epoch [15/60], Batch [100/447], Loss: 3.0957
Epoch [15/60], Batch [110/447], Loss: 3.3881
Epoch [15/60], Batch [120/447], Loss: 2.7242
Epoch [15/60], Batch [130/447], Loss: 2.6683
Epoch [15/60], Batch [140/447], Loss: 3.3485
Epoch [15/60], Batch [150/447], Loss: 2.7776
Epoch [15/60], Batch [160/447], Loss: 2.2500
Epoch [15/60], Batch [170/447], Loss: 2.9616
Epoch [15/60], Batch [180/447], Loss: 2.8290
Epoch [15/60], Batch [190/447], Loss: 2.4555
Epoch [15/60], Batch [200/447], Loss: 2.6350
Epoch [15/60], Batch [210/447], Loss: 2.7219
Epoch [15/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [16/60], Batch [0/447], Loss: 3.0691
Epoch [16/60], Batch [10/447], Loss: 2.5703
Epoch [16/60], Batch [20/447], Loss: 2.9050
Epoch [16/60], Batch [30/447], Loss: 3.4757
Epoch [16/60], Batch [40/447], Loss: 2.4753
Epoch [16/60], Batch [50/447], Loss: 2.9783
Epoch [16/60], Batch [60/447], Loss: 2.4921
Epoch [16/60], Batch [70/447], Loss: 3.1042
Epoch [16/60], Batch [80/447], Loss: 2.3535
Epoch [16/60], Batch [90/447], Loss: 2.7013
Epoch [16/60], Batch [100/447], Loss: 2.9762
Epoch [16/60], Batch [110/447], Loss: 2.7370
Epoch [16/60], Batch [120/447], Loss: 2.9373
Epoch [16/60], Batch [130/447], Loss: 2.8445
Epoch [16/60], Batch [140/447], Loss: 3.2963
Epoch [16/60], Batch [150/447], Loss: 3.2539
Epoch [16/60], Batch [160/447], Loss: 2.6700
Epoch [16/60], Batch [170/447], Loss: 3.4605
Epoch [16/60], Batch [180/447], Loss: 2.7055
Epoch [16/60], Batch [190/447], Loss: 2.6468
Epoch [16/60], Batch [200/447], Loss: 3.0384
Epoch [16/60], Batch [210/447], Loss: 3.2043
Epoch [16/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [17/60], Batch [0/447], Loss: 3.1039
Epoch [17/60], Batch [10/447], Loss: 2.7242
Epoch [17/60], Batch [20/447], Loss: 2.7886
Epoch [17/60], Batch [30/447], Loss: 2.8514
Epoch [17/60], Batch [40/447], Loss: 2.6610
Epoch [17/60], Batch [50/447], Loss: 2.5132
Epoch [17/60], Batch [60/447], Loss: 3.3696
Epoch [17/60], Batch [70/447], Loss: 3.0088
Epoch [17/60], Batch [80/447], Loss: 3.2112
Epoch [17/60], Batch [90/447], Loss: 3.0471
Epoch [17/60], Batch [100/447], Loss: 2.4564
Epoch [17/60], Batch [110/447], Loss: 3.1070
Epoch [17/60], Batch [120/447], Loss: 2.8807
Epoch [17/60], Batch [130/447], Loss: 3.5052
Epoch [17/60], Batch [140/447], Loss: 3.4421
Epoch [17/60], Batch [150/447], Loss: 3.3243
Epoch [17/60], Batch [160/447], Loss: 2.8331
Epoch [17/60], Batch [170/447], Loss: 2.7897
Epoch [17/60], Batch [180/447], Loss: 2.7497
Epoch [17/60], Batch [190/447], Loss: 3.1484
Epoch [17/60], Batch [200/447], Loss: 3.2467
Epoch [17/60], Batch [210/447], Loss: 2.7888
Epoch [17/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [18/60], Batch [0/447], Loss: 2.7275
Epoch [18/60], Batch [10/447], Loss: 3.0074
Epoch [18/60], Batch [20/447], Loss: 3.4704
Epoch [18/60], Batch [30/447], Loss: 3.3135
Epoch [18/60], Batch [40/447], Loss: 2.2498
Epoch [18/60], Batch [50/447], Loss: 2.2697
Epoch [18/60], Batch [60/447], Loss: 2.9714
Epoch [18/60], Batch [70/447], Loss: 3.0566
Epoch [18/60], Batch [80/447], Loss: 2.8189
Epoch [18/60], Batch [90/447], Loss: 2.9814
Epoch [18/60], Batch [100/447], Loss: 2.7394
Epoch [18/60], Batch [110/447], Loss: 3.3267
Epoch [18/60], Batch [120/447], Loss: 2.8852
Epoch [18/60], Batch [130/447], Loss: 3.0302
Epoch [18/60], Batch [140/447], Loss: 2.6964
Epoch [18/60], Batch [150/447], Loss: 2.8253
Epoch [18/60], Batch [160/447], Loss: 2.7829
Epoch [18/60], Batch [170/447], Loss: 2.2049
Epoch [18/60], Batch [180/447], Loss: 2.6582
Epoch [18/60], Batch [190/447], Loss: 2.5453
Epoch [18/60], Batch [200/447], Loss: 3.4524
Epoch [18/60], Batch [210/447], Loss: 3.4458
Epoch [18/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [19/60], Batch [0/447], Loss: 2.7345
Epoch [19/60], Batch [10/447], Loss: 2.5098
Epoch [19/60], Batch [20/447], Loss: 2.9449
Epoch [19/60], Batch [30/447], Loss: 3.0966
Epoch [19/60], Batch [40/447], Loss: 2.4476
Epoch [19/60], Batch [50/447], Loss: 2.7475
Epoch [19/60], Batch [60/447], Loss: 3.1199
Epoch [19/60], Batch [70/447], Loss: 2.1035
Epoch [19/60], Batch [80/447], Loss: 2.7073
Epoch [19/60], Batch [90/447], Loss: 3.3649
Epoch [19/60], Batch [100/447], Loss: 2.8026
Epoch [19/60], Batch [110/447], Loss: 3.0922
Epoch [19/60], Batch [120/447], Loss: 2.0799
Epoch [19/60], Batch [130/447], Loss: 2.7482
Epoch [19/60], Batch [140/447], Loss: 2.9467
Epoch [19/60], Batch [150/447], Loss: 2.5216
Epoch [19/60], Batch [160/447], Loss: 2.3771
Epoch [19/60], Batch [170/447], Loss: 2.5938
Epoch [19/60], Batch [180/447], Loss: 2.4811
Epoch [19/60], Batch [190/447], Loss: 2.9355
Epoch [19/60], Batch [200/447], Loss: 2.1851
Epoch [19/60], Batch [210/447], Loss: 2.5126
Epoch [19/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [20/60], Batch [0/447], Loss: 3.1506
Epoch [20/60], Batch [10/447], Loss: 2.4237
Epoch [20/60], Batch [20/447], Loss: 2.8799
Epoch [20/60], Batch [30/447], Loss: 3.2465
Epoch [20/60], Batch [40/447], Loss: 3.0465
Epoch [20/60], Batch [50/447], Loss: 2.8885
Epoch [20/60], Batch [60/447], Loss: 2.2769
Epoch [20/60], Batch [70/447], Loss: 1.9509
Epoch [20/60], Batch [80/447], Loss: 3.1041
Epoch [20/60], Batch [90/447], Loss: 2.6409
Epoch [20/60], Batch [100/447], Loss: 2.7179
Epoch [20/60], Batch [110/447], Loss: 2.7812
Epoch [20/60], Batch [120/447], Loss: 3.1322
Epoch [20/60], Batch [130/447], Loss: 2.9031
Epoch [20/60], Batch [140/447], Loss: 3.1290
Epoch [20/60], Batch [150/447], Loss: 2.5457
Epoch [20/60], Batch [160/447], Loss: 2.4910
Epoch [20/60], Batch [170/447], Loss: 2.6770
Epoch [20/60], Batch [180/447], Loss: 2.8787
Epoch [20/60], Batch [190/447], Loss: 2.8234
Epoch [20/60], Batch [200/447], Loss: 2.5474
Epoch [20/60], Batch [210/447], Loss: 2.6235
Epoch [20/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [21/60], Batch [0/447], Loss: 2.7653
Epoch [21/60], Batch [10/447], Loss: 2.6147
Epoch [21/60], Batch [20/447], Loss: 2.2196
Epoch [21/60], Batch [30/447], Loss: 2.3702
Epoch [21/60], Batch [40/447], Loss: 2.8115
Epoch [21/60], Batch [50/447], Loss: 2.8582
Epoch [21/60], Batch [60/447], Loss: 2.8037
Epoch [21/60], Batch [70/447], Loss: 2.3539
Epoch [21/60], Batch [80/447], Loss: 3.0437
Epoch [21/60], Batch [90/447], Loss: 2.2303
Epoch [21/60], Batch [100/447], Loss: 2.6830
Epoch [21/60], Batch [110/447], Loss: 3.0183
Epoch [21/60], Batch [120/447], Loss: 2.4140
Epoch [21/60], Batch [130/447], Loss: 2.7165
Epoch [21/60], Batch [140/447], Loss: 2.4892
Epoch [21/60], Batch [150/447], Loss: 2.7049
Epoch [21/60], Batch [160/447], Loss: 3.0084
Epoch [21/60], Batch [170/447], Loss: 3.0181
Epoch [21/60], Batch [180/447], Loss: 2.7101
Epoch [21/60], Batch [190/447], Loss: 2.9409
Epoch [21/60], Batch [200/447], Loss: 3.2039
Epoch [21/60], Batch [210/447], Loss: 2.8912
Epoch [21/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [22/60], Batch [0/447], Loss: 2.9024
Epoch [22/60], Batch [10/447], Loss: 2.9001
Epoch [22/60], Batch [20/447], Loss: 2.8648
Epoch [22/60], Batch [30/447], Loss: 2.9036
Epoch [22/60], Batch [40/447], Loss: 2.6836
Epoch [22/60], Batch [50/447], Loss: 2.7678
Epoch [22/60], Batch [60/447], Loss: 2.4774
Epoch [22/60], Batch [70/447], Loss: 2.5605
Epoch [22/60], Batch [80/447], Loss: 2.7117
Epoch [22/60], Batch [90/447], Loss: 2.5933
Epoch [22/60], Batch [100/447], Loss: 2.7232
Epoch [22/60], Batch [110/447], Loss: 2.9711
Epoch [22/60], Batch [120/447], Loss: 2.0550
Epoch [22/60], Batch [130/447], Loss: 3.1268
Epoch [22/60], Batch [140/447], Loss: 2.2625
Epoch [22/60], Batch [150/447], Loss: 2.8504
Epoch [22/60], Batch [160/447], Loss: 1.9880
Epoch [22/60], Batch [170/447], Loss: 3.3565
Epoch [22/60], Batch [180/447], Loss: 2.6478
Epoch [22/60], Batch [190/447], Loss: 2.8328
Epoch [22/60], Batch [200/447], Loss: 2.4714
Epoch [22/60], Batch [210/447], Loss: 2.8523
Epoch [22/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [23/60], Batch [0/447], Loss: 2.2446
Epoch [23/60], Batch [10/447], Loss: 2.8726
Epoch [23/60], Batch [20/447], Loss: 2.7538
Epoch [23/60], Batch [30/447], Loss: 2.3919
Epoch [23/60], Batch [40/447], Loss: 2.8307
Epoch [23/60], Batch [50/447], Loss: 2.9107
Epoch [23/60], Batch [60/447], Loss: 2.7364
Epoch [23/60], Batch [70/447], Loss: 2.5213
Epoch [23/60], Batch [80/447], Loss: 2.7339
Epoch [23/60], Batch [90/447], Loss: 2.8628
Epoch [23/60], Batch [100/447], Loss: 2.6168
Epoch [23/60], Batch [110/447], Loss: 2.3764
Epoch [23/60], Batch [120/447], Loss: 2.8299
Epoch [23/60], Batch [130/447], Loss: 2.6700
Epoch [23/60], Batch [140/447], Loss: 2.1349
Epoch [23/60], Batch [150/447], Loss: 2.2803
Epoch [23/60], Batch [160/447], Loss: 2.2396
Epoch [23/60], Batch [170/447], Loss: 3.0371
Epoch [23/60], Batch [180/447], Loss: 2.3167
Epoch [23/60], Batch [190/447], Loss: 2.9026
Epoch [23/60], Batch [200/447], Loss: 3.1215
Epoch [23/60], Batch [210/447], Loss: 2.8917
Epoch [23/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [24/60], Batch [0/447], Loss: 2.8395
Epoch [24/60], Batch [10/447], Loss: 2.6791
Epoch [24/60], Batch [20/447], Loss: 3.0313
Epoch [24/60], Batch [30/447], Loss: 2.5088
Epoch [24/60], Batch [40/447], Loss: 2.4169
Epoch [24/60], Batch [50/447], Loss: 2.6620
Epoch [24/60], Batch [60/447], Loss: 3.0827
Epoch [24/60], Batch [70/447], Loss: 2.4722
Epoch [24/60], Batch [80/447], Loss: 2.4783
Epoch [24/60], Batch [90/447], Loss: 2.4715
Epoch [24/60], Batch [100/447], Loss: 2.6426
Epoch [24/60], Batch [110/447], Loss: 2.8565
Epoch [24/60], Batch [120/447], Loss: 2.6860
Epoch [24/60], Batch [130/447], Loss: 2.6263
Epoch [24/60], Batch [140/447], Loss: 1.9660
Epoch [24/60], Batch [150/447], Loss: 2.8036
Epoch [24/60], Batch [160/447], Loss: 2.7501
Epoch [24/60], Batch [170/447], Loss: 2.7704
Epoch [24/60], Batch [180/447], Loss: 2.3370
Epoch [24/60], Batch [190/447], Loss: 2.5851
Epoch [24/60], Batch [200/447], Loss: 2.4151
Epoch [24/60], Batch [210/447], Loss: 2.5503
Epoch [24/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [25/60], Batch [0/447], Loss: 2.8951
Epoch [25/60], Batch [10/447], Loss: 3.1029
Epoch [25/60], Batch [20/447], Loss: 2.5098
Epoch [25/60], Batch [30/447], Loss: 2.5920
Epoch [25/60], Batch [40/447], Loss: 2.9354
Epoch [25/60], Batch [50/447], Loss: 2.9088
Epoch [25/60], Batch [60/447], Loss: 2.7705
Epoch [25/60], Batch [70/447], Loss: 2.7287
Epoch [25/60], Batch [80/447], Loss: 2.8909
Epoch [25/60], Batch [90/447], Loss: 2.5186
Epoch [25/60], Batch [100/447], Loss: 1.9908
Epoch [25/60], Batch [110/447], Loss: 2.0865
Epoch [25/60], Batch [120/447], Loss: 2.1895
Epoch [25/60], Batch [130/447], Loss: 2.1135
Epoch [25/60], Batch [140/447], Loss: 2.7309
Epoch [25/60], Batch [150/447], Loss: 3.1634
Epoch [25/60], Batch [160/447], Loss: 3.1403
Epoch [25/60], Batch [170/447], Loss: 2.1140
Epoch [25/60], Batch [180/447], Loss: 3.4681
Epoch [25/60], Batch [190/447], Loss: 2.7112
Epoch [25/60], Batch [200/447], Loss: 2.7297
Epoch [25/60], Batch [210/447], Loss: 2.2877
Epoch [25/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [26/60], Batch [0/447], Loss: 2.9282
Epoch [26/60], Batch [10/447], Loss: 2.5445
Epoch [26/60], Batch [20/447], Loss: 2.6472
Epoch [26/60], Batch [30/447], Loss: 2.6708
Epoch [26/60], Batch [40/447], Loss: 3.0011
Epoch [26/60], Batch [50/447], Loss: 2.3215
Epoch [26/60], Batch [60/447], Loss: 1.8777
Epoch [26/60], Batch [70/447], Loss: 2.7408
Epoch [26/60], Batch [80/447], Loss: 2.3109
Epoch [26/60], Batch [90/447], Loss: 2.8434
Epoch [26/60], Batch [100/447], Loss: 3.2941
Epoch [26/60], Batch [110/447], Loss: 2.4518
Epoch [26/60], Batch [120/447], Loss: 2.1705
Epoch [26/60], Batch [130/447], Loss: 2.3769
Epoch [26/60], Batch [140/447], Loss: 2.4294
Epoch [26/60], Batch [150/447], Loss: 2.1720
Epoch [26/60], Batch [160/447], Loss: 3.0747
Epoch [26/60], Batch [170/447], Loss: 2.4037
Epoch [26/60], Batch [180/447], Loss: 2.3229
Epoch [26/60], Batch [190/447], Loss: 2.1806
Epoch [26/60], Batch [200/447], Loss: 2.5888
Epoch [26/60], Batch [210/447], Loss: 2.3546
Epoch [26/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [27/60], Batch [0/447], Loss: 2.9599
Epoch [27/60], Batch [10/447], Loss: 2.3579
Epoch [27/60], Batch [20/447], Loss: 2.8324
Epoch [27/60], Batch [30/447], Loss: 2.5206
Epoch [27/60], Batch [40/447], Loss: 2.8395
Epoch [27/60], Batch [50/447], Loss: 2.7642
Epoch [27/60], Batch [60/447], Loss: 2.6960
Epoch [27/60], Batch [70/447], Loss: 2.5972
Epoch [27/60], Batch [80/447], Loss: 2.8529
Epoch [27/60], Batch [90/447], Loss: 2.4735
Epoch [27/60], Batch [100/447], Loss: 2.0896
Epoch [27/60], Batch [110/447], Loss: 2.8047
Epoch [27/60], Batch [120/447], Loss: 2.5248
Epoch [27/60], Batch [130/447], Loss: 3.1385
Epoch [27/60], Batch [140/447], Loss: 2.6498
Epoch [27/60], Batch [150/447], Loss: 2.4812
Epoch [27/60], Batch [160/447], Loss: 2.7910
Epoch [27/60], Batch [170/447], Loss: 2.4972
Epoch [27/60], Batch [180/447], Loss: 2.5533
Epoch [27/60], Batch [190/447], Loss: 2.9290
Epoch [27/60], Batch [200/447], Loss: 2.2287
Epoch [27/60], Batch [210/447], Loss: 2.5440
Epoch [27/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [28/60], Batch [0/447], Loss: 2.7037
Epoch [28/60], Batch [10/447], Loss: 2.4515
Epoch [28/60], Batch [20/447], Loss: 2.8549
Epoch [28/60], Batch [30/447], Loss: 2.2908
Epoch [28/60], Batch [40/447], Loss: 2.3952
Epoch [28/60], Batch [50/447], Loss: 2.4559
Epoch [28/60], Batch [60/447], Loss: 2.7356
Epoch [28/60], Batch [70/447], Loss: 2.3586
Epoch [28/60], Batch [80/447], Loss: 2.8193
Epoch [28/60], Batch [90/447], Loss: 2.9518
Epoch [28/60], Batch [100/447], Loss: 2.6544
Epoch [28/60], Batch [110/447], Loss: 2.2237
Epoch [28/60], Batch [120/447], Loss: 2.7135
Epoch [28/60], Batch [130/447], Loss: 2.2542
Epoch [28/60], Batch [140/447], Loss: 2.6934
Epoch [28/60], Batch [150/447], Loss: 2.7490
Epoch [28/60], Batch [160/447], Loss: 2.6244
Epoch [28/60], Batch [170/447], Loss: 2.3677
Epoch [28/60], Batch [180/447], Loss: 2.1787
Epoch [28/60], Batch [190/447], Loss: 2.6446
Epoch [28/60], Batch [200/447], Loss: 2.6706
Epoch [28/60], Batch [210/447], Loss: 2.5501
Epoch [28/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [29/60], Batch [0/447], Loss: 2.9783
Epoch [29/60], Batch [10/447], Loss: 1.9963
Epoch [29/60], Batch [20/447], Loss: 2.3832
Epoch [29/60], Batch [30/447], Loss: 2.2472
Epoch [29/60], Batch [40/447], Loss: 2.5847
Epoch [29/60], Batch [50/447], Loss: 2.3821
Epoch [29/60], Batch [60/447], Loss: 2.6987
Epoch [29/60], Batch [70/447], Loss: 2.5063
Epoch [29/60], Batch [80/447], Loss: 2.2699
Epoch [29/60], Batch [90/447], Loss: 2.7226
Epoch [29/60], Batch [100/447], Loss: 2.2046
Epoch [29/60], Batch [110/447], Loss: 2.7801
Epoch [29/60], Batch [120/447], Loss: 2.2141
Epoch [29/60], Batch [130/447], Loss: 1.2956
Epoch [29/60], Batch [140/447], Loss: 2.7717
Epoch [29/60], Batch [150/447], Loss: 2.5859
Epoch [29/60], Batch [160/447], Loss: 2.4951
Epoch [29/60], Batch [170/447], Loss: 2.6395
Epoch [29/60], Batch [180/447], Loss: 2.7295
Epoch [29/60], Batch [190/447], Loss: 2.1210
Epoch [29/60], Batch [200/447], Loss: 2.7036
Epoch [29/60], Batch [210/447], Loss: 2.4119
Epoch [29/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [30/60], Batch [0/447], Loss: 2.5394
Epoch [30/60], Batch [10/447], Loss: 2.2634
Epoch [30/60], Batch [20/447], Loss: 2.6535
Epoch [30/60], Batch [30/447], Loss: 2.2323
Epoch [30/60], Batch [40/447], Loss: 2.3003
Epoch [30/60], Batch [50/447], Loss: 2.5351
Epoch [30/60], Batch [60/447], Loss: 2.8663
Epoch [30/60], Batch [70/447], Loss: 2.2974
Epoch [30/60], Batch [80/447], Loss: 2.3798
Epoch [30/60], Batch [90/447], Loss: 2.1475
Epoch [30/60], Batch [100/447], Loss: 2.3213
Epoch [30/60], Batch [110/447], Loss: 2.1671
Epoch [30/60], Batch [120/447], Loss: 1.8000
Epoch [30/60], Batch [130/447], Loss: 2.7231
Epoch [30/60], Batch [140/447], Loss: 2.6806
Epoch [30/60], Batch [150/447], Loss: 2.0738
Epoch [30/60], Batch [160/447], Loss: 2.6221
Epoch [30/60], Batch [170/447], Loss: 2.6078
Epoch [30/60], Batch [180/447], Loss: 2.8765
Epoch [30/60], Batch [190/447], Loss: 2.1663
Epoch [30/60], Batch [200/447], Loss: 1.9936
Epoch [30/60], Batch [210/447], Loss: 2.2960
Epoch [30/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [31/60], Batch [0/447], Loss: 2.6190
Epoch [31/60], Batch [10/447], Loss: 2.4501
Epoch [31/60], Batch [20/447], Loss: 2.5054
Epoch [31/60], Batch [30/447], Loss: 2.5297
Epoch [31/60], Batch [40/447], Loss: 1.6659
Epoch [31/60], Batch [50/447], Loss: 2.3692
Epoch [31/60], Batch [60/447], Loss: 2.1770
Epoch [31/60], Batch [70/447], Loss: 2.1235
Epoch [31/60], Batch [80/447], Loss: 2.5662
Epoch [31/60], Batch [90/447], Loss: 2.9110
Epoch [31/60], Batch [100/447], Loss: 2.6488
Epoch [31/60], Batch [110/447], Loss: 2.5587
Epoch [31/60], Batch [120/447], Loss: 2.4000
Epoch [31/60], Batch [130/447], Loss: 2.2528
Epoch [31/60], Batch [140/447], Loss: 2.0330
Epoch [31/60], Batch [150/447], Loss: 2.4342
Epoch [31/60], Batch [160/447], Loss: 2.5727
Epoch [31/60], Batch [170/447], Loss: 2.2107
Epoch [31/60], Batch [180/447], Loss: 1.6664
Epoch [31/60], Batch [190/447], Loss: 2.4752
Epoch [31/60], Batch [200/447], Loss: 2.9240
Epoch [31/60], Batch [210/447], Loss: 1.6371
Epoch [31/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [32/60], Batch [0/447], Loss: 2.6149
Epoch [32/60], Batch [10/447], Loss: 3.1156
Epoch [32/60], Batch [20/447], Loss: 2.0171
Epoch [32/60], Batch [30/447], Loss: 2.2175
Epoch [32/60], Batch [40/447], Loss: 2.5805
Epoch [32/60], Batch [50/447], Loss: 2.2076
Epoch [32/60], Batch [60/447], Loss: 1.6494
Epoch [32/60], Batch [70/447], Loss: 2.3645
Epoch [32/60], Batch [80/447], Loss: 2.4493
Epoch [32/60], Batch [90/447], Loss: 2.6768
Epoch [32/60], Batch [100/447], Loss: 1.9281
Epoch [32/60], Batch [110/447], Loss: 1.9108
Epoch [32/60], Batch [120/447], Loss: 2.4417
Epoch [32/60], Batch [130/447], Loss: 2.4889
Epoch [32/60], Batch [140/447], Loss: 2.5073
Epoch [32/60], Batch [150/447], Loss: 2.5604
Epoch [32/60], Batch [160/447], Loss: 2.0630
Epoch [32/60], Batch [170/447], Loss: 1.9866
Epoch [32/60], Batch [180/447], Loss: 2.7201
Epoch [32/60], Batch [190/447], Loss: 2.7408
Epoch [32/60], Batch [200/447], Loss: 1.8998
Epoch [32/60], Batch [210/447], Loss: 2.4279
Epoch [32/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [33/60], Batch [0/447], Loss: 2.1023
Epoch [33/60], Batch [10/447], Loss: 2.1407
Epoch [33/60], Batch [20/447], Loss: 2.7603
Epoch [33/60], Batch [30/447], Loss: 1.5635
Epoch [33/60], Batch [40/447], Loss: 2.3260
Epoch [33/60], Batch [50/447], Loss: 2.6713
Epoch [33/60], Batch [60/447], Loss: 2.8452
Epoch [33/60], Batch [70/447], Loss: 2.3316
Epoch [33/60], Batch [80/447], Loss: 2.0717
Epoch [33/60], Batch [90/447], Loss: 2.8197
Epoch [33/60], Batch [100/447], Loss: 2.4278
Epoch [33/60], Batch [110/447], Loss: 2.0189
Epoch [33/60], Batch [120/447], Loss: 2.4511
Epoch [33/60], Batch [130/447], Loss: 2.7022
Epoch [33/60], Batch [140/447], Loss: 2.2632
Epoch [33/60], Batch [150/447], Loss: 2.5793
Epoch [33/60], Batch [160/447], Loss: 2.1792
Epoch [33/60], Batch [170/447], Loss: 1.8842
Epoch [33/60], Batch [180/447], Loss: 2.5505
Epoch [33/60], Batch [190/447], Loss: 2.4205
Epoch [33/60], Batch [200/447], Loss: 2.6472
Epoch [33/60], Batch [210/447], Loss: 2.6192
Epoch [33/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [34/60], Batch [0/447], Loss: 2.4267
Epoch [34/60], Batch [10/447], Loss: 2.3731
Epoch [34/60], Batch [20/447], Loss: 2.2351
Epoch [34/60], Batch [30/447], Loss: 2.7264
Epoch [34/60], Batch [40/447], Loss: 3.2329
Epoch [34/60], Batch [50/447], Loss: 2.4632
Epoch [34/60], Batch [60/447], Loss: 2.2161
Epoch [34/60], Batch [70/447], Loss: 2.2964
Epoch [34/60], Batch [80/447], Loss: 2.8304
Epoch [34/60], Batch [90/447], Loss: 2.5721
Epoch [34/60], Batch [100/447], Loss: 2.2127
Epoch [34/60], Batch [110/447], Loss: 2.5349
Epoch [34/60], Batch [120/447], Loss: 1.4039
Epoch [34/60], Batch [130/447], Loss: 2.1586
Epoch [34/60], Batch [140/447], Loss: 2.7022
Epoch [34/60], Batch [150/447], Loss: 2.2574
Epoch [34/60], Batch [160/447], Loss: 2.4290
Epoch [34/60], Batch [170/447], Loss: 2.2301
Epoch [34/60], Batch [180/447], Loss: 2.7184
Epoch [34/60], Batch [190/447], Loss: 2.0022
Epoch [34/60], Batch [200/447], Loss: 2.6840
Epoch [34/60], Batch [210/447], Loss: 1.7503
Epoch [34/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [35/60], Batch [0/447], Loss: 2.3585
Epoch [35/60], Batch [10/447], Loss: 2.2137
Epoch [35/60], Batch [20/447], Loss: 2.4492
Epoch [35/60], Batch [30/447], Loss: 2.6764
Epoch [35/60], Batch [40/447], Loss: 2.7276
Epoch [35/60], Batch [50/447], Loss: 1.7013
Epoch [35/60], Batch [60/447], Loss: 1.6042
Epoch [35/60], Batch [70/447], Loss: 2.3800
Epoch [35/60], Batch [80/447], Loss: 1.9145
Epoch [35/60], Batch [90/447], Loss: 2.3870
Epoch [35/60], Batch [100/447], Loss: 2.2974
Epoch [35/60], Batch [110/447], Loss: 2.7550
Epoch [35/60], Batch [120/447], Loss: 1.8384
Epoch [35/60], Batch [130/447], Loss: 2.3714
Epoch [35/60], Batch [140/447], Loss: 1.8318
Epoch [35/60], Batch [150/447], Loss: 2.3412
Epoch [35/60], Batch [160/447], Loss: 2.4670
Epoch [35/60], Batch [170/447], Loss: 2.1944
Epoch [35/60], Batch [180/447], Loss: 1.2570
Epoch [35/60], Batch [190/447], Loss: 2.7541
Epoch [35/60], Batch [200/447], Loss: 3.0129
Epoch [35/60], Batch [210/447], Loss: 1.3398
Epoch [35/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [36/60], Batch [0/447], Loss: 1.9680
Epoch [36/60], Batch [10/447], Loss: 1.9890
Epoch [36/60], Batch [20/447], Loss: 2.0606
Epoch [36/60], Batch [30/447], Loss: 2.5590
Epoch [36/60], Batch [40/447], Loss: 1.8825
Epoch [36/60], Batch [50/447], Loss: 2.6392
Epoch [36/60], Batch [60/447], Loss: 2.4682
Epoch [36/60], Batch [70/447], Loss: 1.9844
Epoch [36/60], Batch [80/447], Loss: 2.6650
Epoch [36/60], Batch [90/447], Loss: 2.2638
Epoch [36/60], Batch [100/447], Loss: 1.9514
Epoch [36/60], Batch [110/447], Loss: 2.6760
Epoch [36/60], Batch [120/447], Loss: 2.1065
Epoch [36/60], Batch [130/447], Loss: 2.9174
Epoch [36/60], Batch [140/447], Loss: 2.8999
Epoch [36/60], Batch [150/447], Loss: 2.6069
Epoch [36/60], Batch [160/447], Loss: 2.2435
Epoch [36/60], Batch [170/447], Loss: 2.8020
Epoch [36/60], Batch [180/447], Loss: 1.9990
Epoch [36/60], Batch [190/447], Loss: 2.4310
Epoch [36/60], Batch [200/447], Loss: 2.1551
Epoch [36/60], Batch [210/447], Loss: 2.2085
Epoch [36/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [37/60], Batch [0/447], Loss: 2.8723
Epoch [37/60], Batch [10/447], Loss: 1.7482
Epoch [37/60], Batch [20/447], Loss: 2.4485
Epoch [37/60], Batch [30/447], Loss: 2.3869
Epoch [37/60], Batch [40/447], Loss: 2.0275
Epoch [37/60], Batch [50/447], Loss: 2.3177
Epoch [37/60], Batch [60/447], Loss: 2.4628
Epoch [37/60], Batch [70/447], Loss: 2.2821
Epoch [37/60], Batch [80/447], Loss: 2.3100
Epoch [37/60], Batch [90/447], Loss: 2.1049
Epoch [37/60], Batch [100/447], Loss: 1.8945
Epoch [37/60], Batch [110/447], Loss: 2.3258
Epoch [37/60], Batch [120/447], Loss: 2.5029
Epoch [37/60], Batch [130/447], Loss: 1.4571
Epoch [37/60], Batch [140/447], Loss: 1.9006
Epoch [37/60], Batch [150/447], Loss: 2.8437
Epoch [37/60], Batch [160/447], Loss: 2.0723
Epoch [37/60], Batch [170/447], Loss: 2.2121
Epoch [37/60], Batch [180/447], Loss: 2.7380
Epoch [37/60], Batch [190/447], Loss: 2.5070
Epoch [37/60], Batch [200/447], Loss: 2.7065
Epoch [37/60], Batch [210/447], Loss: 2.4009
Epoch [37/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [38/60], Batch [0/447], Loss: 2.3281
Epoch [38/60], Batch [10/447], Loss: 2.1248
Epoch [38/60], Batch [20/447], Loss: 2.2110
Epoch [38/60], Batch [30/447], Loss: 2.7481
Epoch [38/60], Batch [40/447], Loss: 2.3628
Epoch [38/60], Batch [50/447], Loss: 1.9810
Epoch [38/60], Batch [60/447], Loss: 1.7996
Epoch [38/60], Batch [70/447], Loss: 2.2528
Epoch [38/60], Batch [80/447], Loss: 2.0560
Epoch [38/60], Batch [90/447], Loss: 2.1795
Epoch [38/60], Batch [100/447], Loss: 2.7020
Epoch [38/60], Batch [110/447], Loss: 1.8149
Epoch [38/60], Batch [120/447], Loss: 1.5512
Epoch [38/60], Batch [130/447], Loss: 1.9742
Epoch [38/60], Batch [140/447], Loss: 2.2590
Epoch [38/60], Batch [150/447], Loss: 2.8104
Epoch [38/60], Batch [160/447], Loss: 1.8184
Epoch [38/60], Batch [170/447], Loss: 1.7004
Epoch [38/60], Batch [180/447], Loss: 2.3678
Epoch [38/60], Batch [190/447], Loss: 1.8155
Epoch [38/60], Batch [200/447], Loss: 2.2782
Epoch [38/60], Batch [210/447], Loss: 2.2718
Epoch [38/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [39/60], Batch [0/447], Loss: 1.6525
Epoch [39/60], Batch [10/447], Loss: 2.6407
Epoch [39/60], Batch [20/447], Loss: 2.3725
Epoch [39/60], Batch [30/447], Loss: 1.9865
Epoch [39/60], Batch [40/447], Loss: 2.3689
Epoch [39/60], Batch [50/447], Loss: 1.0800
Epoch [39/60], Batch [60/447], Loss: 2.1483
Epoch [39/60], Batch [70/447], Loss: 2.6933
Epoch [39/60], Batch [80/447], Loss: 2.4829
Epoch [39/60], Batch [90/447], Loss: 2.7294
Epoch [39/60], Batch [100/447], Loss: 2.8395
Epoch [39/60], Batch [110/447], Loss: 2.4838
Epoch [39/60], Batch [120/447], Loss: 2.4144
Epoch [39/60], Batch [130/447], Loss: 2.0552
Epoch [39/60], Batch [140/447], Loss: 2.7996
Epoch [39/60], Batch [150/447], Loss: 1.5596
Epoch [39/60], Batch [160/447], Loss: 2.4795
Epoch [39/60], Batch [170/447], Loss: 2.4767
Epoch [39/60], Batch [180/447], Loss: 2.8013
Epoch [39/60], Batch [190/447], Loss: 2.2465
Epoch [39/60], Batch [200/447], Loss: 2.6960
Epoch [39/60], Batch [210/447], Loss: 2.2077
Epoch [39/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [40/60], Batch [0/447], Loss: 2.6094
Epoch [40/60], Batch [10/447], Loss: 2.4561
Epoch [40/60], Batch [20/447], Loss: 2.3109
Epoch [40/60], Batch [30/447], Loss: 2.2811
Epoch [40/60], Batch [40/447], Loss: 1.9218
Epoch [40/60], Batch [50/447], Loss: 2.4341
Epoch [40/60], Batch [60/447], Loss: 2.3959
Epoch [40/60], Batch [70/447], Loss: 2.9543
Epoch [40/60], Batch [80/447], Loss: 2.3460
Epoch [40/60], Batch [90/447], Loss: 2.1758
Epoch [40/60], Batch [100/447], Loss: 2.2449
Epoch [40/60], Batch [110/447], Loss: 2.9192
Epoch [40/60], Batch [120/447], Loss: 2.3450
Epoch [40/60], Batch [130/447], Loss: 1.9473
Epoch [40/60], Batch [140/447], Loss: 2.0159
Epoch [40/60], Batch [150/447], Loss: 1.8131
Epoch [40/60], Batch [160/447], Loss: 2.2075
Epoch [40/60], Batch [170/447], Loss: 2.1295
Epoch [40/60], Batch [180/447], Loss: 2.1628
Epoch [40/60], Batch [190/447], Loss: 2.3027
Epoch [40/60], Batch [200/447], Loss: 1.3618
Epoch [40/60], Batch [210/447], Loss: 2.9991
Epoch [40/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [41/60], Batch [0/447], Loss: 2.4460
Epoch [41/60], Batch [10/447], Loss: 2.0557
Epoch [41/60], Batch [20/447], Loss: 2.3050
Epoch [41/60], Batch [30/447], Loss: 2.8558
Epoch [41/60], Batch [40/447], Loss: 2.2576
Epoch [41/60], Batch [50/447], Loss: 2.9380
Epoch [41/60], Batch [60/447], Loss: 2.1808
Epoch [41/60], Batch [70/447], Loss: 1.9399
Epoch [41/60], Batch [80/447], Loss: 2.5295
Epoch [41/60], Batch [90/447], Loss: 2.4903
Epoch [41/60], Batch [100/447], Loss: 2.0438
Epoch [41/60], Batch [110/447], Loss: 2.7238
Epoch [41/60], Batch [120/447], Loss: 2.2758
Epoch [41/60], Batch [130/447], Loss: 2.3284
Epoch [41/60], Batch [140/447], Loss: 1.9367
Epoch [41/60], Batch [150/447], Loss: 1.9521
Epoch [41/60], Batch [160/447], Loss: 2.4267
Epoch [41/60], Batch [170/447], Loss: 2.1616
Epoch [41/60], Batch [180/447], Loss: 1.7812
Epoch [41/60], Batch [190/447], Loss: 2.2791
Epoch [41/60], Batch [200/447], Loss: 2.0214
Epoch [41/60], Batch [210/447], Loss: 2.6319
Epoch [41/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [42/60], Batch [0/447], Loss: 2.9237
Epoch [42/60], Batch [10/447], Loss: 1.7647
Epoch [42/60], Batch [20/447], Loss: 2.5378
Epoch [42/60], Batch [30/447], Loss: 2.1067
Epoch [42/60], Batch [40/447], Loss: 2.1576
Epoch [42/60], Batch [50/447], Loss: 2.1737
Epoch [42/60], Batch [60/447], Loss: 2.3738
Epoch [42/60], Batch [70/447], Loss: 2.6430
Epoch [42/60], Batch [80/447], Loss: 2.9449
Epoch [42/60], Batch [90/447], Loss: 2.4842
Epoch [42/60], Batch [100/447], Loss: 2.5228
Epoch [42/60], Batch [110/447], Loss: 2.0328
Epoch [42/60], Batch [120/447], Loss: 2.3912
Epoch [42/60], Batch [130/447], Loss: 1.8375
Epoch [42/60], Batch [140/447], Loss: 2.1656
Epoch [42/60], Batch [150/447], Loss: 2.6852
Epoch [42/60], Batch [160/447], Loss: 2.1640
Epoch [42/60], Batch [170/447], Loss: 2.7660
Epoch [42/60], Batch [180/447], Loss: 2.8026
Epoch [42/60], Batch [190/447], Loss: 2.5479
Epoch [42/60], Batch [200/447], Loss: 2.5180
Epoch [42/60], Batch [210/447], Loss: 2.8297
Epoch [42/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [43/60], Batch [0/447], Loss: 1.7124
Epoch [43/60], Batch [10/447], Loss: 2.6287
Epoch [43/60], Batch [20/447], Loss: 2.3460
Epoch [43/60], Batch [30/447], Loss: 1.9325
Epoch [43/60], Batch [40/447], Loss: 2.0467
Epoch [43/60], Batch [50/447], Loss: 2.6694
Epoch [43/60], Batch [60/447], Loss: 2.5517
Epoch [43/60], Batch [70/447], Loss: 2.2174
Epoch [43/60], Batch [80/447], Loss: 2.2065
Epoch [43/60], Batch [90/447], Loss: 1.6059
Epoch [43/60], Batch [100/447], Loss: 1.9035
Epoch [43/60], Batch [110/447], Loss: 2.1931
Epoch [43/60], Batch [120/447], Loss: 2.1707
Epoch [43/60], Batch [130/447], Loss: 2.0579
Epoch [43/60], Batch [140/447], Loss: 1.9228
Epoch [43/60], Batch [150/447], Loss: 2.4106
Epoch [43/60], Batch [160/447], Loss: 2.3804
Epoch [43/60], Batch [170/447], Loss: 2.7900
Epoch [43/60], Batch [180/447], Loss: 2.5983
Epoch [43/60], Batch [190/447], Loss: 2.2701
Epoch [43/60], Batch [200/447], Loss: 2.4572
Epoch [43/60], Batch [210/447], Loss: 2.2994
Epoch [43/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [44/60], Batch [0/447], Loss: 2.5255
Epoch [44/60], Batch [10/447], Loss: 2.0886
Epoch [44/60], Batch [20/447], Loss: 2.4355
Epoch [44/60], Batch [30/447], Loss: 1.9856
Epoch [44/60], Batch [40/447], Loss: 2.1465
Epoch [44/60], Batch [50/447], Loss: 2.6064
Epoch [44/60], Batch [60/447], Loss: 2.3493
Epoch [44/60], Batch [70/447], Loss: 2.3707
Epoch [44/60], Batch [80/447], Loss: 2.4758
Epoch [44/60], Batch [90/447], Loss: 2.7503
Epoch [44/60], Batch [100/447], Loss: 2.5795
Epoch [44/60], Batch [110/447], Loss: 2.1453
Epoch [44/60], Batch [120/447], Loss: 2.5715
Epoch [44/60], Batch [130/447], Loss: 2.2512
Epoch [44/60], Batch [140/447], Loss: 2.2397
Epoch [44/60], Batch [150/447], Loss: 2.0360
Epoch [44/60], Batch [160/447], Loss: 2.6652
Epoch [44/60], Batch [170/447], Loss: 1.7878
Epoch [44/60], Batch [180/447], Loss: 2.1366
Epoch [44/60], Batch [190/447], Loss: 2.7678
Epoch [44/60], Batch [200/447], Loss: 2.1204
Epoch [44/60], Batch [210/447], Loss: 1.7002
Epoch [44/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [45/60], Batch [0/447], Loss: 2.5867
Epoch [45/60], Batch [10/447], Loss: 2.2354
Epoch [45/60], Batch [20/447], Loss: 2.0021
Epoch [45/60], Batch [30/447], Loss: 1.9830
Epoch [45/60], Batch [40/447], Loss: 2.4088
Epoch [45/60], Batch [50/447], Loss: 2.8421
Epoch [45/60], Batch [60/447], Loss: 1.8127
Epoch [45/60], Batch [70/447], Loss: 2.4260
Epoch [45/60], Batch [80/447], Loss: 1.9740
Epoch [45/60], Batch [90/447], Loss: 1.3036
Epoch [45/60], Batch [100/447], Loss: 2.7415
Epoch [45/60], Batch [110/447], Loss: 2.7225
Epoch [45/60], Batch [120/447], Loss: 2.6449
Epoch [45/60], Batch [130/447], Loss: 2.2206
Epoch [45/60], Batch [140/447], Loss: 2.2863
Epoch [45/60], Batch [150/447], Loss: 2.0053
Epoch [45/60], Batch [160/447], Loss: 2.3346
Epoch [45/60], Batch [170/447], Loss: 2.0772
Epoch [45/60], Batch [180/447], Loss: 1.9624
Epoch [45/60], Batch [190/447], Loss: 2.5227
Epoch [45/60], Batch [200/447], Loss: 2.1030
Epoch [45/60], Batch [210/447], Loss: 1.4851
Epoch [45/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [46/60], Batch [0/447], Loss: 2.2322
Epoch [46/60], Batch [10/447], Loss: 2.4299
Epoch [46/60], Batch [20/447], Loss: 1.6430
Epoch [46/60], Batch [30/447], Loss: 1.9739
Epoch [46/60], Batch [40/447], Loss: 1.8982
Epoch [46/60], Batch [50/447], Loss: 1.5541
Epoch [46/60], Batch [60/447], Loss: 2.5026
Epoch [46/60], Batch [70/447], Loss: 2.3081
Epoch [46/60], Batch [80/447], Loss: 2.6150
Epoch [46/60], Batch [90/447], Loss: 2.5055
Epoch [46/60], Batch [100/447], Loss: 2.2792
Epoch [46/60], Batch [110/447], Loss: 2.1430
Epoch [46/60], Batch [120/447], Loss: 2.3501
Epoch [46/60], Batch [130/447], Loss: 1.7837
Epoch [46/60], Batch [140/447], Loss: 2.2018
Epoch [46/60], Batch [150/447], Loss: 2.7058
Epoch [46/60], Batch [160/447], Loss: 1.8307
Epoch [46/60], Batch [170/447], Loss: 2.2450
Epoch [46/60], Batch [180/447], Loss: 1.9922
Epoch [46/60], Batch [190/447], Loss: 1.7294
Epoch [46/60], Batch [200/447], Loss: 2.3460
Epoch [46/60], Batch [210/447], Loss: 1.4622
Epoch [46/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [47/60], Batch [0/447], Loss: 1.9670
Epoch [47/60], Batch [10/447], Loss: 2.3747
Epoch [47/60], Batch [20/447], Loss: 1.4828
Epoch [47/60], Batch [30/447], Loss: 1.3846
Epoch [47/60], Batch [40/447], Loss: 2.4741
Epoch [47/60], Batch [50/447], Loss: 2.5328
Epoch [47/60], Batch [60/447], Loss: 2.2461
Epoch [47/60], Batch [70/447], Loss: 2.4546
Epoch [47/60], Batch [80/447], Loss: 2.4884
Epoch [47/60], Batch [90/447], Loss: 1.7583
Epoch [47/60], Batch [100/447], Loss: 2.6335
Epoch [47/60], Batch [110/447], Loss: 2.3559
Epoch [47/60], Batch [120/447], Loss: 2.3373
Epoch [47/60], Batch [130/447], Loss: 1.5928
Epoch [47/60], Batch [140/447], Loss: 1.9107
Epoch [47/60], Batch [150/447], Loss: 2.3913
Epoch [47/60], Batch [160/447], Loss: 2.2574
Epoch [47/60], Batch [170/447], Loss: 1.7516
Epoch [47/60], Batch [180/447], Loss: 2.7509
Epoch [47/60], Batch [190/447], Loss: 2.2522
Epoch [47/60], Batch [200/447], Loss: 2.2495
Epoch [47/60], Batch [210/447], Loss: 2.2640
Epoch [47/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [48/60], Batch [0/447], Loss: 1.9583
Epoch [48/60], Batch [10/447], Loss: 2.4099
Epoch [48/60], Batch [20/447], Loss: 2.2458
Epoch [48/60], Batch [30/447], Loss: 2.1526
Epoch [48/60], Batch [40/447], Loss: 2.4654
Epoch [48/60], Batch [50/447], Loss: 2.3242
Epoch [48/60], Batch [60/447], Loss: 2.1878
Epoch [48/60], Batch [70/447], Loss: 1.7013
Epoch [48/60], Batch [80/447], Loss: 2.3585
Epoch [48/60], Batch [90/447], Loss: 1.9422
Epoch [48/60], Batch [100/447], Loss: 1.8702
Epoch [48/60], Batch [110/447], Loss: 1.4786
Epoch [48/60], Batch [120/447], Loss: 1.9485
Epoch [48/60], Batch [130/447], Loss: 1.9746
Epoch [48/60], Batch [140/447], Loss: 2.6919
Epoch [48/60], Batch [150/447], Loss: 2.3684
Epoch [48/60], Batch [160/447], Loss: 2.3281
Epoch [48/60], Batch [170/447], Loss: 2.3270
Epoch [48/60], Batch [180/447], Loss: 2.7969
Epoch [48/60], Batch [190/447], Loss: 2.3179
Epoch [48/60], Batch [200/447], Loss: 2.9752
Epoch [48/60], Batch [210/447], Loss: 2.7184
Epoch [48/60], Batch 

[I 2024-12-13 07:19:15,146] Trial 2 pruned. 


Epoch [48/60], Validation Accuracy: 0.7288, Validation Loss: 1.0200
No improvement in validation accuracy for 5 epoch(s).
Early stopping at epoch 48.
Trial early stopped due to lack of improvement.
Starting a new trial...
Trial 3: alpha = 7.34674002393291
Building the model...


2024-12-13 07:19:15,487 - mmaction - INFO - load model from: https://download.openmmlab.com/mmaction/recognition/csn/ircsn_from_scratch_r50_ig65m_20210617-ce545a37.pth
2024-12-13 07:19:15,488 - mmaction - INFO - load checkpoint from http path: https://download.openmmlab.com/mmaction/recognition/csn/ircsn_from_scratch_r50_ig65m_20210617-ce545a37.pth


Model built successfully!
Starting training...


  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [1/60], Batch [0/447], Loss: 3.9179
Epoch [1/60], Batch [10/447], Loss: 3.9754
Epoch [1/60], Batch [20/447], Loss: 3.9425
Epoch [1/60], Batch [30/447], Loss: 3.9369
Epoch [1/60], Batch [40/447], Loss: 4.0078
Epoch [1/60], Batch [50/447], Loss: 3.9467
Epoch [1/60], Batch [60/447], Loss: 3.9588
Epoch [1/60], Batch [70/447], Loss: 3.9377
Epoch [1/60], Batch [80/447], Loss: 3.9102
Epoch [1/60], Batch [90/447], Loss: 3.9084
Epoch [1/60], Batch [100/447], Loss: 3.9397
Epoch [1/60], Batch [110/447], Loss: 4.0436
Epoch [1/60], Batch [120/447], Loss: 4.0511
Epoch [1/60], Batch [130/447], Loss: 3.9700
Epoch [1/60], Batch [140/447], Loss: 3.9194
Epoch [1/60], Batch [150/447], Loss: 3.9952
Epoch [1/60], Batch [160/447], Loss: 3.9512
Epoch [1/60], Batch [170/447], Loss: 3.9676
Epoch [1/60], Batch [180/447], Loss: 3.9557
Epoch [1/60], Batch [190/447], Loss: 3.9694
Epoch [1/60], Batch [200/447], Loss: 3.9846
Epoch [1/60], Batch [210/447], Loss: 3.9477
Epoch [1/60], Batch [220/447], Loss: 3.8709

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [2/60], Batch [0/447], Loss: 3.8981
Epoch [2/60], Batch [10/447], Loss: 3.7229
Epoch [2/60], Batch [20/447], Loss: 3.8156
Epoch [2/60], Batch [30/447], Loss: 3.9581
Epoch [2/60], Batch [40/447], Loss: 3.9843
Epoch [2/60], Batch [50/447], Loss: 3.8527
Epoch [2/60], Batch [60/447], Loss: 3.8367
Epoch [2/60], Batch [70/447], Loss: 3.8731
Epoch [2/60], Batch [80/447], Loss: 3.8067
Epoch [2/60], Batch [90/447], Loss: 3.9146
Epoch [2/60], Batch [100/447], Loss: 3.7639
Epoch [2/60], Batch [110/447], Loss: 4.0464
Epoch [2/60], Batch [120/447], Loss: 3.6585
Epoch [2/60], Batch [130/447], Loss: 3.8642
Epoch [2/60], Batch [140/447], Loss: 3.7507
Epoch [2/60], Batch [150/447], Loss: 4.0357
Epoch [2/60], Batch [160/447], Loss: 3.9014
Epoch [2/60], Batch [170/447], Loss: 3.8718
Epoch [2/60], Batch [180/447], Loss: 3.8973
Epoch [2/60], Batch [190/447], Loss: 3.8502
Epoch [2/60], Batch [200/447], Loss: 3.8629
Epoch [2/60], Batch [210/447], Loss: 3.6836
Epoch [2/60], Batch [220/447], Loss: 3.7374

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [3/60], Batch [0/447], Loss: 3.8236
Epoch [3/60], Batch [10/447], Loss: 3.8445
Epoch [3/60], Batch [20/447], Loss: 3.8392
Epoch [3/60], Batch [30/447], Loss: 3.7548
Epoch [3/60], Batch [40/447], Loss: 3.6819
Epoch [3/60], Batch [50/447], Loss: 3.7892
Epoch [3/60], Batch [60/447], Loss: 3.7028
Epoch [3/60], Batch [70/447], Loss: 3.6480
Epoch [3/60], Batch [80/447], Loss: 3.7999
Epoch [3/60], Batch [90/447], Loss: 3.8216
Epoch [3/60], Batch [100/447], Loss: 3.6452
Epoch [3/60], Batch [110/447], Loss: 3.6719
Epoch [3/60], Batch [120/447], Loss: 3.7671
Epoch [3/60], Batch [130/447], Loss: 3.8846
Epoch [3/60], Batch [140/447], Loss: 3.6213
Epoch [3/60], Batch [150/447], Loss: 3.7038
Epoch [3/60], Batch [160/447], Loss: 3.9341
Epoch [3/60], Batch [170/447], Loss: 4.0289
Epoch [3/60], Batch [180/447], Loss: 3.9142
Epoch [3/60], Batch [190/447], Loss: 3.6702
Epoch [3/60], Batch [200/447], Loss: 3.4869
Epoch [3/60], Batch [210/447], Loss: 3.7255
Epoch [3/60], Batch [220/447], Loss: 3.6892

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [4/60], Batch [0/447], Loss: 3.4240
Epoch [4/60], Batch [10/447], Loss: 3.5688
Epoch [4/60], Batch [20/447], Loss: 3.8267
Epoch [4/60], Batch [30/447], Loss: 3.5622
Epoch [4/60], Batch [40/447], Loss: 3.6543
Epoch [4/60], Batch [50/447], Loss: 3.7295
Epoch [4/60], Batch [60/447], Loss: 3.4694
Epoch [4/60], Batch [70/447], Loss: 3.8302
Epoch [4/60], Batch [80/447], Loss: 3.8758
Epoch [4/60], Batch [90/447], Loss: 3.7035
Epoch [4/60], Batch [100/447], Loss: 3.4757
Epoch [4/60], Batch [110/447], Loss: 3.8681
Epoch [4/60], Batch [120/447], Loss: 3.5481
Epoch [4/60], Batch [130/447], Loss: 3.6960
Epoch [4/60], Batch [140/447], Loss: 3.6461
Epoch [4/60], Batch [150/447], Loss: 3.5786
Epoch [4/60], Batch [160/447], Loss: 3.6849
Epoch [4/60], Batch [170/447], Loss: 3.7817
Epoch [4/60], Batch [180/447], Loss: 3.5969
Epoch [4/60], Batch [190/447], Loss: 3.2745
Epoch [4/60], Batch [200/447], Loss: 3.5647
Epoch [4/60], Batch [210/447], Loss: 3.6771
Epoch [4/60], Batch [220/447], Loss: 3.6515

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [5/60], Batch [0/447], Loss: 3.7236
Epoch [5/60], Batch [10/447], Loss: 3.3161
Epoch [5/60], Batch [20/447], Loss: 3.6577
Epoch [5/60], Batch [30/447], Loss: 3.6550
Epoch [5/60], Batch [40/447], Loss: 3.4565
Epoch [5/60], Batch [50/447], Loss: 3.8693
Epoch [5/60], Batch [60/447], Loss: 3.4460
Epoch [5/60], Batch [70/447], Loss: 3.4974
Epoch [5/60], Batch [80/447], Loss: 3.2610
Epoch [5/60], Batch [90/447], Loss: 3.6172
Epoch [5/60], Batch [100/447], Loss: 3.5887
Epoch [5/60], Batch [110/447], Loss: 3.5972
Epoch [5/60], Batch [120/447], Loss: 3.4635
Epoch [5/60], Batch [130/447], Loss: 3.2370
Epoch [5/60], Batch [140/447], Loss: 3.3950
Epoch [5/60], Batch [150/447], Loss: 3.6171
Epoch [5/60], Batch [160/447], Loss: 3.4568
Epoch [5/60], Batch [170/447], Loss: 3.5036
Epoch [5/60], Batch [180/447], Loss: 3.4638
Epoch [5/60], Batch [190/447], Loss: 3.5917
Epoch [5/60], Batch [200/447], Loss: 3.6572
Epoch [5/60], Batch [210/447], Loss: 3.4446
Epoch [5/60], Batch [220/447], Loss: 3.8629

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [6/60], Batch [0/447], Loss: 3.6091
Epoch [6/60], Batch [10/447], Loss: 3.7250
Epoch [6/60], Batch [20/447], Loss: 3.5922
Epoch [6/60], Batch [30/447], Loss: 3.5769
Epoch [6/60], Batch [40/447], Loss: 3.2698
Epoch [6/60], Batch [50/447], Loss: 3.2833
Epoch [6/60], Batch [60/447], Loss: 3.3349
Epoch [6/60], Batch [70/447], Loss: 3.3691
Epoch [6/60], Batch [80/447], Loss: 3.7050
Epoch [6/60], Batch [90/447], Loss: 3.7202
Epoch [6/60], Batch [100/447], Loss: 3.6235
Epoch [6/60], Batch [110/447], Loss: 2.9397
Epoch [6/60], Batch [120/447], Loss: 3.5215
Epoch [6/60], Batch [130/447], Loss: 3.3955
Epoch [6/60], Batch [140/447], Loss: 3.4743
Epoch [6/60], Batch [150/447], Loss: 3.6695
Epoch [6/60], Batch [160/447], Loss: 3.6559
Epoch [6/60], Batch [170/447], Loss: 3.2094
Epoch [6/60], Batch [180/447], Loss: 3.2816
Epoch [6/60], Batch [190/447], Loss: 3.5724
Epoch [6/60], Batch [200/447], Loss: 3.7916
Epoch [6/60], Batch [210/447], Loss: 3.2701
Epoch [6/60], Batch [220/447], Loss: 3.5410

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [7/60], Batch [0/447], Loss: 3.1739
Epoch [7/60], Batch [10/447], Loss: 3.5468
Epoch [7/60], Batch [20/447], Loss: 3.1154
Epoch [7/60], Batch [30/447], Loss: 2.9967
Epoch [7/60], Batch [40/447], Loss: 3.7165
Epoch [7/60], Batch [50/447], Loss: 3.4411
Epoch [7/60], Batch [60/447], Loss: 3.3783
Epoch [7/60], Batch [70/447], Loss: 3.5266
Epoch [7/60], Batch [80/447], Loss: 3.3049
Epoch [7/60], Batch [90/447], Loss: 3.5833
Epoch [7/60], Batch [100/447], Loss: 3.4857
Epoch [7/60], Batch [110/447], Loss: 3.4752
Epoch [7/60], Batch [120/447], Loss: 3.4573
Epoch [7/60], Batch [130/447], Loss: 3.5095
Epoch [7/60], Batch [140/447], Loss: 3.7991
Epoch [7/60], Batch [150/447], Loss: 3.2304
Epoch [7/60], Batch [160/447], Loss: 3.4262
Epoch [7/60], Batch [170/447], Loss: 3.4851
Epoch [7/60], Batch [180/447], Loss: 2.8650
Epoch [7/60], Batch [190/447], Loss: 3.3929
Epoch [7/60], Batch [200/447], Loss: 3.6105
Epoch [7/60], Batch [210/447], Loss: 3.6735
Epoch [7/60], Batch [220/447], Loss: 3.0666

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [8/60], Batch [0/447], Loss: 3.2927
Epoch [8/60], Batch [10/447], Loss: 3.2018
Epoch [8/60], Batch [20/447], Loss: 3.5682
Epoch [8/60], Batch [30/447], Loss: 3.3527
Epoch [8/60], Batch [40/447], Loss: 3.4177
Epoch [8/60], Batch [50/447], Loss: 2.8841
Epoch [8/60], Batch [60/447], Loss: 3.4303
Epoch [8/60], Batch [70/447], Loss: 3.3654
Epoch [8/60], Batch [80/447], Loss: 3.2945
Epoch [8/60], Batch [90/447], Loss: 3.4675
Epoch [8/60], Batch [100/447], Loss: 2.9372
Epoch [8/60], Batch [110/447], Loss: 2.9217
Epoch [8/60], Batch [120/447], Loss: 3.3889
Epoch [8/60], Batch [130/447], Loss: 3.5990
Epoch [8/60], Batch [140/447], Loss: 2.7253
Epoch [8/60], Batch [150/447], Loss: 3.5291
Epoch [8/60], Batch [160/447], Loss: 3.1250
Epoch [8/60], Batch [170/447], Loss: 2.9469
Epoch [8/60], Batch [180/447], Loss: 3.6432
Epoch [8/60], Batch [190/447], Loss: 3.2696
Epoch [8/60], Batch [200/447], Loss: 3.3616
Epoch [8/60], Batch [210/447], Loss: 2.7711
Epoch [8/60], Batch [220/447], Loss: 3.5980

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [9/60], Batch [0/447], Loss: 3.6075
Epoch [9/60], Batch [10/447], Loss: 3.1277
Epoch [9/60], Batch [20/447], Loss: 3.1376
Epoch [9/60], Batch [30/447], Loss: 3.2794
Epoch [9/60], Batch [40/447], Loss: 3.7306
Epoch [9/60], Batch [50/447], Loss: 3.0731
Epoch [9/60], Batch [60/447], Loss: 3.5512
Epoch [9/60], Batch [70/447], Loss: 3.2110
Epoch [9/60], Batch [80/447], Loss: 3.1186
Epoch [9/60], Batch [90/447], Loss: 3.3668
Epoch [9/60], Batch [100/447], Loss: 2.8156
Epoch [9/60], Batch [110/447], Loss: 3.3384
Epoch [9/60], Batch [120/447], Loss: 3.3192
Epoch [9/60], Batch [130/447], Loss: 3.2890
Epoch [9/60], Batch [140/447], Loss: 3.3279
Epoch [9/60], Batch [150/447], Loss: 3.2918
Epoch [9/60], Batch [160/447], Loss: 3.6275
Epoch [9/60], Batch [170/447], Loss: 3.0870
Epoch [9/60], Batch [180/447], Loss: 3.5064
Epoch [9/60], Batch [190/447], Loss: 3.2608
Epoch [9/60], Batch [200/447], Loss: 3.5594
Epoch [9/60], Batch [210/447], Loss: 3.5092
Epoch [9/60], Batch [220/447], Loss: 3.0817

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [10/60], Batch [0/447], Loss: 3.2984
Epoch [10/60], Batch [10/447], Loss: 3.6598
Epoch [10/60], Batch [20/447], Loss: 3.1883
Epoch [10/60], Batch [30/447], Loss: 3.3569
Epoch [10/60], Batch [40/447], Loss: 3.2356
Epoch [10/60], Batch [50/447], Loss: 3.2526
Epoch [10/60], Batch [60/447], Loss: 3.2438
Epoch [10/60], Batch [70/447], Loss: 3.3823
Epoch [10/60], Batch [80/447], Loss: 3.5362
Epoch [10/60], Batch [90/447], Loss: 3.0959
Epoch [10/60], Batch [100/447], Loss: 3.4021
Epoch [10/60], Batch [110/447], Loss: 2.6297
Epoch [10/60], Batch [120/447], Loss: 3.2659
Epoch [10/60], Batch [130/447], Loss: 3.3773
Epoch [10/60], Batch [140/447], Loss: 3.0551
Epoch [10/60], Batch [150/447], Loss: 3.3740
Epoch [10/60], Batch [160/447], Loss: 2.9380
Epoch [10/60], Batch [170/447], Loss: 3.0973
Epoch [10/60], Batch [180/447], Loss: 3.1028
Epoch [10/60], Batch [190/447], Loss: 3.2313
Epoch [10/60], Batch [200/447], Loss: 3.3638
Epoch [10/60], Batch [210/447], Loss: 2.6944
Epoch [10/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [11/60], Batch [0/447], Loss: 2.9877
Epoch [11/60], Batch [10/447], Loss: 3.4814
Epoch [11/60], Batch [20/447], Loss: 3.3363
Epoch [11/60], Batch [30/447], Loss: 3.3316
Epoch [11/60], Batch [40/447], Loss: 2.8049
Epoch [11/60], Batch [50/447], Loss: 3.3623
Epoch [11/60], Batch [60/447], Loss: 3.2897
Epoch [11/60], Batch [70/447], Loss: 3.1845
Epoch [11/60], Batch [80/447], Loss: 2.9685
Epoch [11/60], Batch [90/447], Loss: 2.8558
Epoch [11/60], Batch [100/447], Loss: 3.3280
Epoch [11/60], Batch [110/447], Loss: 3.1795
Epoch [11/60], Batch [120/447], Loss: 2.9971
Epoch [11/60], Batch [130/447], Loss: 2.7907
Epoch [11/60], Batch [140/447], Loss: 3.0715
Epoch [11/60], Batch [150/447], Loss: 3.2504
Epoch [11/60], Batch [160/447], Loss: 3.2517
Epoch [11/60], Batch [170/447], Loss: 2.9583
Epoch [11/60], Batch [180/447], Loss: 3.5387
Epoch [11/60], Batch [190/447], Loss: 3.4635
Epoch [11/60], Batch [200/447], Loss: 3.0678
Epoch [11/60], Batch [210/447], Loss: 2.9489
Epoch [11/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [12/60], Batch [0/447], Loss: 3.1535
Epoch [12/60], Batch [10/447], Loss: 2.7190
Epoch [12/60], Batch [20/447], Loss: 3.6576
Epoch [12/60], Batch [30/447], Loss: 2.7195
Epoch [12/60], Batch [40/447], Loss: 3.4234
Epoch [12/60], Batch [50/447], Loss: 2.7841
Epoch [12/60], Batch [60/447], Loss: 2.8039
Epoch [12/60], Batch [70/447], Loss: 3.1913
Epoch [12/60], Batch [80/447], Loss: 3.1843
Epoch [12/60], Batch [90/447], Loss: 3.0103
Epoch [12/60], Batch [100/447], Loss: 3.5278
Epoch [12/60], Batch [110/447], Loss: 3.0692
Epoch [12/60], Batch [120/447], Loss: 3.2864
Epoch [12/60], Batch [130/447], Loss: 3.4727
Epoch [12/60], Batch [140/447], Loss: 3.4958
Epoch [12/60], Batch [150/447], Loss: 2.9098
Epoch [12/60], Batch [160/447], Loss: 2.9182
Epoch [12/60], Batch [170/447], Loss: 3.1713
Epoch [12/60], Batch [180/447], Loss: 2.9615
Epoch [12/60], Batch [190/447], Loss: 3.2397
Epoch [12/60], Batch [200/447], Loss: 3.4665
Epoch [12/60], Batch [210/447], Loss: 3.2954
Epoch [12/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [13/60], Batch [0/447], Loss: 3.1193
Epoch [13/60], Batch [10/447], Loss: 3.1633
Epoch [13/60], Batch [20/447], Loss: 3.1634
Epoch [13/60], Batch [30/447], Loss: 2.9486
Epoch [13/60], Batch [40/447], Loss: 3.1605
Epoch [13/60], Batch [50/447], Loss: 2.8876
Epoch [13/60], Batch [60/447], Loss: 3.7613
Epoch [13/60], Batch [70/447], Loss: 3.2213
Epoch [13/60], Batch [80/447], Loss: 3.2853
Epoch [13/60], Batch [90/447], Loss: 3.4576
Epoch [13/60], Batch [100/447], Loss: 3.1138
Epoch [13/60], Batch [110/447], Loss: 3.2426
Epoch [13/60], Batch [120/447], Loss: 3.2747
Epoch [13/60], Batch [130/447], Loss: 2.8499
Epoch [13/60], Batch [140/447], Loss: 3.2684
Epoch [13/60], Batch [150/447], Loss: 2.8007
Epoch [13/60], Batch [160/447], Loss: 3.5608
Epoch [13/60], Batch [170/447], Loss: 3.3386
Epoch [13/60], Batch [180/447], Loss: 3.2640
Epoch [13/60], Batch [190/447], Loss: 3.0858
Epoch [13/60], Batch [200/447], Loss: 2.9958
Epoch [13/60], Batch [210/447], Loss: 2.6574
Epoch [13/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [14/60], Batch [0/447], Loss: 2.9330
Epoch [14/60], Batch [10/447], Loss: 3.1332
Epoch [14/60], Batch [20/447], Loss: 2.8489
Epoch [14/60], Batch [30/447], Loss: 3.3398
Epoch [14/60], Batch [40/447], Loss: 2.9388
Epoch [14/60], Batch [50/447], Loss: 2.4959
Epoch [14/60], Batch [60/447], Loss: 3.1100
Epoch [14/60], Batch [70/447], Loss: 3.1751
Epoch [14/60], Batch [80/447], Loss: 2.6336
Epoch [14/60], Batch [90/447], Loss: 2.8265
Epoch [14/60], Batch [100/447], Loss: 3.1767
Epoch [14/60], Batch [110/447], Loss: 2.9790
Epoch [14/60], Batch [120/447], Loss: 3.1812
Epoch [14/60], Batch [130/447], Loss: 3.3896
Epoch [14/60], Batch [140/447], Loss: 2.6280
Epoch [14/60], Batch [150/447], Loss: 3.0533
Epoch [14/60], Batch [160/447], Loss: 2.7757
Epoch [14/60], Batch [170/447], Loss: 3.1403
Epoch [14/60], Batch [180/447], Loss: 3.0656
Epoch [14/60], Batch [190/447], Loss: 2.9467
Epoch [14/60], Batch [200/447], Loss: 2.8587
Epoch [14/60], Batch [210/447], Loss: 2.8102
Epoch [14/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [15/60], Batch [0/447], Loss: 2.5944
Epoch [15/60], Batch [10/447], Loss: 3.1919
Epoch [15/60], Batch [20/447], Loss: 2.8898
Epoch [15/60], Batch [30/447], Loss: 2.7632
Epoch [15/60], Batch [40/447], Loss: 3.0050
Epoch [15/60], Batch [50/447], Loss: 3.1031
Epoch [15/60], Batch [60/447], Loss: 2.9133
Epoch [15/60], Batch [70/447], Loss: 3.0808
Epoch [15/60], Batch [80/447], Loss: 2.9243
Epoch [15/60], Batch [90/447], Loss: 2.7943
Epoch [15/60], Batch [100/447], Loss: 2.5829
Epoch [15/60], Batch [110/447], Loss: 3.1214
Epoch [15/60], Batch [120/447], Loss: 3.0254
Epoch [15/60], Batch [130/447], Loss: 2.5422
Epoch [15/60], Batch [140/447], Loss: 3.2490
Epoch [15/60], Batch [150/447], Loss: 2.9277
Epoch [15/60], Batch [160/447], Loss: 2.8394
Epoch [15/60], Batch [170/447], Loss: 3.2635
Epoch [15/60], Batch [180/447], Loss: 3.2942
Epoch [15/60], Batch [190/447], Loss: 3.2250
Epoch [15/60], Batch [200/447], Loss: 3.2702
Epoch [15/60], Batch [210/447], Loss: 3.3773
Epoch [15/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [16/60], Batch [0/447], Loss: 3.1656
Epoch [16/60], Batch [10/447], Loss: 2.5401
Epoch [16/60], Batch [20/447], Loss: 2.8143
Epoch [16/60], Batch [30/447], Loss: 2.4569
Epoch [16/60], Batch [40/447], Loss: 2.9608
Epoch [16/60], Batch [50/447], Loss: 3.0104
Epoch [16/60], Batch [60/447], Loss: 3.2963
Epoch [16/60], Batch [70/447], Loss: 2.7112
Epoch [16/60], Batch [80/447], Loss: 3.4188
Epoch [16/60], Batch [90/447], Loss: 3.5923
Epoch [16/60], Batch [100/447], Loss: 2.7842
Epoch [16/60], Batch [110/447], Loss: 2.4441
Epoch [16/60], Batch [120/447], Loss: 3.2408
Epoch [16/60], Batch [130/447], Loss: 2.9880
Epoch [16/60], Batch [140/447], Loss: 2.3142
Epoch [16/60], Batch [150/447], Loss: 3.1513
Epoch [16/60], Batch [160/447], Loss: 3.2745
Epoch [16/60], Batch [170/447], Loss: 3.5439
Epoch [16/60], Batch [180/447], Loss: 2.5783
Epoch [16/60], Batch [190/447], Loss: 2.5003
Epoch [16/60], Batch [200/447], Loss: 2.9334
Epoch [16/60], Batch [210/447], Loss: 2.7046
Epoch [16/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [17/60], Batch [0/447], Loss: 3.0400
Epoch [17/60], Batch [10/447], Loss: 2.7429
Epoch [17/60], Batch [20/447], Loss: 2.9944
Epoch [17/60], Batch [30/447], Loss: 3.4250
Epoch [17/60], Batch [40/447], Loss: 3.0156
Epoch [17/60], Batch [50/447], Loss: 2.6373
Epoch [17/60], Batch [60/447], Loss: 3.1165
Epoch [17/60], Batch [70/447], Loss: 3.0414
Epoch [17/60], Batch [80/447], Loss: 2.9726
Epoch [17/60], Batch [90/447], Loss: 2.8818
Epoch [17/60], Batch [100/447], Loss: 3.1162
Epoch [17/60], Batch [110/447], Loss: 2.6314
Epoch [17/60], Batch [120/447], Loss: 2.8621
Epoch [17/60], Batch [130/447], Loss: 3.2811
Epoch [17/60], Batch [140/447], Loss: 2.9442
Epoch [17/60], Batch [150/447], Loss: 2.7672
Epoch [17/60], Batch [160/447], Loss: 3.0530
Epoch [17/60], Batch [170/447], Loss: 2.7570
Epoch [17/60], Batch [180/447], Loss: 2.7049
Epoch [17/60], Batch [190/447], Loss: 2.6521
Epoch [17/60], Batch [200/447], Loss: 2.4976
Epoch [17/60], Batch [210/447], Loss: 2.9769
Epoch [17/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [18/60], Batch [0/447], Loss: 2.8070
Epoch [18/60], Batch [10/447], Loss: 3.2963
Epoch [18/60], Batch [20/447], Loss: 3.2866
Epoch [18/60], Batch [30/447], Loss: 3.3327
Epoch [18/60], Batch [40/447], Loss: 2.7391
Epoch [18/60], Batch [50/447], Loss: 2.8000
Epoch [18/60], Batch [60/447], Loss: 2.9101
Epoch [18/60], Batch [70/447], Loss: 2.7961
Epoch [18/60], Batch [80/447], Loss: 2.4046
Epoch [18/60], Batch [90/447], Loss: 2.7427
Epoch [18/60], Batch [100/447], Loss: 2.6229
Epoch [18/60], Batch [110/447], Loss: 2.7867
Epoch [18/60], Batch [120/447], Loss: 2.8627
Epoch [18/60], Batch [130/447], Loss: 3.2881
Epoch [18/60], Batch [140/447], Loss: 2.5649
Epoch [18/60], Batch [150/447], Loss: 2.8698
Epoch [18/60], Batch [160/447], Loss: 3.2110
Epoch [18/60], Batch [170/447], Loss: 2.9956
Epoch [18/60], Batch [180/447], Loss: 3.0863
Epoch [18/60], Batch [190/447], Loss: 2.7220
Epoch [18/60], Batch [200/447], Loss: 3.1420
Epoch [18/60], Batch [210/447], Loss: 3.0639
Epoch [18/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [19/60], Batch [0/447], Loss: 2.7203
Epoch [19/60], Batch [10/447], Loss: 3.3181
Epoch [19/60], Batch [20/447], Loss: 2.9302
Epoch [19/60], Batch [30/447], Loss: 3.1632
Epoch [19/60], Batch [40/447], Loss: 2.8143
Epoch [19/60], Batch [50/447], Loss: 3.0117
Epoch [19/60], Batch [60/447], Loss: 2.2531
Epoch [19/60], Batch [70/447], Loss: 3.1511
Epoch [19/60], Batch [80/447], Loss: 2.7731
Epoch [19/60], Batch [90/447], Loss: 3.1905
Epoch [19/60], Batch [100/447], Loss: 2.9244
Epoch [19/60], Batch [110/447], Loss: 2.5916
Epoch [19/60], Batch [120/447], Loss: 2.4517
Epoch [19/60], Batch [130/447], Loss: 2.4968
Epoch [19/60], Batch [140/447], Loss: 3.0798
Epoch [19/60], Batch [150/447], Loss: 3.2555
Epoch [19/60], Batch [160/447], Loss: 3.0276
Epoch [19/60], Batch [170/447], Loss: 3.0371
Epoch [19/60], Batch [180/447], Loss: 2.4567
Epoch [19/60], Batch [190/447], Loss: 2.8572
Epoch [19/60], Batch [200/447], Loss: 2.7186
Epoch [19/60], Batch [210/447], Loss: 2.3872
Epoch [19/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [20/60], Batch [0/447], Loss: 2.9630
Epoch [20/60], Batch [10/447], Loss: 2.6963
Epoch [20/60], Batch [20/447], Loss: 2.6132
Epoch [20/60], Batch [30/447], Loss: 2.8505
Epoch [20/60], Batch [40/447], Loss: 2.9817
Epoch [20/60], Batch [50/447], Loss: 1.8188
Epoch [20/60], Batch [60/447], Loss: 1.9378
Epoch [20/60], Batch [70/447], Loss: 2.5508
Epoch [20/60], Batch [80/447], Loss: 2.6083
Epoch [20/60], Batch [90/447], Loss: 2.7116
Epoch [20/60], Batch [100/447], Loss: 3.0582
Epoch [20/60], Batch [110/447], Loss: 2.8785
Epoch [20/60], Batch [120/447], Loss: 3.1109
Epoch [20/60], Batch [130/447], Loss: 2.3745
Epoch [20/60], Batch [140/447], Loss: 2.4275
Epoch [20/60], Batch [150/447], Loss: 2.6934
Epoch [20/60], Batch [160/447], Loss: 3.4472
Epoch [20/60], Batch [170/447], Loss: 2.7216
Epoch [20/60], Batch [180/447], Loss: 2.4852
Epoch [20/60], Batch [190/447], Loss: 3.0904
Epoch [20/60], Batch [200/447], Loss: 3.1952
Epoch [20/60], Batch [210/447], Loss: 2.4458
Epoch [20/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [21/60], Batch [0/447], Loss: 3.3258
Epoch [21/60], Batch [10/447], Loss: 2.8482
Epoch [21/60], Batch [20/447], Loss: 3.0501
Epoch [21/60], Batch [30/447], Loss: 2.9847
Epoch [21/60], Batch [40/447], Loss: 2.9505
Epoch [21/60], Batch [50/447], Loss: 2.8741
Epoch [21/60], Batch [60/447], Loss: 2.6097
Epoch [21/60], Batch [70/447], Loss: 2.3140
Epoch [21/60], Batch [80/447], Loss: 2.3656
Epoch [21/60], Batch [90/447], Loss: 2.9398
Epoch [21/60], Batch [100/447], Loss: 2.2121
Epoch [21/60], Batch [110/447], Loss: 2.8182
Epoch [21/60], Batch [120/447], Loss: 2.6817
Epoch [21/60], Batch [130/447], Loss: 2.3926
Epoch [21/60], Batch [140/447], Loss: 2.8737
Epoch [21/60], Batch [150/447], Loss: 2.8041
Epoch [21/60], Batch [160/447], Loss: 3.1038
Epoch [21/60], Batch [170/447], Loss: 2.7200
Epoch [21/60], Batch [180/447], Loss: 3.3994
Epoch [21/60], Batch [190/447], Loss: 2.2897
Epoch [21/60], Batch [200/447], Loss: 2.1283
Epoch [21/60], Batch [210/447], Loss: 2.9964
Epoch [21/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [22/60], Batch [0/447], Loss: 2.8319
Epoch [22/60], Batch [10/447], Loss: 2.9822
Epoch [22/60], Batch [20/447], Loss: 2.2970
Epoch [22/60], Batch [30/447], Loss: 1.8653
Epoch [22/60], Batch [40/447], Loss: 2.3653
Epoch [22/60], Batch [50/447], Loss: 2.8353
Epoch [22/60], Batch [60/447], Loss: 2.2713
Epoch [22/60], Batch [70/447], Loss: 2.7160
Epoch [22/60], Batch [80/447], Loss: 2.6152
Epoch [22/60], Batch [90/447], Loss: 2.8141
Epoch [22/60], Batch [100/447], Loss: 1.6978
Epoch [22/60], Batch [110/447], Loss: 2.8907
Epoch [22/60], Batch [120/447], Loss: 2.5006
Epoch [22/60], Batch [130/447], Loss: 2.3335
Epoch [22/60], Batch [140/447], Loss: 3.0618
Epoch [22/60], Batch [150/447], Loss: 2.7480
Epoch [22/60], Batch [160/447], Loss: 1.9521
Epoch [22/60], Batch [170/447], Loss: 2.5835
Epoch [22/60], Batch [180/447], Loss: 2.7040
Epoch [22/60], Batch [190/447], Loss: 2.4025
Epoch [22/60], Batch [200/447], Loss: 2.9936
Epoch [22/60], Batch [210/447], Loss: 2.8481
Epoch [22/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [23/60], Batch [0/447], Loss: 2.9837
Epoch [23/60], Batch [10/447], Loss: 2.2106
Epoch [23/60], Batch [20/447], Loss: 2.5665
Epoch [23/60], Batch [30/447], Loss: 2.8136
Epoch [23/60], Batch [40/447], Loss: 2.3837
Epoch [23/60], Batch [50/447], Loss: 2.1688
Epoch [23/60], Batch [60/447], Loss: 3.0157
Epoch [23/60], Batch [70/447], Loss: 2.6765
Epoch [23/60], Batch [80/447], Loss: 2.7586
Epoch [23/60], Batch [90/447], Loss: 2.5372
Epoch [23/60], Batch [100/447], Loss: 2.3038
Epoch [23/60], Batch [110/447], Loss: 2.7362
Epoch [23/60], Batch [120/447], Loss: 2.4951
Epoch [23/60], Batch [130/447], Loss: 2.7398
Epoch [23/60], Batch [140/447], Loss: 2.1828
Epoch [23/60], Batch [150/447], Loss: 2.9258
Epoch [23/60], Batch [160/447], Loss: 2.6973
Epoch [23/60], Batch [170/447], Loss: 2.7049
Epoch [23/60], Batch [180/447], Loss: 2.5830
Epoch [23/60], Batch [190/447], Loss: 2.6896
Epoch [23/60], Batch [200/447], Loss: 2.6115
Epoch [23/60], Batch [210/447], Loss: 2.9771
Epoch [23/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [24/60], Batch [0/447], Loss: 3.0450
Epoch [24/60], Batch [10/447], Loss: 2.9184
Epoch [24/60], Batch [20/447], Loss: 2.6083
Epoch [24/60], Batch [30/447], Loss: 2.5174
Epoch [24/60], Batch [40/447], Loss: 2.6063
Epoch [24/60], Batch [50/447], Loss: 2.8460
Epoch [24/60], Batch [60/447], Loss: 3.2407
Epoch [24/60], Batch [70/447], Loss: 2.2938
Epoch [24/60], Batch [80/447], Loss: 2.1905
Epoch [24/60], Batch [90/447], Loss: 1.9186
Epoch [24/60], Batch [100/447], Loss: 2.6863
Epoch [24/60], Batch [110/447], Loss: 2.8056
Epoch [24/60], Batch [120/447], Loss: 2.7707
Epoch [24/60], Batch [130/447], Loss: 2.8623
Epoch [24/60], Batch [140/447], Loss: 2.5873
Epoch [24/60], Batch [150/447], Loss: 2.7138
Epoch [24/60], Batch [160/447], Loss: 2.9274
Epoch [24/60], Batch [170/447], Loss: 2.0166
Epoch [24/60], Batch [180/447], Loss: 2.6162
Epoch [24/60], Batch [190/447], Loss: 2.7781
Epoch [24/60], Batch [200/447], Loss: 2.4896
Epoch [24/60], Batch [210/447], Loss: 2.6887
Epoch [24/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [25/60], Batch [0/447], Loss: 2.6767
Epoch [25/60], Batch [10/447], Loss: 2.7597
Epoch [25/60], Batch [20/447], Loss: 2.7402
Epoch [25/60], Batch [30/447], Loss: 3.0141
Epoch [25/60], Batch [40/447], Loss: 2.5308
Epoch [25/60], Batch [50/447], Loss: 2.9739
Epoch [25/60], Batch [60/447], Loss: 2.3281
Epoch [25/60], Batch [70/447], Loss: 2.1412
Epoch [25/60], Batch [80/447], Loss: 2.3096
Epoch [25/60], Batch [90/447], Loss: 2.4135
Epoch [25/60], Batch [100/447], Loss: 2.9933
Epoch [25/60], Batch [110/447], Loss: 2.8374
Epoch [25/60], Batch [120/447], Loss: 2.3156
Epoch [25/60], Batch [130/447], Loss: 2.3938
Epoch [25/60], Batch [140/447], Loss: 2.0743
Epoch [25/60], Batch [150/447], Loss: 3.0406
Epoch [25/60], Batch [160/447], Loss: 2.8208
Epoch [25/60], Batch [170/447], Loss: 2.6902
Epoch [25/60], Batch [180/447], Loss: 2.4773
Epoch [25/60], Batch [190/447], Loss: 2.3065
Epoch [25/60], Batch [200/447], Loss: 2.4704
Epoch [25/60], Batch [210/447], Loss: 2.3159
Epoch [25/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [26/60], Batch [0/447], Loss: 2.8058
Epoch [26/60], Batch [10/447], Loss: 2.0922
Epoch [26/60], Batch [20/447], Loss: 1.8133
Epoch [26/60], Batch [30/447], Loss: 2.7357
Epoch [26/60], Batch [40/447], Loss: 2.6920
Epoch [26/60], Batch [50/447], Loss: 3.0394
Epoch [26/60], Batch [60/447], Loss: 2.7045
Epoch [26/60], Batch [70/447], Loss: 3.3017
Epoch [26/60], Batch [80/447], Loss: 2.3939
Epoch [26/60], Batch [90/447], Loss: 2.5313
Epoch [26/60], Batch [100/447], Loss: 2.4318
Epoch [26/60], Batch [110/447], Loss: 2.4759
Epoch [26/60], Batch [120/447], Loss: 2.6364
Epoch [26/60], Batch [130/447], Loss: 2.4891
Epoch [26/60], Batch [140/447], Loss: 2.9651
Epoch [26/60], Batch [150/447], Loss: 2.9895
Epoch [26/60], Batch [160/447], Loss: 2.4707
Epoch [26/60], Batch [170/447], Loss: 2.2187
Epoch [26/60], Batch [180/447], Loss: 2.6838
Epoch [26/60], Batch [190/447], Loss: 2.6178
Epoch [26/60], Batch [200/447], Loss: 1.9003
Epoch [26/60], Batch [210/447], Loss: 2.3245
Epoch [26/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [27/60], Batch [0/447], Loss: 2.4442
Epoch [27/60], Batch [10/447], Loss: 2.0826
Epoch [27/60], Batch [20/447], Loss: 3.0445
Epoch [27/60], Batch [30/447], Loss: 2.6122
Epoch [27/60], Batch [40/447], Loss: 2.2435
Epoch [27/60], Batch [50/447], Loss: 2.5418
Epoch [27/60], Batch [60/447], Loss: 2.7447
Epoch [27/60], Batch [70/447], Loss: 2.9152
Epoch [27/60], Batch [80/447], Loss: 2.6463
Epoch [27/60], Batch [90/447], Loss: 3.2117
Epoch [27/60], Batch [100/447], Loss: 2.2394
Epoch [27/60], Batch [110/447], Loss: 3.1247
Epoch [27/60], Batch [120/447], Loss: 2.2755
Epoch [27/60], Batch [130/447], Loss: 2.2026
Epoch [27/60], Batch [140/447], Loss: 3.0470
Epoch [27/60], Batch [150/447], Loss: 2.7356
Epoch [27/60], Batch [160/447], Loss: 2.6658
Epoch [27/60], Batch [170/447], Loss: 2.6913
Epoch [27/60], Batch [180/447], Loss: 2.5354
Epoch [27/60], Batch [190/447], Loss: 2.6555
Epoch [27/60], Batch [200/447], Loss: 2.6679
Epoch [27/60], Batch [210/447], Loss: 2.2802
Epoch [27/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [28/60], Batch [0/447], Loss: 2.6745
Epoch [28/60], Batch [10/447], Loss: 2.5773
Epoch [28/60], Batch [20/447], Loss: 2.5535
Epoch [28/60], Batch [30/447], Loss: 2.9654
Epoch [28/60], Batch [40/447], Loss: 2.5019
Epoch [28/60], Batch [50/447], Loss: 1.9235
Epoch [28/60], Batch [60/447], Loss: 2.7504
Epoch [28/60], Batch [70/447], Loss: 2.1524
Epoch [28/60], Batch [80/447], Loss: 2.6895
Epoch [28/60], Batch [90/447], Loss: 2.3711
Epoch [28/60], Batch [100/447], Loss: 2.7698
Epoch [28/60], Batch [110/447], Loss: 3.0963
Epoch [28/60], Batch [120/447], Loss: 2.8132
Epoch [28/60], Batch [130/447], Loss: 2.6224
Epoch [28/60], Batch [140/447], Loss: 2.4206
Epoch [28/60], Batch [150/447], Loss: 3.4323
Epoch [28/60], Batch [160/447], Loss: 2.4489
Epoch [28/60], Batch [170/447], Loss: 2.7450
Epoch [28/60], Batch [180/447], Loss: 2.9237
Epoch [28/60], Batch [190/447], Loss: 2.3511
Epoch [28/60], Batch [200/447], Loss: 2.3609
Epoch [28/60], Batch [210/447], Loss: 2.5345
Epoch [28/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [29/60], Batch [0/447], Loss: 2.9398
Epoch [29/60], Batch [10/447], Loss: 2.5910
Epoch [29/60], Batch [20/447], Loss: 2.2642
Epoch [29/60], Batch [30/447], Loss: 2.2819
Epoch [29/60], Batch [40/447], Loss: 2.4069
Epoch [29/60], Batch [50/447], Loss: 1.9947
Epoch [29/60], Batch [60/447], Loss: 2.0101
Epoch [29/60], Batch [70/447], Loss: 2.1447
Epoch [29/60], Batch [80/447], Loss: 1.9228
Epoch [29/60], Batch [90/447], Loss: 2.9092
Epoch [29/60], Batch [100/447], Loss: 2.4975
Epoch [29/60], Batch [110/447], Loss: 2.2489
Epoch [29/60], Batch [120/447], Loss: 2.3953
Epoch [29/60], Batch [130/447], Loss: 3.2755
Epoch [29/60], Batch [140/447], Loss: 2.2797
Epoch [29/60], Batch [150/447], Loss: 2.1978
Epoch [29/60], Batch [160/447], Loss: 2.5844
Epoch [29/60], Batch [170/447], Loss: 1.5820
Epoch [29/60], Batch [180/447], Loss: 2.4580
Epoch [29/60], Batch [190/447], Loss: 2.1212
Epoch [29/60], Batch [200/447], Loss: 2.0061
Epoch [29/60], Batch [210/447], Loss: 1.5865
Epoch [29/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [30/60], Batch [0/447], Loss: 2.0950
Epoch [30/60], Batch [10/447], Loss: 2.6230
Epoch [30/60], Batch [20/447], Loss: 1.7398
Epoch [30/60], Batch [30/447], Loss: 2.7019
Epoch [30/60], Batch [40/447], Loss: 2.9838
Epoch [30/60], Batch [50/447], Loss: 2.3195
Epoch [30/60], Batch [60/447], Loss: 2.4126
Epoch [30/60], Batch [70/447], Loss: 2.4674
Epoch [30/60], Batch [80/447], Loss: 2.8272
Epoch [30/60], Batch [90/447], Loss: 2.6007
Epoch [30/60], Batch [100/447], Loss: 2.1421
Epoch [30/60], Batch [110/447], Loss: 2.8814
Epoch [30/60], Batch [120/447], Loss: 2.0282
Epoch [30/60], Batch [130/447], Loss: 2.1042
Epoch [30/60], Batch [140/447], Loss: 3.1741
Epoch [30/60], Batch [150/447], Loss: 2.9143
Epoch [30/60], Batch [160/447], Loss: 3.0014
Epoch [30/60], Batch [170/447], Loss: 2.7086
Epoch [30/60], Batch [180/447], Loss: 2.5185
Epoch [30/60], Batch [190/447], Loss: 2.8544
Epoch [30/60], Batch [200/447], Loss: 2.7007
Epoch [30/60], Batch [210/447], Loss: 2.7442
Epoch [30/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [31/60], Batch [0/447], Loss: 2.2101
Epoch [31/60], Batch [10/447], Loss: 2.1971
Epoch [31/60], Batch [20/447], Loss: 2.3504
Epoch [31/60], Batch [30/447], Loss: 2.2428
Epoch [31/60], Batch [40/447], Loss: 1.9807
Epoch [31/60], Batch [50/447], Loss: 2.3435
Epoch [31/60], Batch [60/447], Loss: 2.3763
Epoch [31/60], Batch [70/447], Loss: 1.9509
Epoch [31/60], Batch [80/447], Loss: 2.4845
Epoch [31/60], Batch [90/447], Loss: 1.8292
Epoch [31/60], Batch [100/447], Loss: 2.3396
Epoch [31/60], Batch [110/447], Loss: 2.4898
Epoch [31/60], Batch [120/447], Loss: 2.7202
Epoch [31/60], Batch [130/447], Loss: 1.9297
Epoch [31/60], Batch [140/447], Loss: 2.9385
Epoch [31/60], Batch [150/447], Loss: 2.0882
Epoch [31/60], Batch [160/447], Loss: 2.0026
Epoch [31/60], Batch [170/447], Loss: 2.3263
Epoch [31/60], Batch [180/447], Loss: 2.4059
Epoch [31/60], Batch [190/447], Loss: 2.7724
Epoch [31/60], Batch [200/447], Loss: 2.5438
Epoch [31/60], Batch [210/447], Loss: 2.6924
Epoch [31/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [32/60], Batch [0/447], Loss: 2.3868
Epoch [32/60], Batch [10/447], Loss: 2.4618
Epoch [32/60], Batch [20/447], Loss: 2.2093
Epoch [32/60], Batch [30/447], Loss: 1.9969
Epoch [32/60], Batch [40/447], Loss: 2.1121
Epoch [32/60], Batch [50/447], Loss: 2.2884
Epoch [32/60], Batch [60/447], Loss: 2.3089
Epoch [32/60], Batch [70/447], Loss: 2.2137
Epoch [32/60], Batch [80/447], Loss: 2.8503
Epoch [32/60], Batch [90/447], Loss: 2.3577
Epoch [32/60], Batch [100/447], Loss: 2.4527
Epoch [32/60], Batch [110/447], Loss: 2.0541
Epoch [32/60], Batch [120/447], Loss: 1.9830
Epoch [32/60], Batch [130/447], Loss: 2.7568
Epoch [32/60], Batch [140/447], Loss: 2.3692
Epoch [32/60], Batch [150/447], Loss: 2.1556
Epoch [32/60], Batch [160/447], Loss: 2.1154
Epoch [32/60], Batch [170/447], Loss: 1.2190
Epoch [32/60], Batch [180/447], Loss: 2.5347
Epoch [32/60], Batch [190/447], Loss: 2.5279
Epoch [32/60], Batch [200/447], Loss: 2.2103
Epoch [32/60], Batch [210/447], Loss: 2.5129
Epoch [32/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [33/60], Batch [0/447], Loss: 2.7246
Epoch [33/60], Batch [10/447], Loss: 1.9785
Epoch [33/60], Batch [20/447], Loss: 2.4045
Epoch [33/60], Batch [30/447], Loss: 2.5638
Epoch [33/60], Batch [40/447], Loss: 2.3940
Epoch [33/60], Batch [50/447], Loss: 2.7424
Epoch [33/60], Batch [60/447], Loss: 2.4730
Epoch [33/60], Batch [70/447], Loss: 2.4530
Epoch [33/60], Batch [80/447], Loss: 2.5695
Epoch [33/60], Batch [90/447], Loss: 2.3247
Epoch [33/60], Batch [100/447], Loss: 2.4474
Epoch [33/60], Batch [110/447], Loss: 2.4996
Epoch [33/60], Batch [120/447], Loss: 2.6614
Epoch [33/60], Batch [130/447], Loss: 2.5905
Epoch [33/60], Batch [140/447], Loss: 2.3444
Epoch [33/60], Batch [150/447], Loss: 2.5980
Epoch [33/60], Batch [160/447], Loss: 2.4150
Epoch [33/60], Batch [170/447], Loss: 2.0780
Epoch [33/60], Batch [180/447], Loss: 3.1055
Epoch [33/60], Batch [190/447], Loss: 2.3416
Epoch [33/60], Batch [200/447], Loss: 2.0752
Epoch [33/60], Batch [210/447], Loss: 2.1254
Epoch [33/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [34/60], Batch [0/447], Loss: 1.3842
Epoch [34/60], Batch [10/447], Loss: 2.5437
Epoch [34/60], Batch [20/447], Loss: 2.3079
Epoch [34/60], Batch [30/447], Loss: 2.1666
Epoch [34/60], Batch [40/447], Loss: 2.4038
Epoch [34/60], Batch [50/447], Loss: 2.5605
Epoch [34/60], Batch [60/447], Loss: 2.4909
Epoch [34/60], Batch [70/447], Loss: 2.6905
Epoch [34/60], Batch [80/447], Loss: 1.9812
Epoch [34/60], Batch [90/447], Loss: 2.8256
Epoch [34/60], Batch [100/447], Loss: 1.8724
Epoch [34/60], Batch [110/447], Loss: 1.9057
Epoch [34/60], Batch [120/447], Loss: 2.1169
Epoch [34/60], Batch [130/447], Loss: 2.4245
Epoch [34/60], Batch [140/447], Loss: 2.2830
Epoch [34/60], Batch [150/447], Loss: 2.0657
Epoch [34/60], Batch [160/447], Loss: 2.1543
Epoch [34/60], Batch [170/447], Loss: 2.1686
Epoch [34/60], Batch [180/447], Loss: 2.4558
Epoch [34/60], Batch [190/447], Loss: 1.8736
Epoch [34/60], Batch [200/447], Loss: 2.2723
Epoch [34/60], Batch [210/447], Loss: 2.3569
Epoch [34/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [35/60], Batch [0/447], Loss: 2.1587
Epoch [35/60], Batch [10/447], Loss: 2.2901
Epoch [35/60], Batch [20/447], Loss: 2.5699
Epoch [35/60], Batch [30/447], Loss: 2.6009
Epoch [35/60], Batch [40/447], Loss: 2.5742
Epoch [35/60], Batch [50/447], Loss: 1.8693
Epoch [35/60], Batch [60/447], Loss: 2.1988
Epoch [35/60], Batch [70/447], Loss: 2.6969
Epoch [35/60], Batch [80/447], Loss: 2.2976
Epoch [35/60], Batch [90/447], Loss: 1.8366
Epoch [35/60], Batch [100/447], Loss: 2.4905
Epoch [35/60], Batch [110/447], Loss: 2.3550
Epoch [35/60], Batch [120/447], Loss: 2.5067
Epoch [35/60], Batch [130/447], Loss: 2.2368
Epoch [35/60], Batch [140/447], Loss: 2.3942
Epoch [35/60], Batch [150/447], Loss: 3.1382
Epoch [35/60], Batch [160/447], Loss: 2.4437
Epoch [35/60], Batch [170/447], Loss: 3.0716
Epoch [35/60], Batch [180/447], Loss: 2.6333
Epoch [35/60], Batch [190/447], Loss: 2.8411
Epoch [35/60], Batch [200/447], Loss: 2.6410
Epoch [35/60], Batch [210/447], Loss: 2.7535
Epoch [35/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [36/60], Batch [0/447], Loss: 2.1706
Epoch [36/60], Batch [10/447], Loss: 2.4680
Epoch [36/60], Batch [20/447], Loss: 2.6767
Epoch [36/60], Batch [30/447], Loss: 2.2078
Epoch [36/60], Batch [40/447], Loss: 2.1533
Epoch [36/60], Batch [50/447], Loss: 2.3537
Epoch [36/60], Batch [60/447], Loss: 2.4426
Epoch [36/60], Batch [70/447], Loss: 2.1281
Epoch [36/60], Batch [80/447], Loss: 2.5402
Epoch [36/60], Batch [90/447], Loss: 2.4344
Epoch [36/60], Batch [100/447], Loss: 2.6714
Epoch [36/60], Batch [110/447], Loss: 2.4961
Epoch [36/60], Batch [120/447], Loss: 1.8265
Epoch [36/60], Batch [130/447], Loss: 2.2140
Epoch [36/60], Batch [140/447], Loss: 2.3575
Epoch [36/60], Batch [150/447], Loss: 2.0975
Epoch [36/60], Batch [160/447], Loss: 2.3273
Epoch [36/60], Batch [170/447], Loss: 2.3742
Epoch [36/60], Batch [180/447], Loss: 1.6740
Epoch [36/60], Batch [190/447], Loss: 2.2330
Epoch [36/60], Batch [200/447], Loss: 2.1180
Epoch [36/60], Batch [210/447], Loss: 2.7527
Epoch [36/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [37/60], Batch [0/447], Loss: 2.3059
Epoch [37/60], Batch [10/447], Loss: 2.1184
Epoch [37/60], Batch [20/447], Loss: 2.4165
Epoch [37/60], Batch [30/447], Loss: 2.8129
Epoch [37/60], Batch [40/447], Loss: 1.8739
Epoch [37/60], Batch [50/447], Loss: 1.6622
Epoch [37/60], Batch [60/447], Loss: 2.5093
Epoch [37/60], Batch [70/447], Loss: 2.5806
Epoch [37/60], Batch [80/447], Loss: 2.0382
Epoch [37/60], Batch [90/447], Loss: 3.2136
Epoch [37/60], Batch [100/447], Loss: 2.1442
Epoch [37/60], Batch [110/447], Loss: 2.6035
Epoch [37/60], Batch [120/447], Loss: 2.6684
Epoch [37/60], Batch [130/447], Loss: 2.6916
Epoch [37/60], Batch [140/447], Loss: 2.5021
Epoch [37/60], Batch [150/447], Loss: 2.2655
Epoch [37/60], Batch [160/447], Loss: 2.6896
Epoch [37/60], Batch [170/447], Loss: 2.3699
Epoch [37/60], Batch [180/447], Loss: 2.2740
Epoch [37/60], Batch [190/447], Loss: 1.7784
Epoch [37/60], Batch [200/447], Loss: 2.1338
Epoch [37/60], Batch [210/447], Loss: 1.8949
Epoch [37/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [38/60], Batch [0/447], Loss: 2.8205
Epoch [38/60], Batch [10/447], Loss: 1.7317
Epoch [38/60], Batch [20/447], Loss: 2.1880
Epoch [38/60], Batch [30/447], Loss: 2.3343
Epoch [38/60], Batch [40/447], Loss: 2.3860
Epoch [38/60], Batch [50/447], Loss: 2.2259
Epoch [38/60], Batch [60/447], Loss: 2.6553
Epoch [38/60], Batch [70/447], Loss: 2.3488
Epoch [38/60], Batch [80/447], Loss: 2.9547
Epoch [38/60], Batch [90/447], Loss: 2.3809
Epoch [38/60], Batch [100/447], Loss: 2.0939
Epoch [38/60], Batch [110/447], Loss: 1.3210
Epoch [38/60], Batch [120/447], Loss: 2.1964
Epoch [38/60], Batch [130/447], Loss: 2.1708
Epoch [38/60], Batch [140/447], Loss: 1.8945
Epoch [38/60], Batch [150/447], Loss: 2.6587
Epoch [38/60], Batch [160/447], Loss: 2.0508
Epoch [38/60], Batch [170/447], Loss: 2.4198
Epoch [38/60], Batch [180/447], Loss: 2.7653
Epoch [38/60], Batch [190/447], Loss: 1.9336
Epoch [38/60], Batch [200/447], Loss: 2.6947
Epoch [38/60], Batch [210/447], Loss: 2.1608
Epoch [38/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [39/60], Batch [0/447], Loss: 2.6398
Epoch [39/60], Batch [10/447], Loss: 2.1964
Epoch [39/60], Batch [20/447], Loss: 3.0591
Epoch [39/60], Batch [30/447], Loss: 2.2218
Epoch [39/60], Batch [40/447], Loss: 2.5389
Epoch [39/60], Batch [50/447], Loss: 2.5907
Epoch [39/60], Batch [60/447], Loss: 2.6995
Epoch [39/60], Batch [70/447], Loss: 1.7955
Epoch [39/60], Batch [80/447], Loss: 2.3786
Epoch [39/60], Batch [90/447], Loss: 2.6977
Epoch [39/60], Batch [100/447], Loss: 2.1871
Epoch [39/60], Batch [110/447], Loss: 1.9403
Epoch [39/60], Batch [120/447], Loss: 2.6566
Epoch [39/60], Batch [130/447], Loss: 1.7098
Epoch [39/60], Batch [140/447], Loss: 2.0880
Epoch [39/60], Batch [150/447], Loss: 2.1124
Epoch [39/60], Batch [160/447], Loss: 2.7001
Epoch [39/60], Batch [170/447], Loss: 2.0756
Epoch [39/60], Batch [180/447], Loss: 1.8834
Epoch [39/60], Batch [190/447], Loss: 1.5795
Epoch [39/60], Batch [200/447], Loss: 1.8717
Epoch [39/60], Batch [210/447], Loss: 2.3501
Epoch [39/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [40/60], Batch [0/447], Loss: 2.9375
Epoch [40/60], Batch [10/447], Loss: 1.9991
Epoch [40/60], Batch [20/447], Loss: 2.5180
Epoch [40/60], Batch [30/447], Loss: 2.2434
Epoch [40/60], Batch [40/447], Loss: 2.4972
Epoch [40/60], Batch [50/447], Loss: 2.4474
Epoch [40/60], Batch [60/447], Loss: 1.7526
Epoch [40/60], Batch [70/447], Loss: 2.1728
Epoch [40/60], Batch [80/447], Loss: 2.6332
Epoch [40/60], Batch [90/447], Loss: 1.7053
Epoch [40/60], Batch [100/447], Loss: 2.6238
Epoch [40/60], Batch [110/447], Loss: 2.7534
Epoch [40/60], Batch [120/447], Loss: 1.4509
Epoch [40/60], Batch [130/447], Loss: 2.4816
Epoch [40/60], Batch [140/447], Loss: 2.1456
Epoch [40/60], Batch [150/447], Loss: 2.4762
Epoch [40/60], Batch [160/447], Loss: 2.3026
Epoch [40/60], Batch [170/447], Loss: 2.0868
Epoch [40/60], Batch [180/447], Loss: 2.5732
Epoch [40/60], Batch [190/447], Loss: 2.6243
Epoch [40/60], Batch [200/447], Loss: 1.4838
Epoch [40/60], Batch [210/447], Loss: 3.1097
Epoch [40/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [41/60], Batch [0/447], Loss: 2.7357
Epoch [41/60], Batch [10/447], Loss: 3.0396
Epoch [41/60], Batch [20/447], Loss: 3.1687
Epoch [41/60], Batch [30/447], Loss: 1.9229
Epoch [41/60], Batch [40/447], Loss: 2.8068
Epoch [41/60], Batch [50/447], Loss: 2.1237
Epoch [41/60], Batch [60/447], Loss: 1.5401
Epoch [41/60], Batch [70/447], Loss: 2.3724
Epoch [41/60], Batch [80/447], Loss: 1.9295
Epoch [41/60], Batch [90/447], Loss: 2.2067
Epoch [41/60], Batch [100/447], Loss: 2.0618
Epoch [41/60], Batch [110/447], Loss: 1.9399
Epoch [41/60], Batch [120/447], Loss: 2.3980
Epoch [41/60], Batch [130/447], Loss: 1.8910
Epoch [41/60], Batch [140/447], Loss: 2.1311
Epoch [41/60], Batch [150/447], Loss: 1.8596
Epoch [41/60], Batch [160/447], Loss: 2.6210
Epoch [41/60], Batch [170/447], Loss: 2.5382
Epoch [41/60], Batch [180/447], Loss: 1.7982
Epoch [41/60], Batch [190/447], Loss: 2.1740
Epoch [41/60], Batch [200/447], Loss: 2.9314
Epoch [41/60], Batch [210/447], Loss: 2.5776
Epoch [41/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [42/60], Batch [0/447], Loss: 2.6982
Epoch [42/60], Batch [10/447], Loss: 2.1612
Epoch [42/60], Batch [20/447], Loss: 2.2828
Epoch [42/60], Batch [30/447], Loss: 2.5385
Epoch [42/60], Batch [40/447], Loss: 1.5366
Epoch [42/60], Batch [50/447], Loss: 2.5130
Epoch [42/60], Batch [60/447], Loss: 1.7361
Epoch [42/60], Batch [70/447], Loss: 2.7637
Epoch [42/60], Batch [80/447], Loss: 2.5329
Epoch [42/60], Batch [90/447], Loss: 1.8106
Epoch [42/60], Batch [100/447], Loss: 2.5109
Epoch [42/60], Batch [110/447], Loss: 1.8617
Epoch [42/60], Batch [120/447], Loss: 2.3879
Epoch [42/60], Batch [130/447], Loss: 2.6696
Epoch [42/60], Batch [140/447], Loss: 2.5561
Epoch [42/60], Batch [150/447], Loss: 2.9221
Epoch [42/60], Batch [160/447], Loss: 2.8882
Epoch [42/60], Batch [170/447], Loss: 2.2668
Epoch [42/60], Batch [180/447], Loss: 2.5435
Epoch [42/60], Batch [190/447], Loss: 2.0070
Epoch [42/60], Batch [200/447], Loss: 2.5457
Epoch [42/60], Batch [210/447], Loss: 2.4961
Epoch [42/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [43/60], Batch [0/447], Loss: 1.7617
Epoch [43/60], Batch [10/447], Loss: 2.0326
Epoch [43/60], Batch [20/447], Loss: 1.8981
Epoch [43/60], Batch [30/447], Loss: 2.3496
Epoch [43/60], Batch [40/447], Loss: 2.7119
Epoch [43/60], Batch [50/447], Loss: 2.1828
Epoch [43/60], Batch [60/447], Loss: 1.9977
Epoch [43/60], Batch [70/447], Loss: 2.1731
Epoch [43/60], Batch [80/447], Loss: 2.6362
Epoch [43/60], Batch [90/447], Loss: 2.7345
Epoch [43/60], Batch [100/447], Loss: 2.3260
Epoch [43/60], Batch [110/447], Loss: 2.3822
Epoch [43/60], Batch [120/447], Loss: 2.2431
Epoch [43/60], Batch [130/447], Loss: 2.4347
Epoch [43/60], Batch [140/447], Loss: 2.1473
Epoch [43/60], Batch [150/447], Loss: 2.0264
Epoch [43/60], Batch [160/447], Loss: 2.3276
Epoch [43/60], Batch [170/447], Loss: 2.6941
Epoch [43/60], Batch [180/447], Loss: 2.4180
Epoch [43/60], Batch [190/447], Loss: 2.1280
Epoch [43/60], Batch [200/447], Loss: 2.5404
Epoch [43/60], Batch [210/447], Loss: 1.8756
Epoch [43/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [44/60], Batch [0/447], Loss: 1.6558
Epoch [44/60], Batch [10/447], Loss: 1.9940
Epoch [44/60], Batch [20/447], Loss: 2.5962
Epoch [44/60], Batch [30/447], Loss: 2.5159
Epoch [44/60], Batch [40/447], Loss: 2.3314
Epoch [44/60], Batch [50/447], Loss: 2.2448
Epoch [44/60], Batch [60/447], Loss: 2.3448
Epoch [44/60], Batch [70/447], Loss: 1.7626
Epoch [44/60], Batch [80/447], Loss: 2.6529
Epoch [44/60], Batch [90/447], Loss: 2.0773
Epoch [44/60], Batch [100/447], Loss: 2.4293
Epoch [44/60], Batch [110/447], Loss: 2.5114
Epoch [44/60], Batch [120/447], Loss: 2.3576
Epoch [44/60], Batch [130/447], Loss: 2.2856
Epoch [44/60], Batch [140/447], Loss: 2.3931
Epoch [44/60], Batch [150/447], Loss: 2.2594
Epoch [44/60], Batch [160/447], Loss: 2.3092
Epoch [44/60], Batch [170/447], Loss: 2.1951
Epoch [44/60], Batch [180/447], Loss: 1.8540
Epoch [44/60], Batch [190/447], Loss: 2.1629
Epoch [44/60], Batch [200/447], Loss: 2.3133
Epoch [44/60], Batch [210/447], Loss: 2.6664
Epoch [44/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [45/60], Batch [0/447], Loss: 1.6448
Epoch [45/60], Batch [10/447], Loss: 2.0250
Epoch [45/60], Batch [20/447], Loss: 2.2510
Epoch [45/60], Batch [30/447], Loss: 1.9086
Epoch [45/60], Batch [40/447], Loss: 2.2349
Epoch [45/60], Batch [50/447], Loss: 1.5618
Epoch [45/60], Batch [60/447], Loss: 2.4005
Epoch [45/60], Batch [70/447], Loss: 2.3223
Epoch [45/60], Batch [80/447], Loss: 2.9573
Epoch [45/60], Batch [90/447], Loss: 2.0709
Epoch [45/60], Batch [100/447], Loss: 1.9296
Epoch [45/60], Batch [110/447], Loss: 1.8539
Epoch [45/60], Batch [120/447], Loss: 2.3049
Epoch [45/60], Batch [130/447], Loss: 2.3899
Epoch [45/60], Batch [140/447], Loss: 1.9706
Epoch [45/60], Batch [150/447], Loss: 1.5852
Epoch [45/60], Batch [160/447], Loss: 1.7204
Epoch [45/60], Batch [170/447], Loss: 1.4617
Epoch [45/60], Batch [180/447], Loss: 1.9342
Epoch [45/60], Batch [190/447], Loss: 1.8660
Epoch [45/60], Batch [200/447], Loss: 2.3555
Epoch [45/60], Batch [210/447], Loss: 2.7904
Epoch [45/60], Batch 

[I 2024-12-13 09:11:53,003] Trial 3 pruned. 


Epoch [45/60], Validation Accuracy: 0.7261, Validation Loss: 1.0200
No improvement in validation accuracy for 5 epoch(s).
Early stopping at epoch 45.
Trial early stopped due to lack of improvement.
Starting a new trial...
Trial 4: alpha = 6.026718993550662
Building the model...


2024-12-13 09:11:53,353 - mmaction - INFO - load model from: https://download.openmmlab.com/mmaction/recognition/csn/ircsn_from_scratch_r50_ig65m_20210617-ce545a37.pth
2024-12-13 09:11:53,353 - mmaction - INFO - load checkpoint from http path: https://download.openmmlab.com/mmaction/recognition/csn/ircsn_from_scratch_r50_ig65m_20210617-ce545a37.pth


Model built successfully!
Starting training...


  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [1/60], Batch [0/447], Loss: 3.9349
Epoch [1/60], Batch [10/447], Loss: 3.9333
Epoch [1/60], Batch [20/447], Loss: 3.9691
Epoch [1/60], Batch [30/447], Loss: 3.9958
Epoch [1/60], Batch [40/447], Loss: 3.9869
Epoch [1/60], Batch [50/447], Loss: 3.9094
Epoch [1/60], Batch [60/447], Loss: 3.9059
Epoch [1/60], Batch [70/447], Loss: 3.9698
Epoch [1/60], Batch [80/447], Loss: 3.9007
Epoch [1/60], Batch [90/447], Loss: 3.9836
Epoch [1/60], Batch [100/447], Loss: 4.0850
Epoch [1/60], Batch [110/447], Loss: 3.9489
Epoch [1/60], Batch [120/447], Loss: 3.9883
Epoch [1/60], Batch [130/447], Loss: 3.9589
Epoch [1/60], Batch [140/447], Loss: 3.9682
Epoch [1/60], Batch [150/447], Loss: 3.9709
Epoch [1/60], Batch [160/447], Loss: 3.9849
Epoch [1/60], Batch [170/447], Loss: 3.9022
Epoch [1/60], Batch [180/447], Loss: 3.9216
Epoch [1/60], Batch [190/447], Loss: 3.9943
Epoch [1/60], Batch [200/447], Loss: 3.9156
Epoch [1/60], Batch [210/447], Loss: 3.9692
Epoch [1/60], Batch [220/447], Loss: 3.9410

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [2/60], Batch [0/447], Loss: 3.8801
Epoch [2/60], Batch [10/447], Loss: 3.9728
Epoch [2/60], Batch [20/447], Loss: 3.9311
Epoch [2/60], Batch [30/447], Loss: 3.7984
Epoch [2/60], Batch [40/447], Loss: 3.7920
Epoch [2/60], Batch [50/447], Loss: 3.8910
Epoch [2/60], Batch [60/447], Loss: 3.8854
Epoch [2/60], Batch [70/447], Loss: 3.9136
Epoch [2/60], Batch [80/447], Loss: 3.9235
Epoch [2/60], Batch [90/447], Loss: 3.9382
Epoch [2/60], Batch [100/447], Loss: 3.8463
Epoch [2/60], Batch [110/447], Loss: 3.9208
Epoch [2/60], Batch [120/447], Loss: 3.9366
Epoch [2/60], Batch [130/447], Loss: 3.9198
Epoch [2/60], Batch [140/447], Loss: 3.7187
Epoch [2/60], Batch [150/447], Loss: 3.8598
Epoch [2/60], Batch [160/447], Loss: 3.9881
Epoch [2/60], Batch [170/447], Loss: 3.6450
Epoch [2/60], Batch [180/447], Loss: 3.9648
Epoch [2/60], Batch [190/447], Loss: 4.0107
Epoch [2/60], Batch [200/447], Loss: 3.7854
Epoch [2/60], Batch [210/447], Loss: 3.7481
Epoch [2/60], Batch [220/447], Loss: 3.8908

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [3/60], Batch [0/447], Loss: 3.4842
Epoch [3/60], Batch [10/447], Loss: 3.6066
Epoch [3/60], Batch [20/447], Loss: 3.7099
Epoch [3/60], Batch [30/447], Loss: 3.9573
Epoch [3/60], Batch [40/447], Loss: 3.5953
Epoch [3/60], Batch [50/447], Loss: 3.7374
Epoch [3/60], Batch [60/447], Loss: 3.6314
Epoch [3/60], Batch [70/447], Loss: 3.9143
Epoch [3/60], Batch [80/447], Loss: 3.5145
Epoch [3/60], Batch [90/447], Loss: 3.5433
Epoch [3/60], Batch [100/447], Loss: 3.7147
Epoch [3/60], Batch [110/447], Loss: 3.4995
Epoch [3/60], Batch [120/447], Loss: 3.6541
Epoch [3/60], Batch [130/447], Loss: 3.6522
Epoch [3/60], Batch [140/447], Loss: 3.8267
Epoch [3/60], Batch [150/447], Loss: 3.9001
Epoch [3/60], Batch [160/447], Loss: 3.8083
Epoch [3/60], Batch [170/447], Loss: 3.8262
Epoch [3/60], Batch [180/447], Loss: 3.7502
Epoch [3/60], Batch [190/447], Loss: 3.5219
Epoch [3/60], Batch [200/447], Loss: 3.4851
Epoch [3/60], Batch [210/447], Loss: 3.6102
Epoch [3/60], Batch [220/447], Loss: 3.9605

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [4/60], Batch [0/447], Loss: 3.5607
Epoch [4/60], Batch [10/447], Loss: 3.5351
Epoch [4/60], Batch [20/447], Loss: 3.3687
Epoch [4/60], Batch [30/447], Loss: 3.6152
Epoch [4/60], Batch [40/447], Loss: 3.7172
Epoch [4/60], Batch [50/447], Loss: 3.6673
Epoch [4/60], Batch [60/447], Loss: 3.8613
Epoch [4/60], Batch [70/447], Loss: 3.6323
Epoch [4/60], Batch [80/447], Loss: 3.8471
Epoch [4/60], Batch [90/447], Loss: 3.6949
Epoch [4/60], Batch [100/447], Loss: 3.5631
Epoch [4/60], Batch [110/447], Loss: 3.4919
Epoch [4/60], Batch [120/447], Loss: 3.7906
Epoch [4/60], Batch [130/447], Loss: 3.6637
Epoch [4/60], Batch [140/447], Loss: 3.6633
Epoch [4/60], Batch [150/447], Loss: 3.7784
Epoch [4/60], Batch [160/447], Loss: 3.4016
Epoch [4/60], Batch [170/447], Loss: 3.4395
Epoch [4/60], Batch [180/447], Loss: 3.7622
Epoch [4/60], Batch [190/447], Loss: 3.9744
Epoch [4/60], Batch [200/447], Loss: 3.5419
Epoch [4/60], Batch [210/447], Loss: 3.9383
Epoch [4/60], Batch [220/447], Loss: 3.7399

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [5/60], Batch [0/447], Loss: 3.7356
Epoch [5/60], Batch [10/447], Loss: 3.5614
Epoch [5/60], Batch [20/447], Loss: 3.2514
Epoch [5/60], Batch [30/447], Loss: 3.5709
Epoch [5/60], Batch [40/447], Loss: 3.4015
Epoch [5/60], Batch [50/447], Loss: 3.6733
Epoch [5/60], Batch [60/447], Loss: 3.4899
Epoch [5/60], Batch [70/447], Loss: 3.3764
Epoch [5/60], Batch [80/447], Loss: 3.8476
Epoch [5/60], Batch [90/447], Loss: 3.3766
Epoch [5/60], Batch [100/447], Loss: 3.1127
Epoch [5/60], Batch [110/447], Loss: 3.4687
Epoch [5/60], Batch [120/447], Loss: 3.5598
Epoch [5/60], Batch [130/447], Loss: 3.6664
Epoch [5/60], Batch [140/447], Loss: 3.5143
Epoch [5/60], Batch [150/447], Loss: 3.6488
Epoch [5/60], Batch [160/447], Loss: 3.7080
Epoch [5/60], Batch [170/447], Loss: 3.7134
Epoch [5/60], Batch [180/447], Loss: 3.2893
Epoch [5/60], Batch [190/447], Loss: 3.5090
Epoch [5/60], Batch [200/447], Loss: 3.5069
Epoch [5/60], Batch [210/447], Loss: 3.6489
Epoch [5/60], Batch [220/447], Loss: 3.5414

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [6/60], Batch [0/447], Loss: 3.1736
Epoch [6/60], Batch [10/447], Loss: 3.6282
Epoch [6/60], Batch [20/447], Loss: 3.1019
Epoch [6/60], Batch [30/447], Loss: 3.6241
Epoch [6/60], Batch [40/447], Loss: 3.5438
Epoch [6/60], Batch [50/447], Loss: 3.5310
Epoch [6/60], Batch [60/447], Loss: 3.7164
Epoch [6/60], Batch [70/447], Loss: 3.5047
Epoch [6/60], Batch [80/447], Loss: 3.3676
Epoch [6/60], Batch [90/447], Loss: 3.2707
Epoch [6/60], Batch [100/447], Loss: 3.4400
Epoch [6/60], Batch [110/447], Loss: 3.5263
Epoch [6/60], Batch [120/447], Loss: 3.3640
Epoch [6/60], Batch [130/447], Loss: 3.3769
Epoch [6/60], Batch [140/447], Loss: 3.5791
Epoch [6/60], Batch [150/447], Loss: 3.5367
Epoch [6/60], Batch [160/447], Loss: 3.5208
Epoch [6/60], Batch [170/447], Loss: 3.4013
Epoch [6/60], Batch [180/447], Loss: 3.8455
Epoch [6/60], Batch [190/447], Loss: 3.5434
Epoch [6/60], Batch [200/447], Loss: 3.6247
Epoch [6/60], Batch [210/447], Loss: 3.5040
Epoch [6/60], Batch [220/447], Loss: 3.3566

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [7/60], Batch [0/447], Loss: 3.1515
Epoch [7/60], Batch [10/447], Loss: 3.2981
Epoch [7/60], Batch [20/447], Loss: 3.4931
Epoch [7/60], Batch [30/447], Loss: 3.5399
Epoch [7/60], Batch [40/447], Loss: 3.1213
Epoch [7/60], Batch [50/447], Loss: 2.9973
Epoch [7/60], Batch [60/447], Loss: 3.4994
Epoch [7/60], Batch [70/447], Loss: 3.2738
Epoch [7/60], Batch [80/447], Loss: 3.1053
Epoch [7/60], Batch [90/447], Loss: 3.4159
Epoch [7/60], Batch [100/447], Loss: 3.1148
Epoch [7/60], Batch [110/447], Loss: 3.3019
Epoch [7/60], Batch [120/447], Loss: 3.7599
Epoch [7/60], Batch [130/447], Loss: 3.6305
Epoch [7/60], Batch [140/447], Loss: 3.6540
Epoch [7/60], Batch [150/447], Loss: 3.1055
Epoch [7/60], Batch [160/447], Loss: 3.5818
Epoch [7/60], Batch [170/447], Loss: 3.5007
Epoch [7/60], Batch [180/447], Loss: 3.3358
Epoch [7/60], Batch [190/447], Loss: 3.3752
Epoch [7/60], Batch [200/447], Loss: 3.4459
Epoch [7/60], Batch [210/447], Loss: 3.3775
Epoch [7/60], Batch [220/447], Loss: 3.7190

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [8/60], Batch [0/447], Loss: 3.7456
Epoch [8/60], Batch [10/447], Loss: 3.2309
Epoch [8/60], Batch [20/447], Loss: 3.2992
Epoch [8/60], Batch [30/447], Loss: 3.3760
Epoch [8/60], Batch [40/447], Loss: 3.2251
Epoch [8/60], Batch [50/447], Loss: 3.4284
Epoch [8/60], Batch [60/447], Loss: 3.0418
Epoch [8/60], Batch [70/447], Loss: 3.8750
Epoch [8/60], Batch [80/447], Loss: 3.5441
Epoch [8/60], Batch [90/447], Loss: 3.2490
Epoch [8/60], Batch [100/447], Loss: 3.2041
Epoch [8/60], Batch [110/447], Loss: 3.3605
Epoch [8/60], Batch [120/447], Loss: 3.6184
Epoch [8/60], Batch [130/447], Loss: 3.2613
Epoch [8/60], Batch [140/447], Loss: 3.5556
Epoch [8/60], Batch [150/447], Loss: 3.5482
Epoch [8/60], Batch [160/447], Loss: 3.1342
Epoch [8/60], Batch [170/447], Loss: 3.3604
Epoch [8/60], Batch [180/447], Loss: 3.1949
Epoch [8/60], Batch [190/447], Loss: 3.3107
Epoch [8/60], Batch [200/447], Loss: 3.4298
Epoch [8/60], Batch [210/447], Loss: 2.9672
Epoch [8/60], Batch [220/447], Loss: 3.0386

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [9/60], Batch [0/447], Loss: 3.0878
Epoch [9/60], Batch [10/447], Loss: 2.8491
Epoch [9/60], Batch [20/447], Loss: 3.5731
Epoch [9/60], Batch [30/447], Loss: 3.0337
Epoch [9/60], Batch [40/447], Loss: 2.8423
Epoch [9/60], Batch [50/447], Loss: 3.2845
Epoch [9/60], Batch [60/447], Loss: 3.1031
Epoch [9/60], Batch [70/447], Loss: 3.3502
Epoch [9/60], Batch [80/447], Loss: 3.4758
Epoch [9/60], Batch [90/447], Loss: 3.4495
Epoch [9/60], Batch [100/447], Loss: 3.2836
Epoch [9/60], Batch [110/447], Loss: 3.3611
Epoch [9/60], Batch [120/447], Loss: 3.1433
Epoch [9/60], Batch [130/447], Loss: 3.1919
Epoch [9/60], Batch [140/447], Loss: 3.3843
Epoch [9/60], Batch [150/447], Loss: 3.1589
Epoch [9/60], Batch [160/447], Loss: 3.2651
Epoch [9/60], Batch [170/447], Loss: 3.3421
Epoch [9/60], Batch [180/447], Loss: 3.4076
Epoch [9/60], Batch [190/447], Loss: 3.2078
Epoch [9/60], Batch [200/447], Loss: 3.2123
Epoch [9/60], Batch [210/447], Loss: 3.3545
Epoch [9/60], Batch [220/447], Loss: 3.1830

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [10/60], Batch [0/447], Loss: 3.1752
Epoch [10/60], Batch [10/447], Loss: 3.1628
Epoch [10/60], Batch [20/447], Loss: 3.1671
Epoch [10/60], Batch [30/447], Loss: 3.4041
Epoch [10/60], Batch [40/447], Loss: 3.1227
Epoch [10/60], Batch [50/447], Loss: 3.1909
Epoch [10/60], Batch [60/447], Loss: 3.2640
Epoch [10/60], Batch [70/447], Loss: 3.2890
Epoch [10/60], Batch [80/447], Loss: 3.2782
Epoch [10/60], Batch [90/447], Loss: 3.2271
Epoch [10/60], Batch [100/447], Loss: 2.9120
Epoch [10/60], Batch [110/447], Loss: 3.2929
Epoch [10/60], Batch [120/447], Loss: 3.0634
Epoch [10/60], Batch [130/447], Loss: 3.1733
Epoch [10/60], Batch [140/447], Loss: 3.6246
Epoch [10/60], Batch [150/447], Loss: 3.0517
Epoch [10/60], Batch [160/447], Loss: 3.3613
Epoch [10/60], Batch [170/447], Loss: 2.7373
Epoch [10/60], Batch [180/447], Loss: 3.2626
Epoch [10/60], Batch [190/447], Loss: 3.1711
Epoch [10/60], Batch [200/447], Loss: 3.3238
Epoch [10/60], Batch [210/447], Loss: 3.1818
Epoch [10/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [11/60], Batch [0/447], Loss: 3.4331
Epoch [11/60], Batch [10/447], Loss: 2.8964
Epoch [11/60], Batch [20/447], Loss: 2.8642
Epoch [11/60], Batch [30/447], Loss: 3.3570
Epoch [11/60], Batch [40/447], Loss: 2.8759
Epoch [11/60], Batch [50/447], Loss: 2.8479
Epoch [11/60], Batch [60/447], Loss: 2.8542
Epoch [11/60], Batch [70/447], Loss: 3.0400
Epoch [11/60], Batch [80/447], Loss: 2.5801
Epoch [11/60], Batch [90/447], Loss: 3.2285
Epoch [11/60], Batch [100/447], Loss: 3.5604
Epoch [11/60], Batch [110/447], Loss: 3.1349
Epoch [11/60], Batch [120/447], Loss: 3.0930
Epoch [11/60], Batch [130/447], Loss: 3.1273
Epoch [11/60], Batch [140/447], Loss: 2.8836
Epoch [11/60], Batch [150/447], Loss: 3.5283
Epoch [11/60], Batch [160/447], Loss: 2.5768
Epoch [11/60], Batch [170/447], Loss: 3.1327
Epoch [11/60], Batch [180/447], Loss: 2.9466
Epoch [11/60], Batch [190/447], Loss: 3.3125
Epoch [11/60], Batch [200/447], Loss: 3.0470
Epoch [11/60], Batch [210/447], Loss: 2.9863
Epoch [11/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [12/60], Batch [0/447], Loss: 2.9558
Epoch [12/60], Batch [10/447], Loss: 3.6508
Epoch [12/60], Batch [20/447], Loss: 3.2281
Epoch [12/60], Batch [30/447], Loss: 3.4705
Epoch [12/60], Batch [40/447], Loss: 3.4282
Epoch [12/60], Batch [50/447], Loss: 3.2277
Epoch [12/60], Batch [60/447], Loss: 2.6158
Epoch [12/60], Batch [70/447], Loss: 2.9839
Epoch [12/60], Batch [80/447], Loss: 2.8615
Epoch [12/60], Batch [90/447], Loss: 2.9272
Epoch [12/60], Batch [100/447], Loss: 3.0301
Epoch [12/60], Batch [110/447], Loss: 3.2857
Epoch [12/60], Batch [120/447], Loss: 3.0967
Epoch [12/60], Batch [130/447], Loss: 3.2446
Epoch [12/60], Batch [140/447], Loss: 3.1109
Epoch [12/60], Batch [150/447], Loss: 3.1031
Epoch [12/60], Batch [160/447], Loss: 3.0241
Epoch [12/60], Batch [170/447], Loss: 3.4128
Epoch [12/60], Batch [180/447], Loss: 3.3729
Epoch [12/60], Batch [190/447], Loss: 3.0028
Epoch [12/60], Batch [200/447], Loss: 3.2041
Epoch [12/60], Batch [210/447], Loss: 3.3189
Epoch [12/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [13/60], Batch [0/447], Loss: 2.9916
Epoch [13/60], Batch [10/447], Loss: 2.9578
Epoch [13/60], Batch [20/447], Loss: 2.9363
Epoch [13/60], Batch [30/447], Loss: 3.1031
Epoch [13/60], Batch [40/447], Loss: 3.2903
Epoch [13/60], Batch [50/447], Loss: 2.7318
Epoch [13/60], Batch [60/447], Loss: 3.0821
Epoch [13/60], Batch [70/447], Loss: 2.7986
Epoch [13/60], Batch [80/447], Loss: 3.1331
Epoch [13/60], Batch [90/447], Loss: 2.6849
Epoch [13/60], Batch [100/447], Loss: 3.4741
Epoch [13/60], Batch [110/447], Loss: 3.1005
Epoch [13/60], Batch [120/447], Loss: 3.0574
Epoch [13/60], Batch [130/447], Loss: 2.5147
Epoch [13/60], Batch [140/447], Loss: 3.1884
Epoch [13/60], Batch [150/447], Loss: 2.4096
Epoch [13/60], Batch [160/447], Loss: 3.0679
Epoch [13/60], Batch [170/447], Loss: 2.9251
Epoch [13/60], Batch [180/447], Loss: 3.2707
Epoch [13/60], Batch [190/447], Loss: 3.6417
Epoch [13/60], Batch [200/447], Loss: 2.7873
Epoch [13/60], Batch [210/447], Loss: 2.6855
Epoch [13/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [14/60], Batch [0/447], Loss: 3.1572
Epoch [14/60], Batch [10/447], Loss: 2.9987
Epoch [14/60], Batch [20/447], Loss: 3.1725
Epoch [14/60], Batch [30/447], Loss: 3.2379
Epoch [14/60], Batch [40/447], Loss: 3.0430
Epoch [14/60], Batch [50/447], Loss: 2.6916
Epoch [14/60], Batch [60/447], Loss: 2.7145
Epoch [14/60], Batch [70/447], Loss: 2.6348
Epoch [14/60], Batch [80/447], Loss: 3.2395
Epoch [14/60], Batch [90/447], Loss: 2.9183
Epoch [14/60], Batch [100/447], Loss: 3.5781
Epoch [14/60], Batch [110/447], Loss: 2.3512
Epoch [14/60], Batch [120/447], Loss: 2.7859
Epoch [14/60], Batch [130/447], Loss: 2.9500
Epoch [14/60], Batch [140/447], Loss: 2.5333
Epoch [14/60], Batch [150/447], Loss: 2.6450
Epoch [14/60], Batch [160/447], Loss: 3.1204
Epoch [14/60], Batch [170/447], Loss: 3.1832
Epoch [14/60], Batch [180/447], Loss: 3.1761
Epoch [14/60], Batch [190/447], Loss: 2.7307
Epoch [14/60], Batch [200/447], Loss: 3.0666
Epoch [14/60], Batch [210/447], Loss: 3.4165
Epoch [14/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [15/60], Batch [0/447], Loss: 2.6547
Epoch [15/60], Batch [10/447], Loss: 2.7942
Epoch [15/60], Batch [20/447], Loss: 2.8543
Epoch [15/60], Batch [30/447], Loss: 2.5285
Epoch [15/60], Batch [40/447], Loss: 3.1597
Epoch [15/60], Batch [50/447], Loss: 3.4233
Epoch [15/60], Batch [60/447], Loss: 2.6338
Epoch [15/60], Batch [70/447], Loss: 2.9779
Epoch [15/60], Batch [80/447], Loss: 3.0325
Epoch [15/60], Batch [90/447], Loss: 3.2906
Epoch [15/60], Batch [100/447], Loss: 3.0835
Epoch [15/60], Batch [110/447], Loss: 2.8293
Epoch [15/60], Batch [120/447], Loss: 2.5281
Epoch [15/60], Batch [130/447], Loss: 3.3148
Epoch [15/60], Batch [140/447], Loss: 2.3266
Epoch [15/60], Batch [150/447], Loss: 2.7549
Epoch [15/60], Batch [160/447], Loss: 2.9741
Epoch [15/60], Batch [170/447], Loss: 2.9825
Epoch [15/60], Batch [180/447], Loss: 2.5991
Epoch [15/60], Batch [190/447], Loss: 2.7149
Epoch [15/60], Batch [200/447], Loss: 3.7231
Epoch [15/60], Batch [210/447], Loss: 3.2343
Epoch [15/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [16/60], Batch [0/447], Loss: 2.8682
Epoch [16/60], Batch [10/447], Loss: 2.6278
Epoch [16/60], Batch [20/447], Loss: 2.7665
Epoch [16/60], Batch [30/447], Loss: 2.8664
Epoch [16/60], Batch [40/447], Loss: 3.0324
Epoch [16/60], Batch [50/447], Loss: 3.2480
Epoch [16/60], Batch [60/447], Loss: 2.6031
Epoch [16/60], Batch [70/447], Loss: 3.1078
Epoch [16/60], Batch [80/447], Loss: 3.0127
Epoch [16/60], Batch [90/447], Loss: 2.8421
Epoch [16/60], Batch [100/447], Loss: 3.0147
Epoch [16/60], Batch [110/447], Loss: 3.0694
Epoch [16/60], Batch [120/447], Loss: 3.0561
Epoch [16/60], Batch [130/447], Loss: 2.5169
Epoch [16/60], Batch [140/447], Loss: 3.2750
Epoch [16/60], Batch [150/447], Loss: 2.9783
Epoch [16/60], Batch [160/447], Loss: 2.9269
Epoch [16/60], Batch [170/447], Loss: 2.8810
Epoch [16/60], Batch [180/447], Loss: 2.7229
Epoch [16/60], Batch [190/447], Loss: 2.7299
Epoch [16/60], Batch [200/447], Loss: 3.1167
Epoch [16/60], Batch [210/447], Loss: 2.7999
Epoch [16/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [17/60], Batch [0/447], Loss: 2.3117
Epoch [17/60], Batch [10/447], Loss: 3.2189
Epoch [17/60], Batch [20/447], Loss: 2.7213
Epoch [17/60], Batch [30/447], Loss: 3.3065
Epoch [17/60], Batch [40/447], Loss: 2.9836
Epoch [17/60], Batch [50/447], Loss: 3.1169
Epoch [17/60], Batch [60/447], Loss: 2.5961
Epoch [17/60], Batch [70/447], Loss: 2.4403
Epoch [17/60], Batch [80/447], Loss: 2.9216
Epoch [17/60], Batch [90/447], Loss: 3.4567
Epoch [17/60], Batch [100/447], Loss: 3.1888
Epoch [17/60], Batch [110/447], Loss: 2.5115
Epoch [17/60], Batch [120/447], Loss: 2.8802
Epoch [17/60], Batch [130/447], Loss: 2.5356
Epoch [17/60], Batch [140/447], Loss: 2.9452
Epoch [17/60], Batch [150/447], Loss: 3.2293
Epoch [17/60], Batch [160/447], Loss: 2.9431
Epoch [17/60], Batch [170/447], Loss: 2.4248
Epoch [17/60], Batch [180/447], Loss: 3.2834
Epoch [17/60], Batch [190/447], Loss: 2.4434
Epoch [17/60], Batch [200/447], Loss: 2.7288
Epoch [17/60], Batch [210/447], Loss: 2.8683
Epoch [17/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [18/60], Batch [0/447], Loss: 2.7933
Epoch [18/60], Batch [10/447], Loss: 3.1863
Epoch [18/60], Batch [20/447], Loss: 3.1537
Epoch [18/60], Batch [30/447], Loss: 2.6730
Epoch [18/60], Batch [40/447], Loss: 2.7291
Epoch [18/60], Batch [50/447], Loss: 3.4903
Epoch [18/60], Batch [60/447], Loss: 2.6430
Epoch [18/60], Batch [70/447], Loss: 2.7539
Epoch [18/60], Batch [80/447], Loss: 3.1825
Epoch [18/60], Batch [90/447], Loss: 2.6424
Epoch [18/60], Batch [100/447], Loss: 3.5564
Epoch [18/60], Batch [110/447], Loss: 2.5211
Epoch [18/60], Batch [120/447], Loss: 2.2210
Epoch [18/60], Batch [130/447], Loss: 3.1461
Epoch [18/60], Batch [140/447], Loss: 1.7361
Epoch [18/60], Batch [150/447], Loss: 2.8323
Epoch [18/60], Batch [160/447], Loss: 2.9967
Epoch [18/60], Batch [170/447], Loss: 3.0274
Epoch [18/60], Batch [180/447], Loss: 2.7244
Epoch [18/60], Batch [190/447], Loss: 2.8667
Epoch [18/60], Batch [200/447], Loss: 2.7415
Epoch [18/60], Batch [210/447], Loss: 3.2000
Epoch [18/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [19/60], Batch [0/447], Loss: 3.2821
Epoch [19/60], Batch [10/447], Loss: 2.8998
Epoch [19/60], Batch [20/447], Loss: 2.8846
Epoch [19/60], Batch [30/447], Loss: 2.9111
Epoch [19/60], Batch [40/447], Loss: 2.5723
Epoch [19/60], Batch [50/447], Loss: 2.4119
Epoch [19/60], Batch [60/447], Loss: 2.0499
Epoch [19/60], Batch [70/447], Loss: 2.5792
Epoch [19/60], Batch [80/447], Loss: 2.8345
Epoch [19/60], Batch [90/447], Loss: 2.8337
Epoch [19/60], Batch [100/447], Loss: 2.6459
Epoch [19/60], Batch [110/447], Loss: 2.7057
Epoch [19/60], Batch [120/447], Loss: 2.3485
Epoch [19/60], Batch [130/447], Loss: 3.0368
Epoch [19/60], Batch [140/447], Loss: 2.6665
Epoch [19/60], Batch [150/447], Loss: 3.3685
Epoch [19/60], Batch [160/447], Loss: 2.8019
Epoch [19/60], Batch [170/447], Loss: 2.6194
Epoch [19/60], Batch [180/447], Loss: 2.4027
Epoch [19/60], Batch [190/447], Loss: 2.2281
Epoch [19/60], Batch [200/447], Loss: 2.8037
Epoch [19/60], Batch [210/447], Loss: 2.8781
Epoch [19/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [20/60], Batch [0/447], Loss: 2.3195
Epoch [20/60], Batch [10/447], Loss: 2.8263
Epoch [20/60], Batch [20/447], Loss: 2.4718
Epoch [20/60], Batch [30/447], Loss: 2.2095
Epoch [20/60], Batch [40/447], Loss: 2.6910
Epoch [20/60], Batch [50/447], Loss: 3.4940
Epoch [20/60], Batch [60/447], Loss: 2.6810
Epoch [20/60], Batch [70/447], Loss: 2.8416
Epoch [20/60], Batch [80/447], Loss: 2.4890
Epoch [20/60], Batch [90/447], Loss: 3.0181
Epoch [20/60], Batch [100/447], Loss: 2.8471
Epoch [20/60], Batch [110/447], Loss: 2.6862
Epoch [20/60], Batch [120/447], Loss: 2.9567
Epoch [20/60], Batch [130/447], Loss: 2.6463
Epoch [20/60], Batch [140/447], Loss: 2.9033
Epoch [20/60], Batch [150/447], Loss: 2.6710
Epoch [20/60], Batch [160/447], Loss: 3.1925
Epoch [20/60], Batch [170/447], Loss: 2.7153
Epoch [20/60], Batch [180/447], Loss: 2.4515
Epoch [20/60], Batch [190/447], Loss: 2.7934
Epoch [20/60], Batch [200/447], Loss: 2.5150
Epoch [20/60], Batch [210/447], Loss: 3.1971
Epoch [20/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [21/60], Batch [0/447], Loss: 2.2591
Epoch [21/60], Batch [10/447], Loss: 2.7980
Epoch [21/60], Batch [20/447], Loss: 2.7251
Epoch [21/60], Batch [30/447], Loss: 3.2580
Epoch [21/60], Batch [40/447], Loss: 2.5076
Epoch [21/60], Batch [50/447], Loss: 2.7558
Epoch [21/60], Batch [60/447], Loss: 2.5153
Epoch [21/60], Batch [70/447], Loss: 2.3246
Epoch [21/60], Batch [80/447], Loss: 3.2859
Epoch [21/60], Batch [90/447], Loss: 2.7090
Epoch [21/60], Batch [100/447], Loss: 2.4793
Epoch [21/60], Batch [110/447], Loss: 2.5407
Epoch [21/60], Batch [120/447], Loss: 3.1147
Epoch [21/60], Batch [130/447], Loss: 2.6011
Epoch [21/60], Batch [140/447], Loss: 2.0856
Epoch [21/60], Batch [150/447], Loss: 3.2385
Epoch [21/60], Batch [160/447], Loss: 3.4384
Epoch [21/60], Batch [170/447], Loss: 2.6248
Epoch [21/60], Batch [180/447], Loss: 2.1561
Epoch [21/60], Batch [190/447], Loss: 3.0454
Epoch [21/60], Batch [200/447], Loss: 2.9244
Epoch [21/60], Batch [210/447], Loss: 2.7544
Epoch [21/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [22/60], Batch [0/447], Loss: 3.4489
Epoch [22/60], Batch [10/447], Loss: 2.8035
Epoch [22/60], Batch [20/447], Loss: 2.6382
Epoch [22/60], Batch [30/447], Loss: 2.6359
Epoch [22/60], Batch [40/447], Loss: 2.7564
Epoch [22/60], Batch [50/447], Loss: 3.0926
Epoch [22/60], Batch [60/447], Loss: 2.9114
Epoch [22/60], Batch [70/447], Loss: 2.8651
Epoch [22/60], Batch [80/447], Loss: 1.7762
Epoch [22/60], Batch [90/447], Loss: 3.3022
Epoch [22/60], Batch [100/447], Loss: 2.8338
Epoch [22/60], Batch [110/447], Loss: 2.7310
Epoch [22/60], Batch [120/447], Loss: 3.2853
Epoch [22/60], Batch [130/447], Loss: 2.9169
Epoch [22/60], Batch [140/447], Loss: 2.7762
Epoch [22/60], Batch [150/447], Loss: 2.1361
Epoch [22/60], Batch [160/447], Loss: 2.7919
Epoch [22/60], Batch [170/447], Loss: 2.9965
Epoch [22/60], Batch [180/447], Loss: 2.2604
Epoch [22/60], Batch [190/447], Loss: 2.9182
Epoch [22/60], Batch [200/447], Loss: 2.8207
Epoch [22/60], Batch [210/447], Loss: 1.9526
Epoch [22/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [23/60], Batch [0/447], Loss: 2.8286
Epoch [23/60], Batch [10/447], Loss: 3.0208
Epoch [23/60], Batch [20/447], Loss: 2.7029
Epoch [23/60], Batch [30/447], Loss: 3.0261
Epoch [23/60], Batch [40/447], Loss: 2.6316
Epoch [23/60], Batch [50/447], Loss: 2.5563
Epoch [23/60], Batch [60/447], Loss: 3.0759
Epoch [23/60], Batch [70/447], Loss: 2.5461
Epoch [23/60], Batch [80/447], Loss: 2.7757
Epoch [23/60], Batch [90/447], Loss: 3.1485
Epoch [23/60], Batch [100/447], Loss: 2.8532
Epoch [23/60], Batch [110/447], Loss: 2.1114
Epoch [23/60], Batch [120/447], Loss: 3.1301
Epoch [23/60], Batch [130/447], Loss: 2.9634
Epoch [23/60], Batch [140/447], Loss: 2.7326
Epoch [23/60], Batch [150/447], Loss: 2.4373
Epoch [23/60], Batch [160/447], Loss: 2.8468
Epoch [23/60], Batch [170/447], Loss: 2.3604
Epoch [23/60], Batch [180/447], Loss: 2.2714
Epoch [23/60], Batch [190/447], Loss: 2.5618
Epoch [23/60], Batch [200/447], Loss: 2.4517
Epoch [23/60], Batch [210/447], Loss: 2.8363
Epoch [23/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [24/60], Batch [0/447], Loss: 2.5686
Epoch [24/60], Batch [10/447], Loss: 2.8869
Epoch [24/60], Batch [20/447], Loss: 2.5239
Epoch [24/60], Batch [30/447], Loss: 2.2715
Epoch [24/60], Batch [40/447], Loss: 2.0368
Epoch [24/60], Batch [50/447], Loss: 2.7110
Epoch [24/60], Batch [60/447], Loss: 2.8947
Epoch [24/60], Batch [70/447], Loss: 2.3346
Epoch [24/60], Batch [80/447], Loss: 2.6125
Epoch [24/60], Batch [90/447], Loss: 3.1879
Epoch [24/60], Batch [100/447], Loss: 2.7125
Epoch [24/60], Batch [110/447], Loss: 2.2464
Epoch [24/60], Batch [120/447], Loss: 2.5082
Epoch [24/60], Batch [130/447], Loss: 2.8492
Epoch [24/60], Batch [140/447], Loss: 3.1783
Epoch [24/60], Batch [150/447], Loss: 2.6334
Epoch [24/60], Batch [160/447], Loss: 2.4868
Epoch [24/60], Batch [170/447], Loss: 2.0143
Epoch [24/60], Batch [180/447], Loss: 2.9494
Epoch [24/60], Batch [190/447], Loss: 2.9048
Epoch [24/60], Batch [200/447], Loss: 1.9743
Epoch [24/60], Batch [210/447], Loss: 2.4442
Epoch [24/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [25/60], Batch [0/447], Loss: 2.0837
Epoch [25/60], Batch [10/447], Loss: 3.0725
Epoch [25/60], Batch [20/447], Loss: 2.3581
Epoch [25/60], Batch [30/447], Loss: 2.5598
Epoch [25/60], Batch [40/447], Loss: 2.2209
Epoch [25/60], Batch [50/447], Loss: 2.6969
Epoch [25/60], Batch [60/447], Loss: 2.4004
Epoch [25/60], Batch [70/447], Loss: 2.4924
Epoch [25/60], Batch [80/447], Loss: 2.7583
Epoch [25/60], Batch [90/447], Loss: 2.5879
Epoch [25/60], Batch [100/447], Loss: 2.6483
Epoch [25/60], Batch [110/447], Loss: 2.9296
Epoch [25/60], Batch [120/447], Loss: 2.6954
Epoch [25/60], Batch [130/447], Loss: 1.7605
Epoch [25/60], Batch [140/447], Loss: 2.7919
Epoch [25/60], Batch [150/447], Loss: 2.5357
Epoch [25/60], Batch [160/447], Loss: 2.3116
Epoch [25/60], Batch [170/447], Loss: 2.4924
Epoch [25/60], Batch [180/447], Loss: 2.3182
Epoch [25/60], Batch [190/447], Loss: 2.4867
Epoch [25/60], Batch [200/447], Loss: 2.3092
Epoch [25/60], Batch [210/447], Loss: 2.8762
Epoch [25/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [26/60], Batch [0/447], Loss: 2.8867
Epoch [26/60], Batch [10/447], Loss: 2.7127
Epoch [26/60], Batch [20/447], Loss: 2.2200
Epoch [26/60], Batch [30/447], Loss: 2.2654
Epoch [26/60], Batch [40/447], Loss: 2.0703
Epoch [26/60], Batch [50/447], Loss: 2.7881
Epoch [26/60], Batch [60/447], Loss: 3.0974
Epoch [26/60], Batch [70/447], Loss: 2.4591
Epoch [26/60], Batch [80/447], Loss: 2.2311
Epoch [26/60], Batch [90/447], Loss: 2.7906
Epoch [26/60], Batch [100/447], Loss: 3.1902
Epoch [26/60], Batch [110/447], Loss: 2.7307
Epoch [26/60], Batch [120/447], Loss: 2.7258
Epoch [26/60], Batch [130/447], Loss: 2.1596
Epoch [26/60], Batch [140/447], Loss: 2.6444
Epoch [26/60], Batch [150/447], Loss: 2.6376
Epoch [26/60], Batch [160/447], Loss: 1.9472
Epoch [26/60], Batch [170/447], Loss: 2.8592
Epoch [26/60], Batch [180/447], Loss: 2.2336
Epoch [26/60], Batch [190/447], Loss: 2.6410
Epoch [26/60], Batch [200/447], Loss: 2.9686
Epoch [26/60], Batch [210/447], Loss: 2.5879
Epoch [26/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [27/60], Batch [0/447], Loss: 2.5852
Epoch [27/60], Batch [10/447], Loss: 2.3949
Epoch [27/60], Batch [20/447], Loss: 2.9421
Epoch [27/60], Batch [30/447], Loss: 2.6541
Epoch [27/60], Batch [40/447], Loss: 2.6931
Epoch [27/60], Batch [50/447], Loss: 2.3907
Epoch [27/60], Batch [60/447], Loss: 2.9164
Epoch [27/60], Batch [70/447], Loss: 1.7231
Epoch [27/60], Batch [80/447], Loss: 2.5244
Epoch [27/60], Batch [90/447], Loss: 2.8409
Epoch [27/60], Batch [100/447], Loss: 2.3577
Epoch [27/60], Batch [110/447], Loss: 2.5644
Epoch [27/60], Batch [120/447], Loss: 3.2236
Epoch [27/60], Batch [130/447], Loss: 2.4578
Epoch [27/60], Batch [140/447], Loss: 2.1839
Epoch [27/60], Batch [150/447], Loss: 2.6473
Epoch [27/60], Batch [160/447], Loss: 2.1482
Epoch [27/60], Batch [170/447], Loss: 2.3441
Epoch [27/60], Batch [180/447], Loss: 2.7293
Epoch [27/60], Batch [190/447], Loss: 3.0382
Epoch [27/60], Batch [200/447], Loss: 2.0596
Epoch [27/60], Batch [210/447], Loss: 2.7348
Epoch [27/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [28/60], Batch [0/447], Loss: 3.1552
Epoch [28/60], Batch [10/447], Loss: 2.2713
Epoch [28/60], Batch [20/447], Loss: 2.3300
Epoch [28/60], Batch [30/447], Loss: 1.8910
Epoch [28/60], Batch [40/447], Loss: 2.9860
Epoch [28/60], Batch [50/447], Loss: 2.9482
Epoch [28/60], Batch [60/447], Loss: 3.0021
Epoch [28/60], Batch [70/447], Loss: 2.6125
Epoch [28/60], Batch [80/447], Loss: 2.4679
Epoch [28/60], Batch [90/447], Loss: 2.5135
Epoch [28/60], Batch [100/447], Loss: 2.8145
Epoch [28/60], Batch [110/447], Loss: 2.4882
Epoch [28/60], Batch [120/447], Loss: 2.7772
Epoch [28/60], Batch [130/447], Loss: 2.0263
Epoch [28/60], Batch [140/447], Loss: 2.5255
Epoch [28/60], Batch [150/447], Loss: 3.0787
Epoch [28/60], Batch [160/447], Loss: 2.3784
Epoch [28/60], Batch [170/447], Loss: 1.8939
Epoch [28/60], Batch [180/447], Loss: 3.2097
Epoch [28/60], Batch [190/447], Loss: 2.9150
Epoch [28/60], Batch [200/447], Loss: 3.0530
Epoch [28/60], Batch [210/447], Loss: 3.0444
Epoch [28/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [29/60], Batch [0/447], Loss: 2.7898
Epoch [29/60], Batch [10/447], Loss: 3.0133
Epoch [29/60], Batch [20/447], Loss: 2.3864
Epoch [29/60], Batch [30/447], Loss: 2.7149
Epoch [29/60], Batch [40/447], Loss: 2.3856
Epoch [29/60], Batch [50/447], Loss: 2.7881
Epoch [29/60], Batch [60/447], Loss: 2.0425
Epoch [29/60], Batch [70/447], Loss: 2.7826
Epoch [29/60], Batch [80/447], Loss: 2.4293
Epoch [29/60], Batch [90/447], Loss: 2.2615
Epoch [29/60], Batch [100/447], Loss: 2.3285
Epoch [29/60], Batch [110/447], Loss: 2.7489
Epoch [29/60], Batch [120/447], Loss: 2.9000
Epoch [29/60], Batch [130/447], Loss: 2.6317
Epoch [29/60], Batch [140/447], Loss: 2.1347
Epoch [29/60], Batch [150/447], Loss: 2.6988
Epoch [29/60], Batch [160/447], Loss: 2.6085
Epoch [29/60], Batch [170/447], Loss: 2.7531
Epoch [29/60], Batch [180/447], Loss: 3.4982
Epoch [29/60], Batch [190/447], Loss: 2.9194
Epoch [29/60], Batch [200/447], Loss: 2.5477
Epoch [29/60], Batch [210/447], Loss: 1.9079
Epoch [29/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [30/60], Batch [0/447], Loss: 1.9729
Epoch [30/60], Batch [10/447], Loss: 2.7413
Epoch [30/60], Batch [20/447], Loss: 2.9339
Epoch [30/60], Batch [30/447], Loss: 2.5316
Epoch [30/60], Batch [40/447], Loss: 3.2683
Epoch [30/60], Batch [50/447], Loss: 2.2553
Epoch [30/60], Batch [60/447], Loss: 2.0628
Epoch [30/60], Batch [70/447], Loss: 2.4072
Epoch [30/60], Batch [80/447], Loss: 2.2607
Epoch [30/60], Batch [90/447], Loss: 2.8565
Epoch [30/60], Batch [100/447], Loss: 2.5310
Epoch [30/60], Batch [110/447], Loss: 2.7474
Epoch [30/60], Batch [120/447], Loss: 2.9922
Epoch [30/60], Batch [130/447], Loss: 2.8114
Epoch [30/60], Batch [140/447], Loss: 2.5523
Epoch [30/60], Batch [150/447], Loss: 2.5489
Epoch [30/60], Batch [160/447], Loss: 2.5984
Epoch [30/60], Batch [170/447], Loss: 2.2777
Epoch [30/60], Batch [180/447], Loss: 2.2555
Epoch [30/60], Batch [190/447], Loss: 1.7445
Epoch [30/60], Batch [200/447], Loss: 2.9913
Epoch [30/60], Batch [210/447], Loss: 2.9275
Epoch [30/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [31/60], Batch [0/447], Loss: 2.6978
Epoch [31/60], Batch [10/447], Loss: 3.0496
Epoch [31/60], Batch [20/447], Loss: 2.7084
Epoch [31/60], Batch [30/447], Loss: 2.0452
Epoch [31/60], Batch [40/447], Loss: 2.7494
Epoch [31/60], Batch [50/447], Loss: 1.9106
Epoch [31/60], Batch [60/447], Loss: 2.1083
Epoch [31/60], Batch [70/447], Loss: 2.6556
Epoch [31/60], Batch [80/447], Loss: 2.4449
Epoch [31/60], Batch [90/447], Loss: 2.9147
Epoch [31/60], Batch [100/447], Loss: 2.7904
Epoch [31/60], Batch [110/447], Loss: 2.3596
Epoch [31/60], Batch [120/447], Loss: 2.5924
Epoch [31/60], Batch [130/447], Loss: 2.6415
Epoch [31/60], Batch [140/447], Loss: 1.6058
Epoch [31/60], Batch [150/447], Loss: 2.6411
Epoch [31/60], Batch [160/447], Loss: 2.9820
Epoch [31/60], Batch [170/447], Loss: 2.6879
Epoch [31/60], Batch [180/447], Loss: 2.6595
Epoch [31/60], Batch [190/447], Loss: 1.9707
Epoch [31/60], Batch [200/447], Loss: 1.8554
Epoch [31/60], Batch [210/447], Loss: 2.6855
Epoch [31/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [32/60], Batch [0/447], Loss: 2.3918
Epoch [32/60], Batch [10/447], Loss: 2.5366
Epoch [32/60], Batch [20/447], Loss: 2.6888
Epoch [32/60], Batch [30/447], Loss: 2.0994
Epoch [32/60], Batch [40/447], Loss: 2.5251
Epoch [32/60], Batch [50/447], Loss: 2.3329
Epoch [32/60], Batch [60/447], Loss: 2.1501
Epoch [32/60], Batch [70/447], Loss: 1.8221
Epoch [32/60], Batch [80/447], Loss: 1.9397
Epoch [32/60], Batch [90/447], Loss: 1.9028
Epoch [32/60], Batch [100/447], Loss: 2.2540
Epoch [32/60], Batch [110/447], Loss: 2.0579
Epoch [32/60], Batch [120/447], Loss: 2.8890
Epoch [32/60], Batch [130/447], Loss: 2.2569
Epoch [32/60], Batch [140/447], Loss: 2.0043
Epoch [32/60], Batch [150/447], Loss: 2.8234
Epoch [32/60], Batch [160/447], Loss: 2.7744
Epoch [32/60], Batch [170/447], Loss: 1.9206
Epoch [32/60], Batch [180/447], Loss: 2.1484
Epoch [32/60], Batch [190/447], Loss: 2.0959
Epoch [32/60], Batch [200/447], Loss: 2.6749
Epoch [32/60], Batch [210/447], Loss: 2.5646
Epoch [32/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [33/60], Batch [0/447], Loss: 2.4503
Epoch [33/60], Batch [10/447], Loss: 2.1326
Epoch [33/60], Batch [20/447], Loss: 2.5061
Epoch [33/60], Batch [30/447], Loss: 2.6079
Epoch [33/60], Batch [40/447], Loss: 2.8541
Epoch [33/60], Batch [50/447], Loss: 3.0462
Epoch [33/60], Batch [60/447], Loss: 1.9485
Epoch [33/60], Batch [70/447], Loss: 2.9348
Epoch [33/60], Batch [80/447], Loss: 2.2352
Epoch [33/60], Batch [90/447], Loss: 2.4582
Epoch [33/60], Batch [100/447], Loss: 2.7270
Epoch [33/60], Batch [110/447], Loss: 2.9419
Epoch [33/60], Batch [120/447], Loss: 1.8300
Epoch [33/60], Batch [130/447], Loss: 3.0989
Epoch [33/60], Batch [140/447], Loss: 2.4045
Epoch [33/60], Batch [150/447], Loss: 2.4198
Epoch [33/60], Batch [160/447], Loss: 1.5632
Epoch [33/60], Batch [170/447], Loss: 2.4089
Epoch [33/60], Batch [180/447], Loss: 3.1029
Epoch [33/60], Batch [190/447], Loss: 2.1431
Epoch [33/60], Batch [200/447], Loss: 2.2326
Epoch [33/60], Batch [210/447], Loss: 2.2810
Epoch [33/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [34/60], Batch [0/447], Loss: 2.6196
Epoch [34/60], Batch [10/447], Loss: 3.0560
Epoch [34/60], Batch [20/447], Loss: 2.4899
Epoch [34/60], Batch [30/447], Loss: 3.4113
Epoch [34/60], Batch [40/447], Loss: 1.8313
Epoch [34/60], Batch [50/447], Loss: 2.7861
Epoch [34/60], Batch [60/447], Loss: 2.4146
Epoch [34/60], Batch [70/447], Loss: 3.0190
Epoch [34/60], Batch [80/447], Loss: 2.4160
Epoch [34/60], Batch [90/447], Loss: 2.2956
Epoch [34/60], Batch [100/447], Loss: 2.1475
Epoch [34/60], Batch [110/447], Loss: 2.3880
Epoch [34/60], Batch [120/447], Loss: 2.1778
Epoch [34/60], Batch [130/447], Loss: 2.6857
Epoch [34/60], Batch [140/447], Loss: 2.3201
Epoch [34/60], Batch [150/447], Loss: 2.2666
Epoch [34/60], Batch [160/447], Loss: 2.5010
Epoch [34/60], Batch [170/447], Loss: 2.6307
Epoch [34/60], Batch [180/447], Loss: 2.0337
Epoch [34/60], Batch [190/447], Loss: 2.6440
Epoch [34/60], Batch [200/447], Loss: 2.5561
Epoch [34/60], Batch [210/447], Loss: 2.7207
Epoch [34/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [35/60], Batch [0/447], Loss: 1.7490
Epoch [35/60], Batch [10/447], Loss: 2.1810
Epoch [35/60], Batch [20/447], Loss: 1.8906
Epoch [35/60], Batch [30/447], Loss: 1.8488
Epoch [35/60], Batch [40/447], Loss: 1.8328
Epoch [35/60], Batch [50/447], Loss: 2.2431
Epoch [35/60], Batch [60/447], Loss: 2.7616
Epoch [35/60], Batch [70/447], Loss: 2.1009
Epoch [35/60], Batch [80/447], Loss: 2.4553
Epoch [35/60], Batch [90/447], Loss: 2.4948
Epoch [35/60], Batch [100/447], Loss: 2.5851
Epoch [35/60], Batch [110/447], Loss: 2.4010
Epoch [35/60], Batch [120/447], Loss: 2.2637
Epoch [35/60], Batch [130/447], Loss: 2.4323
Epoch [35/60], Batch [140/447], Loss: 2.4498
Epoch [35/60], Batch [150/447], Loss: 2.4307
Epoch [35/60], Batch [160/447], Loss: 2.6989
Epoch [35/60], Batch [170/447], Loss: 2.6015
Epoch [35/60], Batch [180/447], Loss: 2.9084
Epoch [35/60], Batch [190/447], Loss: 2.0322
Epoch [35/60], Batch [200/447], Loss: 2.8389
Epoch [35/60], Batch [210/447], Loss: 2.1511
Epoch [35/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [36/60], Batch [0/447], Loss: 1.7157
Epoch [36/60], Batch [10/447], Loss: 1.7324
Epoch [36/60], Batch [20/447], Loss: 2.1205
Epoch [36/60], Batch [30/447], Loss: 2.7410
Epoch [36/60], Batch [40/447], Loss: 2.2273
Epoch [36/60], Batch [50/447], Loss: 1.9731
Epoch [36/60], Batch [60/447], Loss: 2.0877
Epoch [36/60], Batch [70/447], Loss: 2.0189
Epoch [36/60], Batch [80/447], Loss: 2.3556
Epoch [36/60], Batch [90/447], Loss: 2.1681
Epoch [36/60], Batch [100/447], Loss: 1.7200
Epoch [36/60], Batch [110/447], Loss: 2.4976
Epoch [36/60], Batch [120/447], Loss: 2.4254
Epoch [36/60], Batch [130/447], Loss: 2.0238
Epoch [36/60], Batch [140/447], Loss: 1.9097
Epoch [36/60], Batch [150/447], Loss: 2.1047
Epoch [36/60], Batch [160/447], Loss: 2.5180
Epoch [36/60], Batch [170/447], Loss: 2.6719
Epoch [36/60], Batch [180/447], Loss: 2.4002
Epoch [36/60], Batch [190/447], Loss: 2.1838
Epoch [36/60], Batch [200/447], Loss: 2.0542
Epoch [36/60], Batch [210/447], Loss: 2.1114
Epoch [36/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [37/60], Batch [0/447], Loss: 1.9553
Epoch [37/60], Batch [10/447], Loss: 2.1819
Epoch [37/60], Batch [20/447], Loss: 2.0495
Epoch [37/60], Batch [30/447], Loss: 2.7076
Epoch [37/60], Batch [40/447], Loss: 3.0321
Epoch [37/60], Batch [50/447], Loss: 2.7800
Epoch [37/60], Batch [60/447], Loss: 2.2920
Epoch [37/60], Batch [70/447], Loss: 2.2453
Epoch [37/60], Batch [80/447], Loss: 2.5502
Epoch [37/60], Batch [90/447], Loss: 1.8596
Epoch [37/60], Batch [100/447], Loss: 2.8224
Epoch [37/60], Batch [110/447], Loss: 3.4768
Epoch [37/60], Batch [120/447], Loss: 2.6936
Epoch [37/60], Batch [130/447], Loss: 1.9781
Epoch [37/60], Batch [140/447], Loss: 2.0008
Epoch [37/60], Batch [150/447], Loss: 2.5948
Epoch [37/60], Batch [160/447], Loss: 1.9024
Epoch [37/60], Batch [170/447], Loss: 2.4826
Epoch [37/60], Batch [180/447], Loss: 2.7267
Epoch [37/60], Batch [190/447], Loss: 2.5776
Epoch [37/60], Batch [200/447], Loss: 2.7852
Epoch [37/60], Batch [210/447], Loss: 2.8897
Epoch [37/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [38/60], Batch [0/447], Loss: 2.2040
Epoch [38/60], Batch [10/447], Loss: 2.2982
Epoch [38/60], Batch [20/447], Loss: 2.2202
Epoch [38/60], Batch [30/447], Loss: 1.6270
Epoch [38/60], Batch [40/447], Loss: 2.9942
Epoch [38/60], Batch [50/447], Loss: 2.4656
Epoch [38/60], Batch [60/447], Loss: 1.8423
Epoch [38/60], Batch [70/447], Loss: 2.7243
Epoch [38/60], Batch [80/447], Loss: 2.0350
Epoch [38/60], Batch [90/447], Loss: 2.0786
Epoch [38/60], Batch [100/447], Loss: 2.8734
Epoch [38/60], Batch [110/447], Loss: 2.7249
Epoch [38/60], Batch [120/447], Loss: 2.6538
Epoch [38/60], Batch [130/447], Loss: 2.5449
Epoch [38/60], Batch [140/447], Loss: 2.1090
Epoch [38/60], Batch [150/447], Loss: 2.7034
Epoch [38/60], Batch [160/447], Loss: 1.1586
Epoch [38/60], Batch [170/447], Loss: 2.4540
Epoch [38/60], Batch [180/447], Loss: 2.1917
Epoch [38/60], Batch [190/447], Loss: 3.0234
Epoch [38/60], Batch [200/447], Loss: 3.0934
Epoch [38/60], Batch [210/447], Loss: 2.5020
Epoch [38/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [39/60], Batch [0/447], Loss: 1.9929
Epoch [39/60], Batch [10/447], Loss: 1.4246
Epoch [39/60], Batch [20/447], Loss: 2.7565
Epoch [39/60], Batch [30/447], Loss: 1.9925
Epoch [39/60], Batch [40/447], Loss: 2.3666
Epoch [39/60], Batch [50/447], Loss: 1.6339
Epoch [39/60], Batch [60/447], Loss: 3.1957
Epoch [39/60], Batch [70/447], Loss: 2.5058
Epoch [39/60], Batch [80/447], Loss: 2.7855
Epoch [39/60], Batch [90/447], Loss: 2.1258
Epoch [39/60], Batch [100/447], Loss: 2.2196
Epoch [39/60], Batch [110/447], Loss: 2.2665
Epoch [39/60], Batch [120/447], Loss: 2.0248
Epoch [39/60], Batch [130/447], Loss: 2.6587
Epoch [39/60], Batch [140/447], Loss: 2.4060
Epoch [39/60], Batch [150/447], Loss: 2.4432
Epoch [39/60], Batch [160/447], Loss: 1.7247
Epoch [39/60], Batch [170/447], Loss: 1.7050
Epoch [39/60], Batch [180/447], Loss: 2.1517
Epoch [39/60], Batch [190/447], Loss: 1.7419
Epoch [39/60], Batch [200/447], Loss: 2.2909
Epoch [39/60], Batch [210/447], Loss: 2.4176
Epoch [39/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [40/60], Batch [0/447], Loss: 2.4654
Epoch [40/60], Batch [10/447], Loss: 1.8409
Epoch [40/60], Batch [20/447], Loss: 3.0177
Epoch [40/60], Batch [30/447], Loss: 1.9670
Epoch [40/60], Batch [40/447], Loss: 2.2936
Epoch [40/60], Batch [50/447], Loss: 2.2272
Epoch [40/60], Batch [60/447], Loss: 2.7463
Epoch [40/60], Batch [70/447], Loss: 2.5559
Epoch [40/60], Batch [80/447], Loss: 2.4263
Epoch [40/60], Batch [90/447], Loss: 3.1944
Epoch [40/60], Batch [100/447], Loss: 2.9539
Epoch [40/60], Batch [110/447], Loss: 2.1591
Epoch [40/60], Batch [120/447], Loss: 2.0528
Epoch [40/60], Batch [130/447], Loss: 1.6525
Epoch [40/60], Batch [140/447], Loss: 2.6655
Epoch [40/60], Batch [150/447], Loss: 1.4489
Epoch [40/60], Batch [160/447], Loss: 1.7084
Epoch [40/60], Batch [170/447], Loss: 2.4159
Epoch [40/60], Batch [180/447], Loss: 2.1601
Epoch [40/60], Batch [190/447], Loss: 2.8475
Epoch [40/60], Batch [200/447], Loss: 2.8515
Epoch [40/60], Batch [210/447], Loss: 2.2872
Epoch [40/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [41/60], Batch [0/447], Loss: 2.5469
Epoch [41/60], Batch [10/447], Loss: 2.3988
Epoch [41/60], Batch [20/447], Loss: 2.3996
Epoch [41/60], Batch [30/447], Loss: 2.1413
Epoch [41/60], Batch [40/447], Loss: 2.8187
Epoch [41/60], Batch [50/447], Loss: 3.1268
Epoch [41/60], Batch [60/447], Loss: 1.9521
Epoch [41/60], Batch [70/447], Loss: 2.4577
Epoch [41/60], Batch [80/447], Loss: 2.2611
Epoch [41/60], Batch [90/447], Loss: 2.9603
Epoch [41/60], Batch [100/447], Loss: 2.2162
Epoch [41/60], Batch [110/447], Loss: 2.5479
Epoch [41/60], Batch [120/447], Loss: 2.4640
Epoch [41/60], Batch [130/447], Loss: 2.3499
Epoch [41/60], Batch [140/447], Loss: 2.1977
Epoch [41/60], Batch [150/447], Loss: 1.9196
Epoch [41/60], Batch [160/447], Loss: 2.4627
Epoch [41/60], Batch [170/447], Loss: 2.4861
Epoch [41/60], Batch [180/447], Loss: 2.5513
Epoch [41/60], Batch [190/447], Loss: 2.5002
Epoch [41/60], Batch [200/447], Loss: 1.5895
Epoch [41/60], Batch [210/447], Loss: 2.1108
Epoch [41/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [42/60], Batch [0/447], Loss: 2.4315
Epoch [42/60], Batch [10/447], Loss: 2.2440
Epoch [42/60], Batch [20/447], Loss: 2.2187
Epoch [42/60], Batch [30/447], Loss: 1.7516
Epoch [42/60], Batch [40/447], Loss: 2.8277
Epoch [42/60], Batch [50/447], Loss: 1.8943
Epoch [42/60], Batch [60/447], Loss: 1.2343
Epoch [42/60], Batch [70/447], Loss: 2.5155
Epoch [42/60], Batch [80/447], Loss: 2.7080
Epoch [42/60], Batch [90/447], Loss: 2.6804
Epoch [42/60], Batch [100/447], Loss: 2.0435
Epoch [42/60], Batch [110/447], Loss: 2.1979
Epoch [42/60], Batch [120/447], Loss: 2.3338
Epoch [42/60], Batch [130/447], Loss: 1.8653
Epoch [42/60], Batch [140/447], Loss: 2.0645
Epoch [42/60], Batch [150/447], Loss: 1.7802
Epoch [42/60], Batch [160/447], Loss: 2.2689
Epoch [42/60], Batch [170/447], Loss: 1.9190
Epoch [42/60], Batch [180/447], Loss: 3.0954
Epoch [42/60], Batch [190/447], Loss: 1.9779
Epoch [42/60], Batch [200/447], Loss: 2.7230
Epoch [42/60], Batch [210/447], Loss: 2.2120
Epoch [42/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [43/60], Batch [0/447], Loss: 2.4812
Epoch [43/60], Batch [10/447], Loss: 2.4654
Epoch [43/60], Batch [20/447], Loss: 2.6633
Epoch [43/60], Batch [30/447], Loss: 1.7377
Epoch [43/60], Batch [40/447], Loss: 1.9676
Epoch [43/60], Batch [50/447], Loss: 2.5734
Epoch [43/60], Batch [60/447], Loss: 3.2392
Epoch [43/60], Batch [70/447], Loss: 2.3593
Epoch [43/60], Batch [80/447], Loss: 2.2089
Epoch [43/60], Batch [90/447], Loss: 1.7105
Epoch [43/60], Batch [100/447], Loss: 2.5805
Epoch [43/60], Batch [110/447], Loss: 2.3783
Epoch [43/60], Batch [120/447], Loss: 1.4862
Epoch [43/60], Batch [130/447], Loss: 1.9906
Epoch [43/60], Batch [140/447], Loss: 2.0869
Epoch [43/60], Batch [150/447], Loss: 1.7630
Epoch [43/60], Batch [160/447], Loss: 2.6202
Epoch [43/60], Batch [170/447], Loss: 2.8572
Epoch [43/60], Batch [180/447], Loss: 1.9047
Epoch [43/60], Batch [190/447], Loss: 2.5171
Epoch [43/60], Batch [200/447], Loss: 2.2231
Epoch [43/60], Batch [210/447], Loss: 2.3086
Epoch [43/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [44/60], Batch [0/447], Loss: 1.7979
Epoch [44/60], Batch [10/447], Loss: 2.7875
Epoch [44/60], Batch [20/447], Loss: 2.1379
Epoch [44/60], Batch [30/447], Loss: 1.8224
Epoch [44/60], Batch [40/447], Loss: 2.7536
Epoch [44/60], Batch [50/447], Loss: 2.3651
Epoch [44/60], Batch [60/447], Loss: 1.4158
Epoch [44/60], Batch [70/447], Loss: 2.0023
Epoch [44/60], Batch [80/447], Loss: 2.3243
Epoch [44/60], Batch [90/447], Loss: 1.3446
Epoch [44/60], Batch [100/447], Loss: 1.6061
Epoch [44/60], Batch [110/447], Loss: 1.8178
Epoch [44/60], Batch [120/447], Loss: 2.6121
Epoch [44/60], Batch [130/447], Loss: 2.0654
Epoch [44/60], Batch [140/447], Loss: 2.1938
Epoch [44/60], Batch [150/447], Loss: 2.2836
Epoch [44/60], Batch [160/447], Loss: 2.1615
Epoch [44/60], Batch [170/447], Loss: 2.3399
Epoch [44/60], Batch [180/447], Loss: 1.7030
Epoch [44/60], Batch [190/447], Loss: 1.8499
Epoch [44/60], Batch [200/447], Loss: 2.1022
Epoch [44/60], Batch [210/447], Loss: 2.8850
Epoch [44/60], Batch 

[I 2024-12-13 11:02:01,599] Trial 4 pruned. 


Epoch [44/60], Validation Accuracy: 0.7268, Validation Loss: 1.0159
No improvement in validation accuracy for 5 epoch(s).
Early stopping at epoch 44.
Trial early stopped due to lack of improvement.
Starting a new trial...
Trial 5: alpha = 1.6445845403801216
Building the model...


2024-12-13 11:02:01,957 - mmaction - INFO - load model from: https://download.openmmlab.com/mmaction/recognition/csn/ircsn_from_scratch_r50_ig65m_20210617-ce545a37.pth
2024-12-13 11:02:01,958 - mmaction - INFO - load checkpoint from http path: https://download.openmmlab.com/mmaction/recognition/csn/ircsn_from_scratch_r50_ig65m_20210617-ce545a37.pth


Model built successfully!
Starting training...


  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [1/60], Batch [0/447], Loss: 3.9183
Epoch [1/60], Batch [10/447], Loss: 3.9542
Epoch [1/60], Batch [20/447], Loss: 3.9468
Epoch [1/60], Batch [30/447], Loss: 4.0604
Epoch [1/60], Batch [40/447], Loss: 4.0436
Epoch [1/60], Batch [50/447], Loss: 3.9820
Epoch [1/60], Batch [60/447], Loss: 3.8748
Epoch [1/60], Batch [70/447], Loss: 3.9436
Epoch [1/60], Batch [80/447], Loss: 3.9173
Epoch [1/60], Batch [90/447], Loss: 3.9773
Epoch [1/60], Batch [100/447], Loss: 3.9250
Epoch [1/60], Batch [110/447], Loss: 3.9818
Epoch [1/60], Batch [120/447], Loss: 3.9022
Epoch [1/60], Batch [130/447], Loss: 3.9789
Epoch [1/60], Batch [140/447], Loss: 3.9557
Epoch [1/60], Batch [150/447], Loss: 3.9551
Epoch [1/60], Batch [160/447], Loss: 3.9995
Epoch [1/60], Batch [170/447], Loss: 3.9498
Epoch [1/60], Batch [180/447], Loss: 3.9976
Epoch [1/60], Batch [190/447], Loss: 4.0354
Epoch [1/60], Batch [200/447], Loss: 3.9130
Epoch [1/60], Batch [210/447], Loss: 3.9262
Epoch [1/60], Batch [220/447], Loss: 3.9785

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [2/60], Batch [0/447], Loss: 3.9344
Epoch [2/60], Batch [10/447], Loss: 3.9653
Epoch [2/60], Batch [20/447], Loss: 3.7832
Epoch [2/60], Batch [30/447], Loss: 3.7728
Epoch [2/60], Batch [40/447], Loss: 3.8299
Epoch [2/60], Batch [50/447], Loss: 3.8499
Epoch [2/60], Batch [60/447], Loss: 3.9039
Epoch [2/60], Batch [70/447], Loss: 3.8015
Epoch [2/60], Batch [80/447], Loss: 3.8767
Epoch [2/60], Batch [90/447], Loss: 3.6738
Epoch [2/60], Batch [100/447], Loss: 3.8663
Epoch [2/60], Batch [110/447], Loss: 3.8918
Epoch [2/60], Batch [120/447], Loss: 3.8917
Epoch [2/60], Batch [130/447], Loss: 3.6758
Epoch [2/60], Batch [140/447], Loss: 3.8725
Epoch [2/60], Batch [150/447], Loss: 3.8726
Epoch [2/60], Batch [160/447], Loss: 3.8209
Epoch [2/60], Batch [170/447], Loss: 3.9411
Epoch [2/60], Batch [180/447], Loss: 3.6635
Epoch [2/60], Batch [190/447], Loss: 3.7509
Epoch [2/60], Batch [200/447], Loss: 3.8992
Epoch [2/60], Batch [210/447], Loss: 3.8042
Epoch [2/60], Batch [220/447], Loss: 3.9031

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [3/60], Batch [0/447], Loss: 3.8468
Epoch [3/60], Batch [10/447], Loss: 3.5606
Epoch [3/60], Batch [20/447], Loss: 3.8141
Epoch [3/60], Batch [30/447], Loss: 3.8613
Epoch [3/60], Batch [40/447], Loss: 3.7780
Epoch [3/60], Batch [50/447], Loss: 3.9328
Epoch [3/60], Batch [60/447], Loss: 3.8383
Epoch [3/60], Batch [70/447], Loss: 3.6514
Epoch [3/60], Batch [80/447], Loss: 3.8434
Epoch [3/60], Batch [90/447], Loss: 3.7256
Epoch [3/60], Batch [100/447], Loss: 3.6503
Epoch [3/60], Batch [110/447], Loss: 3.6257
Epoch [3/60], Batch [120/447], Loss: 3.7646
Epoch [3/60], Batch [130/447], Loss: 3.6622
Epoch [3/60], Batch [140/447], Loss: 3.8737
Epoch [3/60], Batch [150/447], Loss: 3.8071
Epoch [3/60], Batch [160/447], Loss: 3.4582
Epoch [3/60], Batch [170/447], Loss: 3.3784
Epoch [3/60], Batch [180/447], Loss: 3.8314
Epoch [3/60], Batch [190/447], Loss: 3.6444
Epoch [3/60], Batch [200/447], Loss: 3.6522
Epoch [3/60], Batch [210/447], Loss: 3.6431
Epoch [3/60], Batch [220/447], Loss: 3.7483

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [4/60], Batch [0/447], Loss: 3.7484
Epoch [4/60], Batch [10/447], Loss: 3.9022
Epoch [4/60], Batch [20/447], Loss: 3.3725
Epoch [4/60], Batch [30/447], Loss: 3.6258
Epoch [4/60], Batch [40/447], Loss: 3.4774
Epoch [4/60], Batch [50/447], Loss: 3.4938
Epoch [4/60], Batch [60/447], Loss: 3.4724
Epoch [4/60], Batch [70/447], Loss: 3.8253
Epoch [4/60], Batch [80/447], Loss: 3.6700
Epoch [4/60], Batch [90/447], Loss: 3.5787
Epoch [4/60], Batch [100/447], Loss: 3.7735
Epoch [4/60], Batch [110/447], Loss: 3.7727
Epoch [4/60], Batch [120/447], Loss: 3.8094
Epoch [4/60], Batch [130/447], Loss: 3.7286
Epoch [4/60], Batch [140/447], Loss: 3.2479
Epoch [4/60], Batch [150/447], Loss: 3.6575
Epoch [4/60], Batch [160/447], Loss: 3.3459
Epoch [4/60], Batch [170/447], Loss: 3.7375
Epoch [4/60], Batch [180/447], Loss: 3.6841
Epoch [4/60], Batch [190/447], Loss: 3.7430
Epoch [4/60], Batch [200/447], Loss: 3.7604
Epoch [4/60], Batch [210/447], Loss: 3.5098
Epoch [4/60], Batch [220/447], Loss: 3.7746

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [5/60], Batch [0/447], Loss: 3.4029
Epoch [5/60], Batch [10/447], Loss: 3.7752
Epoch [5/60], Batch [20/447], Loss: 3.6198
Epoch [5/60], Batch [30/447], Loss: 3.6983
Epoch [5/60], Batch [40/447], Loss: 3.3963
Epoch [5/60], Batch [50/447], Loss: 3.5622
Epoch [5/60], Batch [60/447], Loss: 3.8434
Epoch [5/60], Batch [70/447], Loss: 3.3440
Epoch [5/60], Batch [80/447], Loss: 3.6051
Epoch [5/60], Batch [90/447], Loss: 3.8300
Epoch [5/60], Batch [100/447], Loss: 3.7606
Epoch [5/60], Batch [110/447], Loss: 3.6121
Epoch [5/60], Batch [120/447], Loss: 3.5929
Epoch [5/60], Batch [130/447], Loss: 3.6129
Epoch [5/60], Batch [140/447], Loss: 3.8729
Epoch [5/60], Batch [150/447], Loss: 3.8846
Epoch [5/60], Batch [160/447], Loss: 3.5016
Epoch [5/60], Batch [170/447], Loss: 3.7035
Epoch [5/60], Batch [180/447], Loss: 3.4432
Epoch [5/60], Batch [190/447], Loss: 3.5400
Epoch [5/60], Batch [200/447], Loss: 3.2404
Epoch [5/60], Batch [210/447], Loss: 3.9235
Epoch [5/60], Batch [220/447], Loss: 3.5889

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [6/60], Batch [0/447], Loss: 3.7455
Epoch [6/60], Batch [10/447], Loss: 3.1331
Epoch [6/60], Batch [20/447], Loss: 3.5889
Epoch [6/60], Batch [30/447], Loss: 3.7200
Epoch [6/60], Batch [40/447], Loss: 3.6189
Epoch [6/60], Batch [50/447], Loss: 3.3182
Epoch [6/60], Batch [60/447], Loss: 3.5808
Epoch [6/60], Batch [70/447], Loss: 3.2771
Epoch [6/60], Batch [80/447], Loss: 3.5924
Epoch [6/60], Batch [90/447], Loss: 3.5848
Epoch [6/60], Batch [100/447], Loss: 3.1772
Epoch [6/60], Batch [110/447], Loss: 3.2275
Epoch [6/60], Batch [120/447], Loss: 3.2795
Epoch [6/60], Batch [130/447], Loss: 3.1798
Epoch [6/60], Batch [140/447], Loss: 3.5712
Epoch [6/60], Batch [150/447], Loss: 3.6240
Epoch [6/60], Batch [160/447], Loss: 3.2446
Epoch [6/60], Batch [170/447], Loss: 3.3101
Epoch [6/60], Batch [180/447], Loss: 3.5103
Epoch [6/60], Batch [190/447], Loss: 3.2884
Epoch [6/60], Batch [200/447], Loss: 3.6677
Epoch [6/60], Batch [210/447], Loss: 3.7497
Epoch [6/60], Batch [220/447], Loss: 3.5766

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [7/60], Batch [0/447], Loss: 3.3806
Epoch [7/60], Batch [10/447], Loss: 3.3831
Epoch [7/60], Batch [20/447], Loss: 2.8301
Epoch [7/60], Batch [30/447], Loss: 2.8540
Epoch [7/60], Batch [40/447], Loss: 3.3876
Epoch [7/60], Batch [50/447], Loss: 3.5536
Epoch [7/60], Batch [60/447], Loss: 3.2943
Epoch [7/60], Batch [70/447], Loss: 3.3938
Epoch [7/60], Batch [80/447], Loss: 3.4819
Epoch [7/60], Batch [90/447], Loss: 2.8618
Epoch [7/60], Batch [100/447], Loss: 3.3094
Epoch [7/60], Batch [110/447], Loss: 3.3080
Epoch [7/60], Batch [120/447], Loss: 3.1669
Epoch [7/60], Batch [130/447], Loss: 3.6425
Epoch [7/60], Batch [140/447], Loss: 3.3275
Epoch [7/60], Batch [150/447], Loss: 3.5117
Epoch [7/60], Batch [160/447], Loss: 3.3776
Epoch [7/60], Batch [170/447], Loss: 3.1980
Epoch [7/60], Batch [180/447], Loss: 3.3257
Epoch [7/60], Batch [190/447], Loss: 3.5933
Epoch [7/60], Batch [200/447], Loss: 3.4815
Epoch [7/60], Batch [210/447], Loss: 3.3846
Epoch [7/60], Batch [220/447], Loss: 3.4098

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [8/60], Batch [0/447], Loss: 3.2258
Epoch [8/60], Batch [10/447], Loss: 3.1432
Epoch [8/60], Batch [20/447], Loss: 3.5079
Epoch [8/60], Batch [30/447], Loss: 3.1325
Epoch [8/60], Batch [40/447], Loss: 3.3098
Epoch [8/60], Batch [50/447], Loss: 3.2978
Epoch [8/60], Batch [60/447], Loss: 3.1107
Epoch [8/60], Batch [70/447], Loss: 3.8305
Epoch [8/60], Batch [80/447], Loss: 3.5515
Epoch [8/60], Batch [90/447], Loss: 3.0159
Epoch [8/60], Batch [100/447], Loss: 3.2386
Epoch [8/60], Batch [110/447], Loss: 3.2996
Epoch [8/60], Batch [120/447], Loss: 3.0516
Epoch [8/60], Batch [130/447], Loss: 3.1331
Epoch [8/60], Batch [140/447], Loss: 3.5286
Epoch [8/60], Batch [150/447], Loss: 3.2186
Epoch [8/60], Batch [160/447], Loss: 3.0115
Epoch [8/60], Batch [170/447], Loss: 3.4264
Epoch [8/60], Batch [180/447], Loss: 3.2413
Epoch [8/60], Batch [190/447], Loss: 3.5539
Epoch [8/60], Batch [200/447], Loss: 3.4837
Epoch [8/60], Batch [210/447], Loss: 3.4050
Epoch [8/60], Batch [220/447], Loss: 3.4635

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [9/60], Batch [0/447], Loss: 3.5410
Epoch [9/60], Batch [10/447], Loss: 3.5301
Epoch [9/60], Batch [20/447], Loss: 3.0186
Epoch [9/60], Batch [30/447], Loss: 3.3183
Epoch [9/60], Batch [40/447], Loss: 3.4381
Epoch [9/60], Batch [50/447], Loss: 3.3396
Epoch [9/60], Batch [60/447], Loss: 3.2285
Epoch [9/60], Batch [70/447], Loss: 3.4655
Epoch [9/60], Batch [80/447], Loss: 3.2544
Epoch [9/60], Batch [90/447], Loss: 2.9459
Epoch [9/60], Batch [100/447], Loss: 3.3760
Epoch [9/60], Batch [110/447], Loss: 3.1588
Epoch [9/60], Batch [120/447], Loss: 3.4202
Epoch [9/60], Batch [130/447], Loss: 3.2510
Epoch [9/60], Batch [140/447], Loss: 3.2487
Epoch [9/60], Batch [150/447], Loss: 3.4835
Epoch [9/60], Batch [160/447], Loss: 3.4392
Epoch [9/60], Batch [170/447], Loss: 2.8461
Epoch [9/60], Batch [180/447], Loss: 3.3827
Epoch [9/60], Batch [190/447], Loss: 3.3031
Epoch [9/60], Batch [200/447], Loss: 3.4061
Epoch [9/60], Batch [210/447], Loss: 3.7340
Epoch [9/60], Batch [220/447], Loss: 3.3097

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [10/60], Batch [0/447], Loss: 3.1134
Epoch [10/60], Batch [10/447], Loss: 3.0768
Epoch [10/60], Batch [20/447], Loss: 3.3910
Epoch [10/60], Batch [30/447], Loss: 3.5566
Epoch [10/60], Batch [40/447], Loss: 3.2543
Epoch [10/60], Batch [50/447], Loss: 3.1281
Epoch [10/60], Batch [60/447], Loss: 3.2518
Epoch [10/60], Batch [70/447], Loss: 3.2922
Epoch [10/60], Batch [80/447], Loss: 3.0388
Epoch [10/60], Batch [90/447], Loss: 3.2064
Epoch [10/60], Batch [100/447], Loss: 3.2862
Epoch [10/60], Batch [110/447], Loss: 2.9819
Epoch [10/60], Batch [120/447], Loss: 3.0033
Epoch [10/60], Batch [130/447], Loss: 3.4860
Epoch [10/60], Batch [140/447], Loss: 3.1409
Epoch [10/60], Batch [150/447], Loss: 3.1991
Epoch [10/60], Batch [160/447], Loss: 2.7773
Epoch [10/60], Batch [170/447], Loss: 3.3375
Epoch [10/60], Batch [180/447], Loss: 3.3773
Epoch [10/60], Batch [190/447], Loss: 3.4686
Epoch [10/60], Batch [200/447], Loss: 3.1852
Epoch [10/60], Batch [210/447], Loss: 2.5894
Epoch [10/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [11/60], Batch [0/447], Loss: 3.4459
Epoch [11/60], Batch [10/447], Loss: 3.1208
Epoch [11/60], Batch [20/447], Loss: 2.6172
Epoch [11/60], Batch [30/447], Loss: 3.1411
Epoch [11/60], Batch [40/447], Loss: 3.6615
Epoch [11/60], Batch [50/447], Loss: 3.2371
Epoch [11/60], Batch [60/447], Loss: 2.7966
Epoch [11/60], Batch [70/447], Loss: 3.1296
Epoch [11/60], Batch [80/447], Loss: 2.9910
Epoch [11/60], Batch [90/447], Loss: 2.9155
Epoch [11/60], Batch [100/447], Loss: 2.9507
Epoch [11/60], Batch [110/447], Loss: 3.3080
Epoch [11/60], Batch [120/447], Loss: 3.2705
Epoch [11/60], Batch [130/447], Loss: 3.1611
Epoch [11/60], Batch [140/447], Loss: 3.5346
Epoch [11/60], Batch [150/447], Loss: 3.1394
Epoch [11/60], Batch [160/447], Loss: 2.7823
Epoch [11/60], Batch [170/447], Loss: 3.1328
Epoch [11/60], Batch [180/447], Loss: 3.0669
Epoch [11/60], Batch [190/447], Loss: 3.5123
Epoch [11/60], Batch [200/447], Loss: 3.2977
Epoch [11/60], Batch [210/447], Loss: 3.1223
Epoch [11/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [12/60], Batch [0/447], Loss: 2.6990
Epoch [12/60], Batch [10/447], Loss: 3.2672
Epoch [12/60], Batch [20/447], Loss: 2.9177
Epoch [12/60], Batch [30/447], Loss: 2.6919
Epoch [12/60], Batch [40/447], Loss: 3.4181
Epoch [12/60], Batch [50/447], Loss: 3.1640
Epoch [12/60], Batch [60/447], Loss: 3.3781
Epoch [12/60], Batch [70/447], Loss: 3.0639
Epoch [12/60], Batch [80/447], Loss: 3.5366
Epoch [12/60], Batch [90/447], Loss: 3.2266
Epoch [12/60], Batch [100/447], Loss: 3.2295
Epoch [12/60], Batch [110/447], Loss: 3.1752
Epoch [12/60], Batch [120/447], Loss: 3.1420
Epoch [12/60], Batch [130/447], Loss: 2.9480
Epoch [12/60], Batch [140/447], Loss: 3.2274
Epoch [12/60], Batch [150/447], Loss: 3.3959
Epoch [12/60], Batch [160/447], Loss: 2.8457
Epoch [12/60], Batch [170/447], Loss: 3.4040
Epoch [12/60], Batch [180/447], Loss: 3.1019
Epoch [12/60], Batch [190/447], Loss: 2.9216
Epoch [12/60], Batch [200/447], Loss: 3.0163
Epoch [12/60], Batch [210/447], Loss: 2.8015
Epoch [12/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [13/60], Batch [0/447], Loss: 3.0607
Epoch [13/60], Batch [10/447], Loss: 2.5801
Epoch [13/60], Batch [20/447], Loss: 2.9364
Epoch [13/60], Batch [30/447], Loss: 2.4259
Epoch [13/60], Batch [40/447], Loss: 3.1744
Epoch [13/60], Batch [50/447], Loss: 3.2520
Epoch [13/60], Batch [60/447], Loss: 3.1959
Epoch [13/60], Batch [70/447], Loss: 3.1568
Epoch [13/60], Batch [80/447], Loss: 2.6984
Epoch [13/60], Batch [90/447], Loss: 2.9744
Epoch [13/60], Batch [100/447], Loss: 2.9763
Epoch [13/60], Batch [110/447], Loss: 3.7240
Epoch [13/60], Batch [120/447], Loss: 3.0406
Epoch [13/60], Batch [130/447], Loss: 2.9108
Epoch [13/60], Batch [140/447], Loss: 3.2139
Epoch [13/60], Batch [150/447], Loss: 3.5223
Epoch [13/60], Batch [160/447], Loss: 3.0448
Epoch [13/60], Batch [170/447], Loss: 2.5046
Epoch [13/60], Batch [180/447], Loss: 3.0675
Epoch [13/60], Batch [190/447], Loss: 2.2864
Epoch [13/60], Batch [200/447], Loss: 3.0453
Epoch [13/60], Batch [210/447], Loss: 2.8308
Epoch [13/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [14/60], Batch [0/447], Loss: 3.2229
Epoch [14/60], Batch [10/447], Loss: 2.7428
Epoch [14/60], Batch [20/447], Loss: 2.8526
Epoch [14/60], Batch [30/447], Loss: 2.8512
Epoch [14/60], Batch [40/447], Loss: 3.0695
Epoch [14/60], Batch [50/447], Loss: 3.1191
Epoch [14/60], Batch [60/447], Loss: 2.9911
Epoch [14/60], Batch [70/447], Loss: 3.1475
Epoch [14/60], Batch [80/447], Loss: 2.8563
Epoch [14/60], Batch [90/447], Loss: 3.2579
Epoch [14/60], Batch [100/447], Loss: 3.0243
Epoch [14/60], Batch [110/447], Loss: 3.1877
Epoch [14/60], Batch [120/447], Loss: 3.1615
Epoch [14/60], Batch [130/447], Loss: 3.0463
Epoch [14/60], Batch [140/447], Loss: 2.6752
Epoch [14/60], Batch [150/447], Loss: 2.9841
Epoch [14/60], Batch [160/447], Loss: 2.5985
Epoch [14/60], Batch [170/447], Loss: 2.6670
Epoch [14/60], Batch [180/447], Loss: 3.3584
Epoch [14/60], Batch [190/447], Loss: 2.8949
Epoch [14/60], Batch [200/447], Loss: 2.8637
Epoch [14/60], Batch [210/447], Loss: 3.2376
Epoch [14/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [15/60], Batch [0/447], Loss: 2.8383
Epoch [15/60], Batch [10/447], Loss: 3.1497
Epoch [15/60], Batch [20/447], Loss: 3.1869
Epoch [15/60], Batch [30/447], Loss: 2.8542
Epoch [15/60], Batch [40/447], Loss: 2.8484
Epoch [15/60], Batch [50/447], Loss: 2.5994
Epoch [15/60], Batch [60/447], Loss: 3.0135
Epoch [15/60], Batch [70/447], Loss: 2.3491
Epoch [15/60], Batch [80/447], Loss: 2.9859
Epoch [15/60], Batch [90/447], Loss: 3.1994
Epoch [15/60], Batch [100/447], Loss: 2.4934
Epoch [15/60], Batch [110/447], Loss: 2.1935
Epoch [15/60], Batch [120/447], Loss: 3.3673
Epoch [15/60], Batch [130/447], Loss: 2.6067
Epoch [15/60], Batch [140/447], Loss: 3.1195
Epoch [15/60], Batch [150/447], Loss: 3.0538
Epoch [15/60], Batch [160/447], Loss: 3.4345
Epoch [15/60], Batch [170/447], Loss: 2.9101
Epoch [15/60], Batch [180/447], Loss: 2.9781
Epoch [15/60], Batch [190/447], Loss: 2.6980
Epoch [15/60], Batch [200/447], Loss: 3.1166
Epoch [15/60], Batch [210/447], Loss: 3.1202
Epoch [15/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [16/60], Batch [0/447], Loss: 2.6263
Epoch [16/60], Batch [10/447], Loss: 3.0259
Epoch [16/60], Batch [20/447], Loss: 2.8509
Epoch [16/60], Batch [30/447], Loss: 2.5681
Epoch [16/60], Batch [40/447], Loss: 2.7786
Epoch [16/60], Batch [50/447], Loss: 2.6493
Epoch [16/60], Batch [60/447], Loss: 2.9675
Epoch [16/60], Batch [70/447], Loss: 2.1431
Epoch [16/60], Batch [80/447], Loss: 3.0868
Epoch [16/60], Batch [90/447], Loss: 2.4103
Epoch [16/60], Batch [100/447], Loss: 3.2608
Epoch [16/60], Batch [110/447], Loss: 3.0571
Epoch [16/60], Batch [120/447], Loss: 2.9730
Epoch [16/60], Batch [130/447], Loss: 2.9336
Epoch [16/60], Batch [140/447], Loss: 3.0948
Epoch [16/60], Batch [150/447], Loss: 2.7174
Epoch [16/60], Batch [160/447], Loss: 3.0011
Epoch [16/60], Batch [170/447], Loss: 3.1772
Epoch [16/60], Batch [180/447], Loss: 3.2430
Epoch [16/60], Batch [190/447], Loss: 3.1904
Epoch [16/60], Batch [200/447], Loss: 3.5567
Epoch [16/60], Batch [210/447], Loss: 3.4023
Epoch [16/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [17/60], Batch [0/447], Loss: 3.0302
Epoch [17/60], Batch [10/447], Loss: 2.8147
Epoch [17/60], Batch [20/447], Loss: 2.5311
Epoch [17/60], Batch [30/447], Loss: 2.9116
Epoch [17/60], Batch [40/447], Loss: 3.0224
Epoch [17/60], Batch [50/447], Loss: 2.7001
Epoch [17/60], Batch [60/447], Loss: 2.7133
Epoch [17/60], Batch [70/447], Loss: 2.9976
Epoch [17/60], Batch [80/447], Loss: 2.3554
Epoch [17/60], Batch [90/447], Loss: 2.8729
Epoch [17/60], Batch [100/447], Loss: 2.2550
Epoch [17/60], Batch [110/447], Loss: 2.7723
Epoch [17/60], Batch [120/447], Loss: 2.5122
Epoch [17/60], Batch [130/447], Loss: 3.2345
Epoch [17/60], Batch [140/447], Loss: 2.8377
Epoch [17/60], Batch [150/447], Loss: 3.1886
Epoch [17/60], Batch [160/447], Loss: 3.0991
Epoch [17/60], Batch [170/447], Loss: 2.5426
Epoch [17/60], Batch [180/447], Loss: 3.5676
Epoch [17/60], Batch [190/447], Loss: 2.9369
Epoch [17/60], Batch [200/447], Loss: 3.3197
Epoch [17/60], Batch [210/447], Loss: 2.9302
Epoch [17/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [18/60], Batch [0/447], Loss: 2.8446
Epoch [18/60], Batch [10/447], Loss: 2.8192
Epoch [18/60], Batch [20/447], Loss: 2.9105
Epoch [18/60], Batch [30/447], Loss: 2.8684
Epoch [18/60], Batch [40/447], Loss: 2.7755
Epoch [18/60], Batch [50/447], Loss: 3.1716
Epoch [18/60], Batch [60/447], Loss: 2.5417
Epoch [18/60], Batch [70/447], Loss: 3.0163
Epoch [18/60], Batch [80/447], Loss: 3.4021
Epoch [18/60], Batch [90/447], Loss: 3.1517
Epoch [18/60], Batch [100/447], Loss: 2.9798
Epoch [18/60], Batch [110/447], Loss: 2.8217
Epoch [18/60], Batch [120/447], Loss: 2.7160
Epoch [18/60], Batch [130/447], Loss: 3.0291
Epoch [18/60], Batch [140/447], Loss: 2.8264
Epoch [18/60], Batch [150/447], Loss: 2.4604
Epoch [18/60], Batch [160/447], Loss: 2.3846
Epoch [18/60], Batch [170/447], Loss: 2.3081
Epoch [18/60], Batch [180/447], Loss: 2.6827
Epoch [18/60], Batch [190/447], Loss: 3.0091
Epoch [18/60], Batch [200/447], Loss: 2.9630
Epoch [18/60], Batch [210/447], Loss: 2.9047
Epoch [18/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [19/60], Batch [0/447], Loss: 2.9887
Epoch [19/60], Batch [10/447], Loss: 2.4087
Epoch [19/60], Batch [20/447], Loss: 2.9479
Epoch [19/60], Batch [30/447], Loss: 2.9977
Epoch [19/60], Batch [40/447], Loss: 2.5820
Epoch [19/60], Batch [50/447], Loss: 2.2507
Epoch [19/60], Batch [60/447], Loss: 3.0332
Epoch [19/60], Batch [70/447], Loss: 2.7633
Epoch [19/60], Batch [80/447], Loss: 2.8935
Epoch [19/60], Batch [90/447], Loss: 2.9451
Epoch [19/60], Batch [100/447], Loss: 2.5625
Epoch [19/60], Batch [110/447], Loss: 3.2626
Epoch [19/60], Batch [120/447], Loss: 2.7295
Epoch [19/60], Batch [130/447], Loss: 2.9083
Epoch [19/60], Batch [140/447], Loss: 1.9814
Epoch [19/60], Batch [150/447], Loss: 2.6793
Epoch [19/60], Batch [160/447], Loss: 3.2010
Epoch [19/60], Batch [170/447], Loss: 2.6134
Epoch [19/60], Batch [180/447], Loss: 2.7463
Epoch [19/60], Batch [190/447], Loss: 2.7987
Epoch [19/60], Batch [200/447], Loss: 2.6703
Epoch [19/60], Batch [210/447], Loss: 2.5416
Epoch [19/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [20/60], Batch [0/447], Loss: 2.8775
Epoch [20/60], Batch [10/447], Loss: 2.4330
Epoch [20/60], Batch [20/447], Loss: 3.2112
Epoch [20/60], Batch [30/447], Loss: 3.1840
Epoch [20/60], Batch [40/447], Loss: 2.8369
Epoch [20/60], Batch [50/447], Loss: 3.1041
Epoch [20/60], Batch [60/447], Loss: 2.6031
Epoch [20/60], Batch [70/447], Loss: 2.8329
Epoch [20/60], Batch [80/447], Loss: 3.4137
Epoch [20/60], Batch [90/447], Loss: 2.8164
Epoch [20/60], Batch [100/447], Loss: 2.7293
Epoch [20/60], Batch [110/447], Loss: 3.3662
Epoch [20/60], Batch [120/447], Loss: 2.4312
Epoch [20/60], Batch [130/447], Loss: 3.2411
Epoch [20/60], Batch [140/447], Loss: 2.5894
Epoch [20/60], Batch [150/447], Loss: 2.7700
Epoch [20/60], Batch [160/447], Loss: 2.9290
Epoch [20/60], Batch [170/447], Loss: 2.3788
Epoch [20/60], Batch [180/447], Loss: 2.6847
Epoch [20/60], Batch [190/447], Loss: 3.1212
Epoch [20/60], Batch [200/447], Loss: 2.6002
Epoch [20/60], Batch [210/447], Loss: 3.1159
Epoch [20/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [21/60], Batch [0/447], Loss: 3.2040
Epoch [21/60], Batch [10/447], Loss: 3.0316
Epoch [21/60], Batch [20/447], Loss: 2.4452
Epoch [21/60], Batch [30/447], Loss: 3.1126
Epoch [21/60], Batch [40/447], Loss: 2.5563
Epoch [21/60], Batch [50/447], Loss: 2.4944
Epoch [21/60], Batch [60/447], Loss: 2.6655
Epoch [21/60], Batch [70/447], Loss: 2.5695
Epoch [21/60], Batch [80/447], Loss: 3.0924
Epoch [21/60], Batch [90/447], Loss: 2.2293
Epoch [21/60], Batch [100/447], Loss: 2.1371
Epoch [21/60], Batch [110/447], Loss: 2.8231
Epoch [21/60], Batch [120/447], Loss: 3.0719
Epoch [21/60], Batch [130/447], Loss: 2.9233
Epoch [21/60], Batch [140/447], Loss: 2.3783
Epoch [21/60], Batch [150/447], Loss: 2.7261
Epoch [21/60], Batch [160/447], Loss: 2.4467
Epoch [21/60], Batch [170/447], Loss: 2.7917
Epoch [21/60], Batch [180/447], Loss: 2.4427
Epoch [21/60], Batch [190/447], Loss: 2.9123
Epoch [21/60], Batch [200/447], Loss: 2.6406
Epoch [21/60], Batch [210/447], Loss: 2.8897
Epoch [21/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [22/60], Batch [0/447], Loss: 2.8291
Epoch [22/60], Batch [10/447], Loss: 2.2670
Epoch [22/60], Batch [20/447], Loss: 2.6929
Epoch [22/60], Batch [30/447], Loss: 2.8097
Epoch [22/60], Batch [40/447], Loss: 2.9537
Epoch [22/60], Batch [50/447], Loss: 2.5869
Epoch [22/60], Batch [60/447], Loss: 2.9183
Epoch [22/60], Batch [70/447], Loss: 2.8360
Epoch [22/60], Batch [80/447], Loss: 2.4732
Epoch [22/60], Batch [90/447], Loss: 2.6813
Epoch [22/60], Batch [100/447], Loss: 2.7821
Epoch [22/60], Batch [110/447], Loss: 2.5870
Epoch [22/60], Batch [120/447], Loss: 2.3763
Epoch [22/60], Batch [130/447], Loss: 2.3799
Epoch [22/60], Batch [140/447], Loss: 2.6535
Epoch [22/60], Batch [150/447], Loss: 3.1431
Epoch [22/60], Batch [160/447], Loss: 2.9165
Epoch [22/60], Batch [170/447], Loss: 2.9935
Epoch [22/60], Batch [180/447], Loss: 2.5317
Epoch [22/60], Batch [190/447], Loss: 2.3478
Epoch [22/60], Batch [200/447], Loss: 3.2393
Epoch [22/60], Batch [210/447], Loss: 2.9310
Epoch [22/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [23/60], Batch [0/447], Loss: 2.4157
Epoch [23/60], Batch [10/447], Loss: 3.5517
Epoch [23/60], Batch [20/447], Loss: 3.3647
Epoch [23/60], Batch [30/447], Loss: 2.3567
Epoch [23/60], Batch [40/447], Loss: 2.5409
Epoch [23/60], Batch [50/447], Loss: 2.4018
Epoch [23/60], Batch [60/447], Loss: 2.7362
Epoch [23/60], Batch [70/447], Loss: 2.9571
Epoch [23/60], Batch [80/447], Loss: 2.9643
Epoch [23/60], Batch [90/447], Loss: 2.8245
Epoch [23/60], Batch [100/447], Loss: 2.9002
Epoch [23/60], Batch [110/447], Loss: 2.0038
Epoch [23/60], Batch [120/447], Loss: 3.1928
Epoch [23/60], Batch [130/447], Loss: 2.3286
Epoch [23/60], Batch [140/447], Loss: 3.0966
Epoch [23/60], Batch [150/447], Loss: 2.4868
Epoch [23/60], Batch [160/447], Loss: 3.1704
Epoch [23/60], Batch [170/447], Loss: 3.0591
Epoch [23/60], Batch [180/447], Loss: 3.3999
Epoch [23/60], Batch [190/447], Loss: 2.6230
Epoch [23/60], Batch [200/447], Loss: 2.4279
Epoch [23/60], Batch [210/447], Loss: 2.5463
Epoch [23/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [24/60], Batch [0/447], Loss: 2.7073
Epoch [24/60], Batch [10/447], Loss: 3.2110
Epoch [24/60], Batch [20/447], Loss: 2.6294
Epoch [24/60], Batch [30/447], Loss: 2.8829
Epoch [24/60], Batch [40/447], Loss: 2.1775
Epoch [24/60], Batch [50/447], Loss: 2.7192
Epoch [24/60], Batch [60/447], Loss: 2.5053
Epoch [24/60], Batch [70/447], Loss: 2.9894
Epoch [24/60], Batch [80/447], Loss: 2.2084
Epoch [24/60], Batch [90/447], Loss: 2.4285
Epoch [24/60], Batch [100/447], Loss: 2.9934
Epoch [24/60], Batch [110/447], Loss: 2.7682
Epoch [24/60], Batch [120/447], Loss: 2.4733
Epoch [24/60], Batch [130/447], Loss: 3.3133
Epoch [24/60], Batch [140/447], Loss: 2.4996
Epoch [24/60], Batch [150/447], Loss: 2.2227
Epoch [24/60], Batch [160/447], Loss: 2.3921
Epoch [24/60], Batch [170/447], Loss: 3.0321
Epoch [24/60], Batch [180/447], Loss: 2.6083
Epoch [24/60], Batch [190/447], Loss: 2.9102
Epoch [24/60], Batch [200/447], Loss: 2.9131
Epoch [24/60], Batch [210/447], Loss: 2.6840
Epoch [24/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [25/60], Batch [0/447], Loss: 2.9684
Epoch [25/60], Batch [10/447], Loss: 2.1453
Epoch [25/60], Batch [20/447], Loss: 2.4762
Epoch [25/60], Batch [30/447], Loss: 2.6405
Epoch [25/60], Batch [40/447], Loss: 2.1750
Epoch [25/60], Batch [50/447], Loss: 2.9318
Epoch [25/60], Batch [60/447], Loss: 2.4578
Epoch [25/60], Batch [70/447], Loss: 2.7003
Epoch [25/60], Batch [80/447], Loss: 2.0773
Epoch [25/60], Batch [90/447], Loss: 2.6671
Epoch [25/60], Batch [100/447], Loss: 2.8135
Epoch [25/60], Batch [110/447], Loss: 3.0068
Epoch [25/60], Batch [120/447], Loss: 1.9337
Epoch [25/60], Batch [130/447], Loss: 2.4302
Epoch [25/60], Batch [140/447], Loss: 2.8211
Epoch [25/60], Batch [150/447], Loss: 2.4726
Epoch [25/60], Batch [160/447], Loss: 2.9960
Epoch [25/60], Batch [170/447], Loss: 2.6150
Epoch [25/60], Batch [180/447], Loss: 2.3593
Epoch [25/60], Batch [190/447], Loss: 2.2113
Epoch [25/60], Batch [200/447], Loss: 2.2739
Epoch [25/60], Batch [210/447], Loss: 1.6244
Epoch [25/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [26/60], Batch [0/447], Loss: 2.6703
Epoch [26/60], Batch [10/447], Loss: 2.5466
Epoch [26/60], Batch [20/447], Loss: 3.1172
Epoch [26/60], Batch [30/447], Loss: 2.2149
Epoch [26/60], Batch [40/447], Loss: 2.6963
Epoch [26/60], Batch [50/447], Loss: 1.7288
Epoch [26/60], Batch [60/447], Loss: 2.4276
Epoch [26/60], Batch [70/447], Loss: 2.8237
Epoch [26/60], Batch [80/447], Loss: 2.7668
Epoch [26/60], Batch [90/447], Loss: 2.5718
Epoch [26/60], Batch [100/447], Loss: 2.6557
Epoch [26/60], Batch [110/447], Loss: 2.1859
Epoch [26/60], Batch [120/447], Loss: 2.3759
Epoch [26/60], Batch [130/447], Loss: 2.6295
Epoch [26/60], Batch [140/447], Loss: 2.5947
Epoch [26/60], Batch [150/447], Loss: 2.3477
Epoch [26/60], Batch [160/447], Loss: 2.8094
Epoch [26/60], Batch [170/447], Loss: 2.3652
Epoch [26/60], Batch [180/447], Loss: 3.9486
Epoch [26/60], Batch [190/447], Loss: 2.3868
Epoch [26/60], Batch [200/447], Loss: 2.6870
Epoch [26/60], Batch [210/447], Loss: 2.3024
Epoch [26/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [27/60], Batch [0/447], Loss: 2.7287
Epoch [27/60], Batch [10/447], Loss: 2.6828
Epoch [27/60], Batch [20/447], Loss: 2.4407
Epoch [27/60], Batch [30/447], Loss: 2.4770
Epoch [27/60], Batch [40/447], Loss: 2.0264
Epoch [27/60], Batch [50/447], Loss: 3.0099
Epoch [27/60], Batch [60/447], Loss: 2.7991
Epoch [27/60], Batch [70/447], Loss: 2.3363
Epoch [27/60], Batch [80/447], Loss: 2.8247
Epoch [27/60], Batch [90/447], Loss: 2.4105
Epoch [27/60], Batch [100/447], Loss: 3.1255
Epoch [27/60], Batch [110/447], Loss: 2.8379
Epoch [27/60], Batch [120/447], Loss: 2.9444
Epoch [27/60], Batch [130/447], Loss: 2.6858
Epoch [27/60], Batch [140/447], Loss: 2.5797
Epoch [27/60], Batch [150/447], Loss: 2.1454
Epoch [27/60], Batch [160/447], Loss: 2.9385
Epoch [27/60], Batch [170/447], Loss: 2.4838
Epoch [27/60], Batch [180/447], Loss: 3.1162
Epoch [27/60], Batch [190/447], Loss: 2.1747
Epoch [27/60], Batch [200/447], Loss: 2.5444
Epoch [27/60], Batch [210/447], Loss: 2.3387
Epoch [27/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [28/60], Batch [0/447], Loss: 2.3740
Epoch [28/60], Batch [10/447], Loss: 2.8870
Epoch [28/60], Batch [20/447], Loss: 2.2809
Epoch [28/60], Batch [30/447], Loss: 2.3265
Epoch [28/60], Batch [40/447], Loss: 2.9294
Epoch [28/60], Batch [50/447], Loss: 3.0182
Epoch [28/60], Batch [60/447], Loss: 3.1477
Epoch [28/60], Batch [70/447], Loss: 2.7936
Epoch [28/60], Batch [80/447], Loss: 3.2485
Epoch [28/60], Batch [90/447], Loss: 2.8346
Epoch [28/60], Batch [100/447], Loss: 3.0873
Epoch [28/60], Batch [110/447], Loss: 1.9388
Epoch [28/60], Batch [120/447], Loss: 2.6083
Epoch [28/60], Batch [130/447], Loss: 2.1419
Epoch [28/60], Batch [140/447], Loss: 2.6069
Epoch [28/60], Batch [150/447], Loss: 1.6257
Epoch [28/60], Batch [160/447], Loss: 2.7862
Epoch [28/60], Batch [170/447], Loss: 2.4291
Epoch [28/60], Batch [180/447], Loss: 2.7039
Epoch [28/60], Batch [190/447], Loss: 3.0718
Epoch [28/60], Batch [200/447], Loss: 2.1150
Epoch [28/60], Batch [210/447], Loss: 2.6860
Epoch [28/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [29/60], Batch [0/447], Loss: 2.8599
Epoch [29/60], Batch [10/447], Loss: 2.5397
Epoch [29/60], Batch [20/447], Loss: 2.8609
Epoch [29/60], Batch [30/447], Loss: 2.6706
Epoch [29/60], Batch [40/447], Loss: 2.6564
Epoch [29/60], Batch [50/447], Loss: 2.3944
Epoch [29/60], Batch [60/447], Loss: 2.4475
Epoch [29/60], Batch [70/447], Loss: 2.2073
Epoch [29/60], Batch [80/447], Loss: 2.8128
Epoch [29/60], Batch [90/447], Loss: 2.1035
Epoch [29/60], Batch [100/447], Loss: 2.1276
Epoch [29/60], Batch [110/447], Loss: 2.3428
Epoch [29/60], Batch [120/447], Loss: 2.1415
Epoch [29/60], Batch [130/447], Loss: 2.7690
Epoch [29/60], Batch [140/447], Loss: 1.8115
Epoch [29/60], Batch [150/447], Loss: 2.8808
Epoch [29/60], Batch [160/447], Loss: 2.9434
Epoch [29/60], Batch [170/447], Loss: 2.2492
Epoch [29/60], Batch [180/447], Loss: 2.4869
Epoch [29/60], Batch [190/447], Loss: 2.3460
Epoch [29/60], Batch [200/447], Loss: 1.9538
Epoch [29/60], Batch [210/447], Loss: 2.8931
Epoch [29/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [30/60], Batch [0/447], Loss: 2.8704
Epoch [30/60], Batch [10/447], Loss: 2.3326
Epoch [30/60], Batch [20/447], Loss: 2.4626
Epoch [30/60], Batch [30/447], Loss: 2.6843
Epoch [30/60], Batch [40/447], Loss: 2.6362
Epoch [30/60], Batch [50/447], Loss: 2.6499
Epoch [30/60], Batch [60/447], Loss: 2.6741
Epoch [30/60], Batch [70/447], Loss: 2.8005
Epoch [30/60], Batch [80/447], Loss: 2.3550
Epoch [30/60], Batch [90/447], Loss: 2.7702
Epoch [30/60], Batch [100/447], Loss: 2.4911
Epoch [30/60], Batch [110/447], Loss: 2.1680
Epoch [30/60], Batch [120/447], Loss: 2.3120
Epoch [30/60], Batch [130/447], Loss: 2.9130
Epoch [30/60], Batch [140/447], Loss: 2.4558
Epoch [30/60], Batch [150/447], Loss: 2.4270
Epoch [30/60], Batch [160/447], Loss: 3.1982
Epoch [30/60], Batch [170/447], Loss: 2.6714
Epoch [30/60], Batch [180/447], Loss: 2.5091
Epoch [30/60], Batch [190/447], Loss: 2.8675
Epoch [30/60], Batch [200/447], Loss: 2.7164
Epoch [30/60], Batch [210/447], Loss: 2.5057
Epoch [30/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [31/60], Batch [0/447], Loss: 2.2489
Epoch [31/60], Batch [10/447], Loss: 2.5941
Epoch [31/60], Batch [20/447], Loss: 2.6917
Epoch [31/60], Batch [30/447], Loss: 2.3144
Epoch [31/60], Batch [40/447], Loss: 2.4463
Epoch [31/60], Batch [50/447], Loss: 2.3112
Epoch [31/60], Batch [60/447], Loss: 2.8130
Epoch [31/60], Batch [70/447], Loss: 2.3700
Epoch [31/60], Batch [80/447], Loss: 2.5521
Epoch [31/60], Batch [90/447], Loss: 2.6871
Epoch [31/60], Batch [100/447], Loss: 2.0260
Epoch [31/60], Batch [110/447], Loss: 2.0874
Epoch [31/60], Batch [120/447], Loss: 2.1714
Epoch [31/60], Batch [130/447], Loss: 2.9736
Epoch [31/60], Batch [140/447], Loss: 2.2142
Epoch [31/60], Batch [150/447], Loss: 2.4669
Epoch [31/60], Batch [160/447], Loss: 2.3425
Epoch [31/60], Batch [170/447], Loss: 2.8811
Epoch [31/60], Batch [180/447], Loss: 1.9958
Epoch [31/60], Batch [190/447], Loss: 2.1782
Epoch [31/60], Batch [200/447], Loss: 2.7629
Epoch [31/60], Batch [210/447], Loss: 2.4095
Epoch [31/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [32/60], Batch [0/447], Loss: 2.5941
Epoch [32/60], Batch [10/447], Loss: 1.9421
Epoch [32/60], Batch [20/447], Loss: 2.5673
Epoch [32/60], Batch [30/447], Loss: 2.5549
Epoch [32/60], Batch [40/447], Loss: 2.0723
Epoch [32/60], Batch [50/447], Loss: 2.9991
Epoch [32/60], Batch [60/447], Loss: 3.1880
Epoch [32/60], Batch [70/447], Loss: 2.7274
Epoch [32/60], Batch [80/447], Loss: 2.2150
Epoch [32/60], Batch [90/447], Loss: 3.0661
Epoch [32/60], Batch [100/447], Loss: 3.1096
Epoch [32/60], Batch [110/447], Loss: 2.6835
Epoch [32/60], Batch [120/447], Loss: 2.6538
Epoch [32/60], Batch [130/447], Loss: 2.7514
Epoch [32/60], Batch [140/447], Loss: 2.7245
Epoch [32/60], Batch [150/447], Loss: 2.9756
Epoch [32/60], Batch [160/447], Loss: 2.8883
Epoch [32/60], Batch [170/447], Loss: 2.0483
Epoch [32/60], Batch [180/447], Loss: 2.7046
Epoch [32/60], Batch [190/447], Loss: 2.1542
Epoch [32/60], Batch [200/447], Loss: 2.4715
Epoch [32/60], Batch [210/447], Loss: 2.3447
Epoch [32/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [33/60], Batch [0/447], Loss: 2.3673
Epoch [33/60], Batch [10/447], Loss: 2.6021
Epoch [33/60], Batch [20/447], Loss: 2.0023
Epoch [33/60], Batch [30/447], Loss: 2.9386
Epoch [33/60], Batch [40/447], Loss: 2.5504
Epoch [33/60], Batch [50/447], Loss: 2.1514
Epoch [33/60], Batch [60/447], Loss: 3.2383
Epoch [33/60], Batch [70/447], Loss: 2.2903
Epoch [33/60], Batch [80/447], Loss: 2.6199
Epoch [33/60], Batch [90/447], Loss: 2.6093
Epoch [33/60], Batch [100/447], Loss: 2.8962
Epoch [33/60], Batch [110/447], Loss: 2.1793
Epoch [33/60], Batch [120/447], Loss: 2.2874
Epoch [33/60], Batch [130/447], Loss: 2.4212
Epoch [33/60], Batch [140/447], Loss: 3.3134
Epoch [33/60], Batch [150/447], Loss: 2.4257
Epoch [33/60], Batch [160/447], Loss: 2.5714
Epoch [33/60], Batch [170/447], Loss: 2.0414
Epoch [33/60], Batch [180/447], Loss: 2.7003
Epoch [33/60], Batch [190/447], Loss: 2.8710
Epoch [33/60], Batch [200/447], Loss: 2.2515
Epoch [33/60], Batch [210/447], Loss: 2.2305
Epoch [33/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [34/60], Batch [0/447], Loss: 2.3659
Epoch [34/60], Batch [10/447], Loss: 2.1641
Epoch [34/60], Batch [20/447], Loss: 2.3069
Epoch [34/60], Batch [30/447], Loss: 2.0756
Epoch [34/60], Batch [40/447], Loss: 1.7878
Epoch [34/60], Batch [50/447], Loss: 2.2443
Epoch [34/60], Batch [60/447], Loss: 2.2258
Epoch [34/60], Batch [70/447], Loss: 2.3669
Epoch [34/60], Batch [80/447], Loss: 1.6524
Epoch [34/60], Batch [90/447], Loss: 2.6682
Epoch [34/60], Batch [100/447], Loss: 2.8744
Epoch [34/60], Batch [110/447], Loss: 2.0960
Epoch [34/60], Batch [120/447], Loss: 2.5094
Epoch [34/60], Batch [130/447], Loss: 2.6138
Epoch [34/60], Batch [140/447], Loss: 2.3913
Epoch [34/60], Batch [150/447], Loss: 2.2675
Epoch [34/60], Batch [160/447], Loss: 2.6455
Epoch [34/60], Batch [170/447], Loss: 2.6320
Epoch [34/60], Batch [180/447], Loss: 1.9600
Epoch [34/60], Batch [190/447], Loss: 2.4954
Epoch [34/60], Batch [200/447], Loss: 2.4090
Epoch [34/60], Batch [210/447], Loss: 2.4293
Epoch [34/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [35/60], Batch [0/447], Loss: 2.7319
Epoch [35/60], Batch [10/447], Loss: 2.8900
Epoch [35/60], Batch [20/447], Loss: 2.3631
Epoch [35/60], Batch [30/447], Loss: 2.3661
Epoch [35/60], Batch [40/447], Loss: 2.2547
Epoch [35/60], Batch [50/447], Loss: 3.2502
Epoch [35/60], Batch [60/447], Loss: 2.9036
Epoch [35/60], Batch [70/447], Loss: 2.3186
Epoch [35/60], Batch [80/447], Loss: 2.6559
Epoch [35/60], Batch [90/447], Loss: 2.6332
Epoch [35/60], Batch [100/447], Loss: 2.2440
Epoch [35/60], Batch [110/447], Loss: 2.2286
Epoch [35/60], Batch [120/447], Loss: 2.3607
Epoch [35/60], Batch [130/447], Loss: 2.4436
Epoch [35/60], Batch [140/447], Loss: 2.6814
Epoch [35/60], Batch [150/447], Loss: 2.8570
Epoch [35/60], Batch [160/447], Loss: 2.7794
Epoch [35/60], Batch [170/447], Loss: 2.3977
Epoch [35/60], Batch [180/447], Loss: 2.1057
Epoch [35/60], Batch [190/447], Loss: 2.2837
Epoch [35/60], Batch [200/447], Loss: 2.5062
Epoch [35/60], Batch [210/447], Loss: 2.7757
Epoch [35/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [36/60], Batch [0/447], Loss: 2.8003
Epoch [36/60], Batch [10/447], Loss: 2.7949
Epoch [36/60], Batch [20/447], Loss: 2.2588
Epoch [36/60], Batch [30/447], Loss: 2.1769
Epoch [36/60], Batch [40/447], Loss: 2.3999
Epoch [36/60], Batch [50/447], Loss: 2.5736
Epoch [36/60], Batch [60/447], Loss: 1.7638
Epoch [36/60], Batch [70/447], Loss: 2.3141
Epoch [36/60], Batch [80/447], Loss: 2.3194
Epoch [36/60], Batch [90/447], Loss: 2.5521
Epoch [36/60], Batch [100/447], Loss: 2.7299
Epoch [36/60], Batch [110/447], Loss: 1.9476
Epoch [36/60], Batch [120/447], Loss: 2.4832
Epoch [36/60], Batch [130/447], Loss: 2.6279
Epoch [36/60], Batch [140/447], Loss: 2.5535
Epoch [36/60], Batch [150/447], Loss: 2.7364
Epoch [36/60], Batch [160/447], Loss: 2.2200
Epoch [36/60], Batch [170/447], Loss: 2.9125
Epoch [36/60], Batch [180/447], Loss: 2.0765
Epoch [36/60], Batch [190/447], Loss: 2.4782
Epoch [36/60], Batch [200/447], Loss: 2.6673
Epoch [36/60], Batch [210/447], Loss: 1.3100
Epoch [36/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [37/60], Batch [0/447], Loss: 2.4423
Epoch [37/60], Batch [10/447], Loss: 1.9230
Epoch [37/60], Batch [20/447], Loss: 1.5732
Epoch [37/60], Batch [30/447], Loss: 2.5612
Epoch [37/60], Batch [40/447], Loss: 2.6977
Epoch [37/60], Batch [50/447], Loss: 2.4457
Epoch [37/60], Batch [60/447], Loss: 2.2311
Epoch [37/60], Batch [70/447], Loss: 2.2448
Epoch [37/60], Batch [80/447], Loss: 2.4370
Epoch [37/60], Batch [90/447], Loss: 1.8945
Epoch [37/60], Batch [100/447], Loss: 2.0705
Epoch [37/60], Batch [110/447], Loss: 2.6848
Epoch [37/60], Batch [120/447], Loss: 2.2879
Epoch [37/60], Batch [130/447], Loss: 2.0022
Epoch [37/60], Batch [140/447], Loss: 2.2645
Epoch [37/60], Batch [150/447], Loss: 2.5566
Epoch [37/60], Batch [160/447], Loss: 2.8354
Epoch [37/60], Batch [170/447], Loss: 2.0077
Epoch [37/60], Batch [180/447], Loss: 2.1526
Epoch [37/60], Batch [190/447], Loss: 2.6797
Epoch [37/60], Batch [200/447], Loss: 2.3415
Epoch [37/60], Batch [210/447], Loss: 2.5892
Epoch [37/60], Batch 

[I 2024-12-13 12:34:48,536] Trial 5 pruned. 


Epoch [37/60], Validation Accuracy: 0.7092, Validation Loss: 1.0415
No improvement in validation accuracy for 5 epoch(s).
Early stopping at epoch 37.
Trial early stopped due to lack of improvement.
Starting a new trial...
Trial 6: alpha = 1.6443457513284063
Building the model...


2024-12-13 12:34:48,886 - mmaction - INFO - load model from: https://download.openmmlab.com/mmaction/recognition/csn/ircsn_from_scratch_r50_ig65m_20210617-ce545a37.pth
2024-12-13 12:34:48,887 - mmaction - INFO - load checkpoint from http path: https://download.openmmlab.com/mmaction/recognition/csn/ircsn_from_scratch_r50_ig65m_20210617-ce545a37.pth


Model built successfully!
Starting training...


  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [1/60], Batch [0/447], Loss: 4.0447
Epoch [1/60], Batch [10/447], Loss: 3.9984
Epoch [1/60], Batch [20/447], Loss: 3.8925
Epoch [1/60], Batch [30/447], Loss: 3.9472
Epoch [1/60], Batch [40/447], Loss: 3.9626
Epoch [1/60], Batch [50/447], Loss: 3.9366
Epoch [1/60], Batch [60/447], Loss: 3.9397
Epoch [1/60], Batch [70/447], Loss: 3.9028
Epoch [1/60], Batch [80/447], Loss: 3.9948
Epoch [1/60], Batch [90/447], Loss: 3.9593
Epoch [1/60], Batch [100/447], Loss: 3.9506
Epoch [1/60], Batch [110/447], Loss: 3.9392
Epoch [1/60], Batch [120/447], Loss: 3.9854
Epoch [1/60], Batch [130/447], Loss: 3.7870
Epoch [1/60], Batch [140/447], Loss: 3.9498
Epoch [1/60], Batch [150/447], Loss: 3.9253
Epoch [1/60], Batch [160/447], Loss: 3.9994
Epoch [1/60], Batch [170/447], Loss: 3.9608
Epoch [1/60], Batch [180/447], Loss: 3.9984
Epoch [1/60], Batch [190/447], Loss: 3.8786
Epoch [1/60], Batch [200/447], Loss: 4.0423
Epoch [1/60], Batch [210/447], Loss: 3.9361
Epoch [1/60], Batch [220/447], Loss: 3.9273

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [2/60], Batch [0/447], Loss: 3.9882
Epoch [2/60], Batch [10/447], Loss: 3.8404
Epoch [2/60], Batch [20/447], Loss: 3.9129
Epoch [2/60], Batch [30/447], Loss: 3.8042
Epoch [2/60], Batch [40/447], Loss: 3.7645
Epoch [2/60], Batch [50/447], Loss: 3.7876
Epoch [2/60], Batch [60/447], Loss: 3.8709
Epoch [2/60], Batch [70/447], Loss: 3.7412
Epoch [2/60], Batch [80/447], Loss: 3.6793
Epoch [2/60], Batch [90/447], Loss: 3.7384
Epoch [2/60], Batch [100/447], Loss: 3.8492
Epoch [2/60], Batch [110/447], Loss: 3.9229
Epoch [2/60], Batch [120/447], Loss: 3.6822
Epoch [2/60], Batch [130/447], Loss: 3.8285
Epoch [2/60], Batch [140/447], Loss: 3.9324
Epoch [2/60], Batch [150/447], Loss: 3.8713
Epoch [2/60], Batch [160/447], Loss: 4.0045
Epoch [2/60], Batch [170/447], Loss: 3.8255
Epoch [2/60], Batch [180/447], Loss: 3.8018
Epoch [2/60], Batch [190/447], Loss: 4.0401
Epoch [2/60], Batch [200/447], Loss: 3.7876
Epoch [2/60], Batch [210/447], Loss: 3.6490
Epoch [2/60], Batch [220/447], Loss: 3.7246

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [3/60], Batch [0/447], Loss: 3.7827
Epoch [3/60], Batch [10/447], Loss: 3.7953
Epoch [3/60], Batch [20/447], Loss: 3.7352
Epoch [3/60], Batch [30/447], Loss: 3.7224
Epoch [3/60], Batch [40/447], Loss: 3.6762
Epoch [3/60], Batch [50/447], Loss: 3.6040
Epoch [3/60], Batch [60/447], Loss: 3.6651
Epoch [3/60], Batch [70/447], Loss: 3.7712
Epoch [3/60], Batch [80/447], Loss: 3.7521
Epoch [3/60], Batch [90/447], Loss: 3.8824
Epoch [3/60], Batch [100/447], Loss: 3.8389
Epoch [3/60], Batch [110/447], Loss: 3.7883
Epoch [3/60], Batch [120/447], Loss: 3.8588
Epoch [3/60], Batch [130/447], Loss: 3.8450
Epoch [3/60], Batch [140/447], Loss: 3.7565
Epoch [3/60], Batch [150/447], Loss: 3.6338
Epoch [3/60], Batch [160/447], Loss: 3.8507
Epoch [3/60], Batch [170/447], Loss: 3.8020
Epoch [3/60], Batch [180/447], Loss: 3.7757
Epoch [3/60], Batch [190/447], Loss: 3.8422
Epoch [3/60], Batch [200/447], Loss: 3.9273
Epoch [3/60], Batch [210/447], Loss: 3.8477
Epoch [3/60], Batch [220/447], Loss: 3.4612

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [4/60], Batch [0/447], Loss: 3.5698
Epoch [4/60], Batch [10/447], Loss: 3.7975
Epoch [4/60], Batch [20/447], Loss: 3.7748
Epoch [4/60], Batch [30/447], Loss: 3.5417
Epoch [4/60], Batch [40/447], Loss: 3.5705
Epoch [4/60], Batch [50/447], Loss: 3.5144
Epoch [4/60], Batch [60/447], Loss: 3.5101
Epoch [4/60], Batch [70/447], Loss: 3.6010
Epoch [4/60], Batch [80/447], Loss: 3.8334
Epoch [4/60], Batch [90/447], Loss: 3.7827
Epoch [4/60], Batch [100/447], Loss: 3.7439
Epoch [4/60], Batch [110/447], Loss: 3.5473
Epoch [4/60], Batch [120/447], Loss: 3.3496
Epoch [4/60], Batch [130/447], Loss: 3.7860
Epoch [4/60], Batch [140/447], Loss: 3.4669
Epoch [4/60], Batch [150/447], Loss: 3.5815
Epoch [4/60], Batch [160/447], Loss: 3.6327
Epoch [4/60], Batch [170/447], Loss: 3.5148
Epoch [4/60], Batch [180/447], Loss: 3.7170
Epoch [4/60], Batch [190/447], Loss: 3.8140
Epoch [4/60], Batch [200/447], Loss: 3.9594
Epoch [4/60], Batch [210/447], Loss: 3.4069
Epoch [4/60], Batch [220/447], Loss: 3.9617

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [5/60], Batch [0/447], Loss: 3.6339
Epoch [5/60], Batch [10/447], Loss: 3.7231
Epoch [5/60], Batch [20/447], Loss: 3.4654
Epoch [5/60], Batch [30/447], Loss: 3.7750
Epoch [5/60], Batch [40/447], Loss: 3.5969
Epoch [5/60], Batch [50/447], Loss: 3.5423
Epoch [5/60], Batch [60/447], Loss: 3.6874
Epoch [5/60], Batch [70/447], Loss: 3.5024
Epoch [5/60], Batch [80/447], Loss: 3.5293
Epoch [5/60], Batch [90/447], Loss: 3.3686
Epoch [5/60], Batch [100/447], Loss: 3.7316
Epoch [5/60], Batch [110/447], Loss: 3.5292
Epoch [5/60], Batch [120/447], Loss: 3.5960
Epoch [5/60], Batch [130/447], Loss: 3.6921
Epoch [5/60], Batch [140/447], Loss: 3.8291
Epoch [5/60], Batch [150/447], Loss: 3.6534
Epoch [5/60], Batch [160/447], Loss: 3.6926
Epoch [5/60], Batch [170/447], Loss: 3.6241
Epoch [5/60], Batch [180/447], Loss: 3.5975
Epoch [5/60], Batch [190/447], Loss: 3.6209
Epoch [5/60], Batch [200/447], Loss: 3.7716
Epoch [5/60], Batch [210/447], Loss: 3.8151
Epoch [5/60], Batch [220/447], Loss: 3.5196

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [6/60], Batch [0/447], Loss: 3.5683
Epoch [6/60], Batch [10/447], Loss: 3.4841
Epoch [6/60], Batch [20/447], Loss: 3.6516
Epoch [6/60], Batch [30/447], Loss: 3.5831
Epoch [6/60], Batch [40/447], Loss: 3.2725
Epoch [6/60], Batch [50/447], Loss: 3.5919
Epoch [6/60], Batch [60/447], Loss: 3.5125
Epoch [6/60], Batch [70/447], Loss: 3.1257
Epoch [6/60], Batch [80/447], Loss: 3.5534
Epoch [6/60], Batch [90/447], Loss: 3.2467
Epoch [6/60], Batch [100/447], Loss: 3.4654
Epoch [6/60], Batch [110/447], Loss: 3.4248
Epoch [6/60], Batch [120/447], Loss: 3.6038
Epoch [6/60], Batch [130/447], Loss: 3.5335
Epoch [6/60], Batch [140/447], Loss: 3.3955
Epoch [6/60], Batch [150/447], Loss: 3.3262
Epoch [6/60], Batch [160/447], Loss: 3.4014
Epoch [6/60], Batch [170/447], Loss: 3.3687
Epoch [6/60], Batch [180/447], Loss: 3.8655
Epoch [6/60], Batch [190/447], Loss: 3.5071
Epoch [6/60], Batch [200/447], Loss: 3.7059
Epoch [6/60], Batch [210/447], Loss: 3.5600
Epoch [6/60], Batch [220/447], Loss: 3.6590

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [7/60], Batch [0/447], Loss: 3.3546
Epoch [7/60], Batch [10/447], Loss: 3.6434
Epoch [7/60], Batch [20/447], Loss: 3.1272
Epoch [7/60], Batch [30/447], Loss: 3.4512
Epoch [7/60], Batch [40/447], Loss: 3.5271
Epoch [7/60], Batch [50/447], Loss: 3.2817
Epoch [7/60], Batch [60/447], Loss: 3.6105
Epoch [7/60], Batch [70/447], Loss: 3.4216
Epoch [7/60], Batch [80/447], Loss: 3.5965
Epoch [7/60], Batch [90/447], Loss: 3.0128
Epoch [7/60], Batch [100/447], Loss: 3.2747
Epoch [7/60], Batch [110/447], Loss: 3.5532
Epoch [7/60], Batch [120/447], Loss: 3.3669
Epoch [7/60], Batch [130/447], Loss: 3.5717
Epoch [7/60], Batch [140/447], Loss: 3.4310
Epoch [7/60], Batch [150/447], Loss: 3.6165
Epoch [7/60], Batch [160/447], Loss: 3.7071
Epoch [7/60], Batch [170/447], Loss: 3.4618
Epoch [7/60], Batch [180/447], Loss: 3.5761
Epoch [7/60], Batch [190/447], Loss: 3.8164
Epoch [7/60], Batch [200/447], Loss: 3.4978
Epoch [7/60], Batch [210/447], Loss: 3.0373
Epoch [7/60], Batch [220/447], Loss: 3.3921

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [8/60], Batch [0/447], Loss: 3.5372
Epoch [8/60], Batch [10/447], Loss: 3.5280
Epoch [8/60], Batch [20/447], Loss: 3.5082
Epoch [8/60], Batch [30/447], Loss: 3.4671
Epoch [8/60], Batch [40/447], Loss: 3.6401
Epoch [8/60], Batch [50/447], Loss: 3.5246
Epoch [8/60], Batch [60/447], Loss: 3.7969
Epoch [8/60], Batch [70/447], Loss: 3.4640
Epoch [8/60], Batch [80/447], Loss: 3.3000
Epoch [8/60], Batch [90/447], Loss: 3.4871
Epoch [8/60], Batch [100/447], Loss: 3.1039
Epoch [8/60], Batch [110/447], Loss: 3.0883
Epoch [8/60], Batch [120/447], Loss: 3.7066
Epoch [8/60], Batch [130/447], Loss: 3.7772
Epoch [8/60], Batch [140/447], Loss: 2.8006
Epoch [8/60], Batch [150/447], Loss: 3.5396
Epoch [8/60], Batch [160/447], Loss: 3.3695
Epoch [8/60], Batch [170/447], Loss: 3.1143
Epoch [8/60], Batch [180/447], Loss: 3.1642
Epoch [8/60], Batch [190/447], Loss: 3.4663
Epoch [8/60], Batch [200/447], Loss: 3.2601
Epoch [8/60], Batch [210/447], Loss: 3.1724
Epoch [8/60], Batch [220/447], Loss: 2.8817

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [9/60], Batch [0/447], Loss: 3.4689
Epoch [9/60], Batch [10/447], Loss: 3.0925
Epoch [9/60], Batch [20/447], Loss: 3.0606
Epoch [9/60], Batch [30/447], Loss: 3.5711
Epoch [9/60], Batch [40/447], Loss: 3.3936
Epoch [9/60], Batch [50/447], Loss: 3.3161
Epoch [9/60], Batch [60/447], Loss: 2.9781
Epoch [9/60], Batch [70/447], Loss: 3.4756
Epoch [9/60], Batch [80/447], Loss: 3.0044
Epoch [9/60], Batch [90/447], Loss: 3.4769
Epoch [9/60], Batch [100/447], Loss: 3.2344
Epoch [9/60], Batch [110/447], Loss: 3.5348
Epoch [9/60], Batch [120/447], Loss: 3.0687
Epoch [9/60], Batch [130/447], Loss: 3.3512
Epoch [9/60], Batch [140/447], Loss: 3.0225
Epoch [9/60], Batch [150/447], Loss: 3.6554
Epoch [9/60], Batch [160/447], Loss: 3.4829
Epoch [9/60], Batch [170/447], Loss: 3.2083
Epoch [9/60], Batch [180/447], Loss: 2.7197
Epoch [9/60], Batch [190/447], Loss: 3.3011
Epoch [9/60], Batch [200/447], Loss: 3.3978
Epoch [9/60], Batch [210/447], Loss: 3.0461
Epoch [9/60], Batch [220/447], Loss: 3.0882

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [10/60], Batch [0/447], Loss: 3.2524
Epoch [10/60], Batch [10/447], Loss: 3.2822
Epoch [10/60], Batch [20/447], Loss: 3.3590
Epoch [10/60], Batch [30/447], Loss: 3.4933
Epoch [10/60], Batch [40/447], Loss: 2.7320
Epoch [10/60], Batch [50/447], Loss: 3.5630
Epoch [10/60], Batch [60/447], Loss: 3.4001
Epoch [10/60], Batch [70/447], Loss: 3.3351
Epoch [10/60], Batch [80/447], Loss: 3.2423
Epoch [10/60], Batch [90/447], Loss: 2.8768
Epoch [10/60], Batch [100/447], Loss: 3.3239
Epoch [10/60], Batch [110/447], Loss: 3.2767
Epoch [10/60], Batch [120/447], Loss: 3.6096
Epoch [10/60], Batch [130/447], Loss: 3.4779
Epoch [10/60], Batch [140/447], Loss: 3.1696
Epoch [10/60], Batch [150/447], Loss: 2.7127
Epoch [10/60], Batch [160/447], Loss: 3.3364
Epoch [10/60], Batch [170/447], Loss: 2.9097
Epoch [10/60], Batch [180/447], Loss: 3.3026
Epoch [10/60], Batch [190/447], Loss: 3.2469
Epoch [10/60], Batch [200/447], Loss: 3.1448
Epoch [10/60], Batch [210/447], Loss: 3.2514
Epoch [10/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [11/60], Batch [0/447], Loss: 2.8718
Epoch [11/60], Batch [10/447], Loss: 3.0800
Epoch [11/60], Batch [20/447], Loss: 3.0550
Epoch [11/60], Batch [30/447], Loss: 3.3329
Epoch [11/60], Batch [40/447], Loss: 3.4204
Epoch [11/60], Batch [50/447], Loss: 2.9861
Epoch [11/60], Batch [60/447], Loss: 2.9191
Epoch [11/60], Batch [70/447], Loss: 3.1839
Epoch [11/60], Batch [80/447], Loss: 3.0663
Epoch [11/60], Batch [90/447], Loss: 3.4654
Epoch [11/60], Batch [100/447], Loss: 3.2605
Epoch [11/60], Batch [110/447], Loss: 3.0558
Epoch [11/60], Batch [120/447], Loss: 3.4690
Epoch [11/60], Batch [130/447], Loss: 3.3006
Epoch [11/60], Batch [140/447], Loss: 3.0501
Epoch [11/60], Batch [150/447], Loss: 3.0470
Epoch [11/60], Batch [160/447], Loss: 2.9676
Epoch [11/60], Batch [170/447], Loss: 3.1357
Epoch [11/60], Batch [180/447], Loss: 3.3297
Epoch [11/60], Batch [190/447], Loss: 3.1079
Epoch [11/60], Batch [200/447], Loss: 2.9329
Epoch [11/60], Batch [210/447], Loss: 3.0556
Epoch [11/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [12/60], Batch [0/447], Loss: 3.1888
Epoch [12/60], Batch [10/447], Loss: 3.4050
Epoch [12/60], Batch [20/447], Loss: 2.9824
Epoch [12/60], Batch [30/447], Loss: 2.6728
Epoch [12/60], Batch [40/447], Loss: 3.4782
Epoch [12/60], Batch [50/447], Loss: 3.2953
Epoch [12/60], Batch [60/447], Loss: 3.2827
Epoch [12/60], Batch [70/447], Loss: 3.1751
Epoch [12/60], Batch [80/447], Loss: 3.5138
Epoch [12/60], Batch [90/447], Loss: 2.7890
Epoch [12/60], Batch [100/447], Loss: 2.8523
Epoch [12/60], Batch [110/447], Loss: 2.8907
Epoch [12/60], Batch [120/447], Loss: 2.6796
Epoch [12/60], Batch [130/447], Loss: 3.2922
Epoch [12/60], Batch [140/447], Loss: 2.9469
Epoch [12/60], Batch [150/447], Loss: 2.6974
Epoch [12/60], Batch [160/447], Loss: 3.0314
Epoch [12/60], Batch [170/447], Loss: 2.7970
Epoch [12/60], Batch [180/447], Loss: 3.2803
Epoch [12/60], Batch [190/447], Loss: 3.2130
Epoch [12/60], Batch [200/447], Loss: 3.1557
Epoch [12/60], Batch [210/447], Loss: 3.1888
Epoch [12/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [13/60], Batch [0/447], Loss: 3.4646
Epoch [13/60], Batch [10/447], Loss: 2.9900
Epoch [13/60], Batch [20/447], Loss: 3.3427
Epoch [13/60], Batch [30/447], Loss: 2.7964
Epoch [13/60], Batch [40/447], Loss: 3.1374
Epoch [13/60], Batch [50/447], Loss: 2.7621
Epoch [13/60], Batch [60/447], Loss: 2.7467
Epoch [13/60], Batch [70/447], Loss: 2.9715
Epoch [13/60], Batch [80/447], Loss: 3.2273
Epoch [13/60], Batch [90/447], Loss: 2.9786
Epoch [13/60], Batch [100/447], Loss: 2.9482
Epoch [13/60], Batch [110/447], Loss: 3.2284
Epoch [13/60], Batch [120/447], Loss: 2.9210
Epoch [13/60], Batch [130/447], Loss: 3.3238
Epoch [13/60], Batch [140/447], Loss: 3.4673
Epoch [13/60], Batch [150/447], Loss: 3.1454
Epoch [13/60], Batch [160/447], Loss: 2.8377
Epoch [13/60], Batch [170/447], Loss: 3.2801
Epoch [13/60], Batch [180/447], Loss: 2.8044
Epoch [13/60], Batch [190/447], Loss: 3.6444
Epoch [13/60], Batch [200/447], Loss: 3.0010
Epoch [13/60], Batch [210/447], Loss: 3.1607
Epoch [13/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [14/60], Batch [0/447], Loss: 3.1029
Epoch [14/60], Batch [10/447], Loss: 3.1551
Epoch [14/60], Batch [20/447], Loss: 3.1565
Epoch [14/60], Batch [30/447], Loss: 3.0660
Epoch [14/60], Batch [40/447], Loss: 3.4849
Epoch [14/60], Batch [50/447], Loss: 3.5737
Epoch [14/60], Batch [60/447], Loss: 2.9725
Epoch [14/60], Batch [70/447], Loss: 2.9318
Epoch [14/60], Batch [80/447], Loss: 3.0278
Epoch [14/60], Batch [90/447], Loss: 2.9396
Epoch [14/60], Batch [100/447], Loss: 3.4234
Epoch [14/60], Batch [110/447], Loss: 2.8765
Epoch [14/60], Batch [120/447], Loss: 2.8626
Epoch [14/60], Batch [130/447], Loss: 3.0459
Epoch [14/60], Batch [140/447], Loss: 3.1319
Epoch [14/60], Batch [150/447], Loss: 3.2912
Epoch [14/60], Batch [160/447], Loss: 2.8990
Epoch [14/60], Batch [170/447], Loss: 2.3112
Epoch [14/60], Batch [180/447], Loss: 3.3238
Epoch [14/60], Batch [190/447], Loss: 2.8169
Epoch [14/60], Batch [200/447], Loss: 3.1079
Epoch [14/60], Batch [210/447], Loss: 3.1973
Epoch [14/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [15/60], Batch [0/447], Loss: 2.5540
Epoch [15/60], Batch [10/447], Loss: 3.5851
Epoch [15/60], Batch [20/447], Loss: 3.1518
Epoch [15/60], Batch [30/447], Loss: 2.8372
Epoch [15/60], Batch [40/447], Loss: 2.9789
Epoch [15/60], Batch [50/447], Loss: 2.7876
Epoch [15/60], Batch [60/447], Loss: 2.4922
Epoch [15/60], Batch [70/447], Loss: 2.7190
Epoch [15/60], Batch [80/447], Loss: 2.9926
Epoch [15/60], Batch [90/447], Loss: 3.1154
Epoch [15/60], Batch [100/447], Loss: 2.2412
Epoch [15/60], Batch [110/447], Loss: 2.8092
Epoch [15/60], Batch [120/447], Loss: 3.0021
Epoch [15/60], Batch [130/447], Loss: 2.7074
Epoch [15/60], Batch [140/447], Loss: 2.5928
Epoch [15/60], Batch [150/447], Loss: 3.2717
Epoch [15/60], Batch [160/447], Loss: 2.7094
Epoch [15/60], Batch [170/447], Loss: 3.2557
Epoch [15/60], Batch [180/447], Loss: 2.8139
Epoch [15/60], Batch [190/447], Loss: 3.3374
Epoch [15/60], Batch [200/447], Loss: 2.7675
Epoch [15/60], Batch [210/447], Loss: 2.7988
Epoch [15/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [16/60], Batch [0/447], Loss: 2.7173
Epoch [16/60], Batch [10/447], Loss: 3.0105
Epoch [16/60], Batch [20/447], Loss: 3.1177
Epoch [16/60], Batch [30/447], Loss: 2.9149
Epoch [16/60], Batch [40/447], Loss: 2.8810
Epoch [16/60], Batch [50/447], Loss: 3.3794
Epoch [16/60], Batch [60/447], Loss: 2.4747
Epoch [16/60], Batch [70/447], Loss: 2.8330
Epoch [16/60], Batch [80/447], Loss: 3.0754
Epoch [16/60], Batch [90/447], Loss: 2.8355
Epoch [16/60], Batch [100/447], Loss: 2.4113
Epoch [16/60], Batch [110/447], Loss: 2.8866
Epoch [16/60], Batch [120/447], Loss: 3.2053
Epoch [16/60], Batch [130/447], Loss: 2.4985
Epoch [16/60], Batch [140/447], Loss: 2.9889
Epoch [16/60], Batch [150/447], Loss: 3.1118
Epoch [16/60], Batch [160/447], Loss: 3.3008
Epoch [16/60], Batch [170/447], Loss: 3.2141
Epoch [16/60], Batch [180/447], Loss: 2.9702
Epoch [16/60], Batch [190/447], Loss: 2.8675
Epoch [16/60], Batch [200/447], Loss: 2.1746
Epoch [16/60], Batch [210/447], Loss: 2.6860
Epoch [16/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [17/60], Batch [0/447], Loss: 2.3438
Epoch [17/60], Batch [10/447], Loss: 3.3265
Epoch [17/60], Batch [20/447], Loss: 2.8572
Epoch [17/60], Batch [30/447], Loss: 2.6019
Epoch [17/60], Batch [40/447], Loss: 2.9751
Epoch [17/60], Batch [50/447], Loss: 3.0328
Epoch [17/60], Batch [60/447], Loss: 3.7964
Epoch [17/60], Batch [70/447], Loss: 2.7291
Epoch [17/60], Batch [80/447], Loss: 3.1705
Epoch [17/60], Batch [90/447], Loss: 2.3819
Epoch [17/60], Batch [100/447], Loss: 2.7822
Epoch [17/60], Batch [110/447], Loss: 2.6208
Epoch [17/60], Batch [120/447], Loss: 2.4602
Epoch [17/60], Batch [130/447], Loss: 2.9253
Epoch [17/60], Batch [140/447], Loss: 2.8879
Epoch [17/60], Batch [150/447], Loss: 2.8464
Epoch [17/60], Batch [160/447], Loss: 2.8654
Epoch [17/60], Batch [170/447], Loss: 3.0860
Epoch [17/60], Batch [180/447], Loss: 3.0507
Epoch [17/60], Batch [190/447], Loss: 3.1671
Epoch [17/60], Batch [200/447], Loss: 3.1526
Epoch [17/60], Batch [210/447], Loss: 2.9978
Epoch [17/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [18/60], Batch [0/447], Loss: 3.0589
Epoch [18/60], Batch [10/447], Loss: 2.7180
Epoch [18/60], Batch [20/447], Loss: 3.2591
Epoch [18/60], Batch [30/447], Loss: 3.6541
Epoch [18/60], Batch [40/447], Loss: 2.2885
Epoch [18/60], Batch [50/447], Loss: 2.8817
Epoch [18/60], Batch [60/447], Loss: 2.7721
Epoch [18/60], Batch [70/447], Loss: 2.2484
Epoch [18/60], Batch [80/447], Loss: 2.5622
Epoch [18/60], Batch [90/447], Loss: 3.1906
Epoch [18/60], Batch [100/447], Loss: 2.7977
Epoch [18/60], Batch [110/447], Loss: 2.3525
Epoch [18/60], Batch [120/447], Loss: 2.8844
Epoch [18/60], Batch [130/447], Loss: 2.8080
Epoch [18/60], Batch [140/447], Loss: 2.7264
Epoch [18/60], Batch [150/447], Loss: 2.7532
Epoch [18/60], Batch [160/447], Loss: 2.6255
Epoch [18/60], Batch [170/447], Loss: 2.8556
Epoch [18/60], Batch [180/447], Loss: 2.9649
Epoch [18/60], Batch [190/447], Loss: 2.8941
Epoch [18/60], Batch [200/447], Loss: 2.8738
Epoch [18/60], Batch [210/447], Loss: 2.5742
Epoch [18/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [19/60], Batch [0/447], Loss: 2.5184
Epoch [19/60], Batch [10/447], Loss: 2.7860
Epoch [19/60], Batch [20/447], Loss: 2.9132
Epoch [19/60], Batch [30/447], Loss: 3.0235
Epoch [19/60], Batch [40/447], Loss: 2.9491
Epoch [19/60], Batch [50/447], Loss: 2.8204
Epoch [19/60], Batch [60/447], Loss: 3.0096
Epoch [19/60], Batch [70/447], Loss: 3.0499
Epoch [19/60], Batch [80/447], Loss: 3.4902
Epoch [19/60], Batch [90/447], Loss: 2.4168
Epoch [19/60], Batch [100/447], Loss: 2.5356
Epoch [19/60], Batch [110/447], Loss: 3.2484
Epoch [19/60], Batch [120/447], Loss: 2.9249
Epoch [19/60], Batch [130/447], Loss: 2.8979
Epoch [19/60], Batch [140/447], Loss: 2.7465
Epoch [19/60], Batch [150/447], Loss: 2.8936
Epoch [19/60], Batch [160/447], Loss: 3.1922
Epoch [19/60], Batch [170/447], Loss: 2.9118
Epoch [19/60], Batch [180/447], Loss: 2.5588
Epoch [19/60], Batch [190/447], Loss: 3.0050
Epoch [19/60], Batch [200/447], Loss: 2.7499
Epoch [19/60], Batch [210/447], Loss: 2.9900
Epoch [19/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [20/60], Batch [0/447], Loss: 2.7650
Epoch [20/60], Batch [10/447], Loss: 2.7620
Epoch [20/60], Batch [20/447], Loss: 2.9104
Epoch [20/60], Batch [30/447], Loss: 3.0716
Epoch [20/60], Batch [40/447], Loss: 3.1481
Epoch [20/60], Batch [50/447], Loss: 2.7049
Epoch [20/60], Batch [60/447], Loss: 2.8921
Epoch [20/60], Batch [70/447], Loss: 2.7362
Epoch [20/60], Batch [80/447], Loss: 2.6972
Epoch [20/60], Batch [90/447], Loss: 2.9978
Epoch [20/60], Batch [100/447], Loss: 2.5211
Epoch [20/60], Batch [110/447], Loss: 2.8563
Epoch [20/60], Batch [120/447], Loss: 3.2022
Epoch [20/60], Batch [130/447], Loss: 2.6646
Epoch [20/60], Batch [140/447], Loss: 2.2087
Epoch [20/60], Batch [150/447], Loss: 2.9313
Epoch [20/60], Batch [160/447], Loss: 2.8111
Epoch [20/60], Batch [170/447], Loss: 2.8403
Epoch [20/60], Batch [180/447], Loss: 2.6791
Epoch [20/60], Batch [190/447], Loss: 3.1052
Epoch [20/60], Batch [200/447], Loss: 2.8439
Epoch [20/60], Batch [210/447], Loss: 3.1320
Epoch [20/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [21/60], Batch [0/447], Loss: 2.2317
Epoch [21/60], Batch [10/447], Loss: 2.6751
Epoch [21/60], Batch [20/447], Loss: 2.6958
Epoch [21/60], Batch [30/447], Loss: 3.1114
Epoch [21/60], Batch [40/447], Loss: 2.9457
Epoch [21/60], Batch [50/447], Loss: 2.9934
Epoch [21/60], Batch [60/447], Loss: 3.1605
Epoch [21/60], Batch [70/447], Loss: 2.5188
Epoch [21/60], Batch [80/447], Loss: 2.8938
Epoch [21/60], Batch [90/447], Loss: 3.0178
Epoch [21/60], Batch [100/447], Loss: 2.4597
Epoch [21/60], Batch [110/447], Loss: 2.5732
Epoch [21/60], Batch [120/447], Loss: 3.1842
Epoch [21/60], Batch [130/447], Loss: 2.9648
Epoch [21/60], Batch [140/447], Loss: 2.5089
Epoch [21/60], Batch [150/447], Loss: 2.8951
Epoch [21/60], Batch [160/447], Loss: 2.1172
Epoch [21/60], Batch [170/447], Loss: 2.6070
Epoch [21/60], Batch [180/447], Loss: 2.6219
Epoch [21/60], Batch [190/447], Loss: 3.3273
Epoch [21/60], Batch [200/447], Loss: 2.1704
Epoch [21/60], Batch [210/447], Loss: 3.1492
Epoch [21/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [22/60], Batch [0/447], Loss: 2.9785
Epoch [22/60], Batch [10/447], Loss: 2.4511
Epoch [22/60], Batch [20/447], Loss: 2.2225
Epoch [22/60], Batch [30/447], Loss: 3.1053
Epoch [22/60], Batch [40/447], Loss: 2.3035
Epoch [22/60], Batch [50/447], Loss: 3.1706
Epoch [22/60], Batch [60/447], Loss: 3.0873
Epoch [22/60], Batch [70/447], Loss: 2.0862
Epoch [22/60], Batch [80/447], Loss: 2.4766
Epoch [22/60], Batch [90/447], Loss: 3.0653
Epoch [22/60], Batch [100/447], Loss: 2.3953
Epoch [22/60], Batch [110/447], Loss: 2.4882
Epoch [22/60], Batch [120/447], Loss: 2.9844
Epoch [22/60], Batch [130/447], Loss: 3.2878
Epoch [22/60], Batch [140/447], Loss: 2.7895
Epoch [22/60], Batch [150/447], Loss: 2.7527
Epoch [22/60], Batch [160/447], Loss: 3.0152
Epoch [22/60], Batch [170/447], Loss: 2.8875
Epoch [22/60], Batch [180/447], Loss: 3.1718
Epoch [22/60], Batch [190/447], Loss: 2.2672
Epoch [22/60], Batch [200/447], Loss: 2.9960
Epoch [22/60], Batch [210/447], Loss: 2.5519
Epoch [22/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [23/60], Batch [0/447], Loss: 2.8838
Epoch [23/60], Batch [10/447], Loss: 2.5764
Epoch [23/60], Batch [20/447], Loss: 2.8729
Epoch [23/60], Batch [30/447], Loss: 2.6054
Epoch [23/60], Batch [40/447], Loss: 3.1802
Epoch [23/60], Batch [50/447], Loss: 2.6861
Epoch [23/60], Batch [60/447], Loss: 2.9119
Epoch [23/60], Batch [70/447], Loss: 2.8901
Epoch [23/60], Batch [80/447], Loss: 3.1305
Epoch [23/60], Batch [90/447], Loss: 2.8683
Epoch [23/60], Batch [100/447], Loss: 2.8041
Epoch [23/60], Batch [110/447], Loss: 2.6031
Epoch [23/60], Batch [120/447], Loss: 2.9279
Epoch [23/60], Batch [130/447], Loss: 2.4686
Epoch [23/60], Batch [140/447], Loss: 2.7003
Epoch [23/60], Batch [150/447], Loss: 2.8062
Epoch [23/60], Batch [160/447], Loss: 3.0032
Epoch [23/60], Batch [170/447], Loss: 3.6258
Epoch [23/60], Batch [180/447], Loss: 2.8978
Epoch [23/60], Batch [190/447], Loss: 2.6368
Epoch [23/60], Batch [200/447], Loss: 2.9248
Epoch [23/60], Batch [210/447], Loss: 2.4520
Epoch [23/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [24/60], Batch [0/447], Loss: 2.4029
Epoch [24/60], Batch [10/447], Loss: 2.5191
Epoch [24/60], Batch [20/447], Loss: 3.1546
Epoch [24/60], Batch [30/447], Loss: 2.6560
Epoch [24/60], Batch [40/447], Loss: 2.9370
Epoch [24/60], Batch [50/447], Loss: 2.6986
Epoch [24/60], Batch [60/447], Loss: 3.0273
Epoch [24/60], Batch [70/447], Loss: 2.6123
Epoch [24/60], Batch [80/447], Loss: 2.5668
Epoch [24/60], Batch [90/447], Loss: 2.7679
Epoch [24/60], Batch [100/447], Loss: 2.4235
Epoch [24/60], Batch [110/447], Loss: 2.5827
Epoch [24/60], Batch [120/447], Loss: 2.5082
Epoch [24/60], Batch [130/447], Loss: 2.7130
Epoch [24/60], Batch [140/447], Loss: 2.9059
Epoch [24/60], Batch [150/447], Loss: 2.7012
Epoch [24/60], Batch [160/447], Loss: 2.7886
Epoch [24/60], Batch [170/447], Loss: 2.4766
Epoch [24/60], Batch [180/447], Loss: 2.7945
Epoch [24/60], Batch [190/447], Loss: 1.9637
Epoch [24/60], Batch [200/447], Loss: 2.5432
Epoch [24/60], Batch [210/447], Loss: 1.9188
Epoch [24/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [25/60], Batch [0/447], Loss: 2.6971
Epoch [25/60], Batch [10/447], Loss: 2.6458
Epoch [25/60], Batch [20/447], Loss: 2.8467
Epoch [25/60], Batch [30/447], Loss: 2.3841
Epoch [25/60], Batch [40/447], Loss: 2.3580
Epoch [25/60], Batch [50/447], Loss: 2.9494
Epoch [25/60], Batch [60/447], Loss: 3.1088
Epoch [25/60], Batch [70/447], Loss: 2.4132
Epoch [25/60], Batch [80/447], Loss: 2.4504
Epoch [25/60], Batch [90/447], Loss: 2.1861
Epoch [25/60], Batch [100/447], Loss: 2.6425
Epoch [25/60], Batch [110/447], Loss: 2.3973
Epoch [25/60], Batch [120/447], Loss: 2.8633
Epoch [25/60], Batch [130/447], Loss: 2.7360
Epoch [25/60], Batch [140/447], Loss: 2.6808
Epoch [25/60], Batch [150/447], Loss: 2.0484
Epoch [25/60], Batch [160/447], Loss: 3.1160
Epoch [25/60], Batch [170/447], Loss: 3.4456
Epoch [25/60], Batch [180/447], Loss: 2.4586
Epoch [25/60], Batch [190/447], Loss: 2.9765
Epoch [25/60], Batch [200/447], Loss: 2.3864
Epoch [25/60], Batch [210/447], Loss: 2.5318
Epoch [25/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [26/60], Batch [0/447], Loss: 2.3950
Epoch [26/60], Batch [10/447], Loss: 2.2422
Epoch [26/60], Batch [20/447], Loss: 2.1352
Epoch [26/60], Batch [30/447], Loss: 2.0327
Epoch [26/60], Batch [40/447], Loss: 2.3207
Epoch [26/60], Batch [50/447], Loss: 2.9212
Epoch [26/60], Batch [60/447], Loss: 2.7608
Epoch [26/60], Batch [70/447], Loss: 2.3776
Epoch [26/60], Batch [80/447], Loss: 2.1922
Epoch [26/60], Batch [90/447], Loss: 2.8679
Epoch [26/60], Batch [100/447], Loss: 2.7284
Epoch [26/60], Batch [110/447], Loss: 2.6532
Epoch [26/60], Batch [120/447], Loss: 2.7836
Epoch [26/60], Batch [130/447], Loss: 2.5809
Epoch [26/60], Batch [140/447], Loss: 2.3190
Epoch [26/60], Batch [150/447], Loss: 2.6781
Epoch [26/60], Batch [160/447], Loss: 3.0203
Epoch [26/60], Batch [170/447], Loss: 2.5058
Epoch [26/60], Batch [180/447], Loss: 2.3632
Epoch [26/60], Batch [190/447], Loss: 3.0970
Epoch [26/60], Batch [200/447], Loss: 2.0729
Epoch [26/60], Batch [210/447], Loss: 2.8653
Epoch [26/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [27/60], Batch [0/447], Loss: 2.6916
Epoch [27/60], Batch [10/447], Loss: 2.9231
Epoch [27/60], Batch [20/447], Loss: 1.8026
Epoch [27/60], Batch [30/447], Loss: 2.2839
Epoch [27/60], Batch [40/447], Loss: 2.6656
Epoch [27/60], Batch [50/447], Loss: 3.2066
Epoch [27/60], Batch [60/447], Loss: 2.1833
Epoch [27/60], Batch [70/447], Loss: 2.0545
Epoch [27/60], Batch [80/447], Loss: 2.2887
Epoch [27/60], Batch [90/447], Loss: 3.3146
Epoch [27/60], Batch [100/447], Loss: 2.3877
Epoch [27/60], Batch [110/447], Loss: 2.4987
Epoch [27/60], Batch [120/447], Loss: 2.7991
Epoch [27/60], Batch [130/447], Loss: 2.8476
Epoch [27/60], Batch [140/447], Loss: 2.9402
Epoch [27/60], Batch [150/447], Loss: 2.2054
Epoch [27/60], Batch [160/447], Loss: 3.1283
Epoch [27/60], Batch [170/447], Loss: 2.2908
Epoch [27/60], Batch [180/447], Loss: 2.6784
Epoch [27/60], Batch [190/447], Loss: 2.7710
Epoch [27/60], Batch [200/447], Loss: 2.0731
Epoch [27/60], Batch [210/447], Loss: 3.0998
Epoch [27/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [28/60], Batch [0/447], Loss: 2.5709
Epoch [28/60], Batch [10/447], Loss: 2.4330
Epoch [28/60], Batch [20/447], Loss: 2.0648
Epoch [28/60], Batch [30/447], Loss: 2.2619
Epoch [28/60], Batch [40/447], Loss: 1.9348
Epoch [28/60], Batch [50/447], Loss: 2.7130
Epoch [28/60], Batch [60/447], Loss: 2.1975
Epoch [28/60], Batch [70/447], Loss: 2.7973
Epoch [28/60], Batch [80/447], Loss: 2.3571
Epoch [28/60], Batch [90/447], Loss: 1.9918
Epoch [28/60], Batch [100/447], Loss: 2.2872
Epoch [28/60], Batch [110/447], Loss: 2.4583
Epoch [28/60], Batch [120/447], Loss: 2.3470
Epoch [28/60], Batch [130/447], Loss: 1.8307
Epoch [28/60], Batch [140/447], Loss: 2.6839
Epoch [28/60], Batch [150/447], Loss: 2.4954
Epoch [28/60], Batch [160/447], Loss: 3.5358
Epoch [28/60], Batch [170/447], Loss: 3.0224
Epoch [28/60], Batch [180/447], Loss: 2.4770
Epoch [28/60], Batch [190/447], Loss: 2.4296
Epoch [28/60], Batch [200/447], Loss: 3.0515
Epoch [28/60], Batch [210/447], Loss: 2.5159
Epoch [28/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [29/60], Batch [0/447], Loss: 2.8397
Epoch [29/60], Batch [10/447], Loss: 2.1947
Epoch [29/60], Batch [20/447], Loss: 3.3793
Epoch [29/60], Batch [30/447], Loss: 2.5148
Epoch [29/60], Batch [40/447], Loss: 2.7567
Epoch [29/60], Batch [50/447], Loss: 3.0347
Epoch [29/60], Batch [60/447], Loss: 2.2124
Epoch [29/60], Batch [70/447], Loss: 2.8903
Epoch [29/60], Batch [80/447], Loss: 2.2447
Epoch [29/60], Batch [90/447], Loss: 2.5116
Epoch [29/60], Batch [100/447], Loss: 2.5515
Epoch [29/60], Batch [110/447], Loss: 2.8412
Epoch [29/60], Batch [120/447], Loss: 2.1985
Epoch [29/60], Batch [130/447], Loss: 2.9221
Epoch [29/60], Batch [140/447], Loss: 3.0836
Epoch [29/60], Batch [150/447], Loss: 2.3899
Epoch [29/60], Batch [160/447], Loss: 2.9223
Epoch [29/60], Batch [170/447], Loss: 2.5301
Epoch [29/60], Batch [180/447], Loss: 2.4283
Epoch [29/60], Batch [190/447], Loss: 2.1123
Epoch [29/60], Batch [200/447], Loss: 2.1797
Epoch [29/60], Batch [210/447], Loss: 2.4147
Epoch [29/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [30/60], Batch [0/447], Loss: 2.3640
Epoch [30/60], Batch [10/447], Loss: 3.0677
Epoch [30/60], Batch [20/447], Loss: 2.6822
Epoch [30/60], Batch [30/447], Loss: 1.9627
Epoch [30/60], Batch [40/447], Loss: 3.0617
Epoch [30/60], Batch [50/447], Loss: 2.3903
Epoch [30/60], Batch [60/447], Loss: 2.4284
Epoch [30/60], Batch [70/447], Loss: 3.1450
Epoch [30/60], Batch [80/447], Loss: 2.4926
Epoch [30/60], Batch [90/447], Loss: 2.6109
Epoch [30/60], Batch [100/447], Loss: 2.9631
Epoch [30/60], Batch [110/447], Loss: 2.7050
Epoch [30/60], Batch [120/447], Loss: 2.4033
Epoch [30/60], Batch [130/447], Loss: 2.3484
Epoch [30/60], Batch [140/447], Loss: 2.6127
Epoch [30/60], Batch [150/447], Loss: 2.0860
Epoch [30/60], Batch [160/447], Loss: 2.2576
Epoch [30/60], Batch [170/447], Loss: 2.7057
Epoch [30/60], Batch [180/447], Loss: 2.0810
Epoch [30/60], Batch [190/447], Loss: 2.5803
Epoch [30/60], Batch [200/447], Loss: 2.1125
Epoch [30/60], Batch [210/447], Loss: 2.6243
Epoch [30/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [31/60], Batch [0/447], Loss: 2.5413
Epoch [31/60], Batch [10/447], Loss: 2.6821
Epoch [31/60], Batch [20/447], Loss: 2.5636
Epoch [31/60], Batch [30/447], Loss: 2.3255
Epoch [31/60], Batch [40/447], Loss: 2.3626
Epoch [31/60], Batch [50/447], Loss: 1.8726
Epoch [31/60], Batch [60/447], Loss: 2.3443
Epoch [31/60], Batch [70/447], Loss: 2.7038
Epoch [31/60], Batch [80/447], Loss: 2.3548
Epoch [31/60], Batch [90/447], Loss: 2.4789
Epoch [31/60], Batch [100/447], Loss: 2.4739
Epoch [31/60], Batch [110/447], Loss: 2.6367
Epoch [31/60], Batch [120/447], Loss: 2.6664
Epoch [31/60], Batch [130/447], Loss: 2.4000
Epoch [31/60], Batch [140/447], Loss: 2.5628
Epoch [31/60], Batch [150/447], Loss: 2.6482
Epoch [31/60], Batch [160/447], Loss: 2.8451
Epoch [31/60], Batch [170/447], Loss: 1.7746
Epoch [31/60], Batch [180/447], Loss: 3.4136
Epoch [31/60], Batch [190/447], Loss: 2.7444
Epoch [31/60], Batch [200/447], Loss: 2.5311
Epoch [31/60], Batch [210/447], Loss: 1.9532
Epoch [31/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [32/60], Batch [0/447], Loss: 2.2438
Epoch [32/60], Batch [10/447], Loss: 2.7192
Epoch [32/60], Batch [20/447], Loss: 2.7704
Epoch [32/60], Batch [30/447], Loss: 2.6730
Epoch [32/60], Batch [40/447], Loss: 1.9302
Epoch [32/60], Batch [50/447], Loss: 3.3725
Epoch [32/60], Batch [60/447], Loss: 2.3652
Epoch [32/60], Batch [70/447], Loss: 2.4990
Epoch [32/60], Batch [80/447], Loss: 2.3994
Epoch [32/60], Batch [90/447], Loss: 2.2763
Epoch [32/60], Batch [100/447], Loss: 1.9687
Epoch [32/60], Batch [110/447], Loss: 2.4534
Epoch [32/60], Batch [120/447], Loss: 2.4341
Epoch [32/60], Batch [130/447], Loss: 2.6427
Epoch [32/60], Batch [140/447], Loss: 1.9465
Epoch [32/60], Batch [150/447], Loss: 1.8576
Epoch [32/60], Batch [160/447], Loss: 2.0545
Epoch [32/60], Batch [170/447], Loss: 2.8067
Epoch [32/60], Batch [180/447], Loss: 2.9986
Epoch [32/60], Batch [190/447], Loss: 2.7540
Epoch [32/60], Batch [200/447], Loss: 1.8218
Epoch [32/60], Batch [210/447], Loss: 2.5802
Epoch [32/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [33/60], Batch [0/447], Loss: 2.3707
Epoch [33/60], Batch [10/447], Loss: 1.8434
Epoch [33/60], Batch [20/447], Loss: 2.2288
Epoch [33/60], Batch [30/447], Loss: 2.9264
Epoch [33/60], Batch [40/447], Loss: 2.8051
Epoch [33/60], Batch [50/447], Loss: 2.6185
Epoch [33/60], Batch [60/447], Loss: 1.9196
Epoch [33/60], Batch [70/447], Loss: 2.7459
Epoch [33/60], Batch [80/447], Loss: 2.9215
Epoch [33/60], Batch [90/447], Loss: 2.5396
Epoch [33/60], Batch [100/447], Loss: 2.7305
Epoch [33/60], Batch [110/447], Loss: 2.0634
Epoch [33/60], Batch [120/447], Loss: 1.9698
Epoch [33/60], Batch [130/447], Loss: 3.0433
Epoch [33/60], Batch [140/447], Loss: 2.5003
Epoch [33/60], Batch [150/447], Loss: 2.1749
Epoch [33/60], Batch [160/447], Loss: 1.9934
Epoch [33/60], Batch [170/447], Loss: 2.1647
Epoch [33/60], Batch [180/447], Loss: 2.4849
Epoch [33/60], Batch [190/447], Loss: 2.6382
Epoch [33/60], Batch [200/447], Loss: 2.1957
Epoch [33/60], Batch [210/447], Loss: 2.0075
Epoch [33/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [34/60], Batch [0/447], Loss: 2.9263
Epoch [34/60], Batch [10/447], Loss: 2.3078
Epoch [34/60], Batch [20/447], Loss: 2.3486
Epoch [34/60], Batch [30/447], Loss: 2.1149
Epoch [34/60], Batch [40/447], Loss: 2.4735
Epoch [34/60], Batch [50/447], Loss: 2.7607
Epoch [34/60], Batch [60/447], Loss: 2.1478
Epoch [34/60], Batch [70/447], Loss: 2.9417
Epoch [34/60], Batch [80/447], Loss: 2.4787
Epoch [34/60], Batch [90/447], Loss: 1.8472
Epoch [34/60], Batch [100/447], Loss: 2.1841
Epoch [34/60], Batch [110/447], Loss: 2.4379
Epoch [34/60], Batch [120/447], Loss: 2.2261
Epoch [34/60], Batch [130/447], Loss: 2.9900
Epoch [34/60], Batch [140/447], Loss: 2.2781
Epoch [34/60], Batch [150/447], Loss: 2.5957
Epoch [34/60], Batch [160/447], Loss: 1.7253
Epoch [34/60], Batch [170/447], Loss: 2.5387
Epoch [34/60], Batch [180/447], Loss: 2.7745
Epoch [34/60], Batch [190/447], Loss: 2.1073
Epoch [34/60], Batch [200/447], Loss: 2.4351
Epoch [34/60], Batch [210/447], Loss: 2.9588
Epoch [34/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [35/60], Batch [0/447], Loss: 2.8535
Epoch [35/60], Batch [10/447], Loss: 2.7510
Epoch [35/60], Batch [20/447], Loss: 2.4988
Epoch [35/60], Batch [30/447], Loss: 2.5167
Epoch [35/60], Batch [40/447], Loss: 2.6791
Epoch [35/60], Batch [50/447], Loss: 3.0455
Epoch [35/60], Batch [60/447], Loss: 1.5094
Epoch [35/60], Batch [70/447], Loss: 2.8514
Epoch [35/60], Batch [80/447], Loss: 2.0918
Epoch [35/60], Batch [90/447], Loss: 2.1116
Epoch [35/60], Batch [100/447], Loss: 2.5832
Epoch [35/60], Batch [110/447], Loss: 2.8504
Epoch [35/60], Batch [120/447], Loss: 2.9243
Epoch [35/60], Batch [130/447], Loss: 2.7450
Epoch [35/60], Batch [140/447], Loss: 3.1160
Epoch [35/60], Batch [150/447], Loss: 2.0559
Epoch [35/60], Batch [160/447], Loss: 2.6735
Epoch [35/60], Batch [170/447], Loss: 2.7998
Epoch [35/60], Batch [180/447], Loss: 2.1529
Epoch [35/60], Batch [190/447], Loss: 2.1022
Epoch [35/60], Batch [200/447], Loss: 1.9039
Epoch [35/60], Batch [210/447], Loss: 2.3219
Epoch [35/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [36/60], Batch [0/447], Loss: 2.7602
Epoch [36/60], Batch [10/447], Loss: 2.7868
Epoch [36/60], Batch [20/447], Loss: 2.1871
Epoch [36/60], Batch [30/447], Loss: 1.9808
Epoch [36/60], Batch [40/447], Loss: 2.1347
Epoch [36/60], Batch [50/447], Loss: 2.9302
Epoch [36/60], Batch [60/447], Loss: 1.8115
Epoch [36/60], Batch [70/447], Loss: 2.6642
Epoch [36/60], Batch [80/447], Loss: 2.5814
Epoch [36/60], Batch [90/447], Loss: 2.3025
Epoch [36/60], Batch [100/447], Loss: 1.9230
Epoch [36/60], Batch [110/447], Loss: 2.7672
Epoch [36/60], Batch [120/447], Loss: 2.1748
Epoch [36/60], Batch [130/447], Loss: 2.4828
Epoch [36/60], Batch [140/447], Loss: 2.2793
Epoch [36/60], Batch [150/447], Loss: 2.4043
Epoch [36/60], Batch [160/447], Loss: 1.8576
Epoch [36/60], Batch [170/447], Loss: 2.3131
Epoch [36/60], Batch [180/447], Loss: 2.0979
Epoch [36/60], Batch [190/447], Loss: 2.4986
Epoch [36/60], Batch [200/447], Loss: 2.1392
Epoch [36/60], Batch [210/447], Loss: 2.0140
Epoch [36/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [37/60], Batch [0/447], Loss: 2.8383
Epoch [37/60], Batch [10/447], Loss: 2.3320
Epoch [37/60], Batch [20/447], Loss: 2.3010
Epoch [37/60], Batch [30/447], Loss: 2.9811
Epoch [37/60], Batch [40/447], Loss: 2.7677
Epoch [37/60], Batch [50/447], Loss: 1.7305
Epoch [37/60], Batch [60/447], Loss: 2.2534
Epoch [37/60], Batch [70/447], Loss: 2.6952
Epoch [37/60], Batch [80/447], Loss: 2.3687
Epoch [37/60], Batch [90/447], Loss: 2.7452
Epoch [37/60], Batch [100/447], Loss: 2.1457
Epoch [37/60], Batch [110/447], Loss: 3.3728
Epoch [37/60], Batch [120/447], Loss: 2.5621
Epoch [37/60], Batch [130/447], Loss: 2.3178
Epoch [37/60], Batch [140/447], Loss: 1.8366
Epoch [37/60], Batch [150/447], Loss: 2.3672
Epoch [37/60], Batch [160/447], Loss: 2.3065
Epoch [37/60], Batch [170/447], Loss: 2.1122
Epoch [37/60], Batch [180/447], Loss: 2.8003
Epoch [37/60], Batch [190/447], Loss: 2.5537
Epoch [37/60], Batch [200/447], Loss: 3.1070
Epoch [37/60], Batch [210/447], Loss: 2.0426
Epoch [37/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [38/60], Batch [0/447], Loss: 1.9583
Epoch [38/60], Batch [10/447], Loss: 2.3276
Epoch [38/60], Batch [20/447], Loss: 2.3750
Epoch [38/60], Batch [30/447], Loss: 2.0156
Epoch [38/60], Batch [40/447], Loss: 2.4194
Epoch [38/60], Batch [50/447], Loss: 2.3390
Epoch [38/60], Batch [60/447], Loss: 2.4179
Epoch [38/60], Batch [70/447], Loss: 2.8591
Epoch [38/60], Batch [80/447], Loss: 2.5269
Epoch [38/60], Batch [90/447], Loss: 2.1931
Epoch [38/60], Batch [100/447], Loss: 2.9840
Epoch [38/60], Batch [110/447], Loss: 2.2789
Epoch [38/60], Batch [120/447], Loss: 2.4910
Epoch [38/60], Batch [130/447], Loss: 1.7435
Epoch [38/60], Batch [140/447], Loss: 2.7209
Epoch [38/60], Batch [150/447], Loss: 2.2895
Epoch [38/60], Batch [160/447], Loss: 2.7690
Epoch [38/60], Batch [170/447], Loss: 2.3699
Epoch [38/60], Batch [180/447], Loss: 2.2602
Epoch [38/60], Batch [190/447], Loss: 2.4625
Epoch [38/60], Batch [200/447], Loss: 2.2365
Epoch [38/60], Batch [210/447], Loss: 2.2010
Epoch [38/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [39/60], Batch [0/447], Loss: 1.8986
Epoch [39/60], Batch [10/447], Loss: 3.3146
Epoch [39/60], Batch [20/447], Loss: 2.0518
Epoch [39/60], Batch [30/447], Loss: 1.9849
Epoch [39/60], Batch [40/447], Loss: 2.0104
Epoch [39/60], Batch [50/447], Loss: 1.5783
Epoch [39/60], Batch [60/447], Loss: 2.5053
Epoch [39/60], Batch [70/447], Loss: 2.5084
Epoch [39/60], Batch [80/447], Loss: 2.6275
Epoch [39/60], Batch [90/447], Loss: 1.9438
Epoch [39/60], Batch [100/447], Loss: 2.3303
Epoch [39/60], Batch [110/447], Loss: 2.7371
Epoch [39/60], Batch [120/447], Loss: 1.8339
Epoch [39/60], Batch [130/447], Loss: 1.3324
Epoch [39/60], Batch [140/447], Loss: 2.8331
Epoch [39/60], Batch [150/447], Loss: 2.8060
Epoch [39/60], Batch [160/447], Loss: 2.3549
Epoch [39/60], Batch [170/447], Loss: 2.5631
Epoch [39/60], Batch [180/447], Loss: 2.4417
Epoch [39/60], Batch [190/447], Loss: 2.8807
Epoch [39/60], Batch [200/447], Loss: 2.2540
Epoch [39/60], Batch [210/447], Loss: 2.6246
Epoch [39/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [40/60], Batch [0/447], Loss: 3.1552
Epoch [40/60], Batch [10/447], Loss: 2.7887
Epoch [40/60], Batch [20/447], Loss: 1.5407
Epoch [40/60], Batch [30/447], Loss: 1.8586
Epoch [40/60], Batch [40/447], Loss: 2.5511
Epoch [40/60], Batch [50/447], Loss: 1.4189
Epoch [40/60], Batch [60/447], Loss: 1.5531
Epoch [40/60], Batch [70/447], Loss: 2.4414
Epoch [40/60], Batch [80/447], Loss: 1.9790
Epoch [40/60], Batch [90/447], Loss: 2.7048
Epoch [40/60], Batch [100/447], Loss: 3.0790
Epoch [40/60], Batch [110/447], Loss: 2.4991
Epoch [40/60], Batch [120/447], Loss: 1.8829
Epoch [40/60], Batch [130/447], Loss: 2.4711
Epoch [40/60], Batch [140/447], Loss: 2.7867
Epoch [40/60], Batch [150/447], Loss: 2.3576
Epoch [40/60], Batch [160/447], Loss: 2.1335
Epoch [40/60], Batch [170/447], Loss: 2.5886
Epoch [40/60], Batch [180/447], Loss: 2.5647
Epoch [40/60], Batch [190/447], Loss: 2.3214
Epoch [40/60], Batch [200/447], Loss: 2.1120
Epoch [40/60], Batch [210/447], Loss: 2.4384
Epoch [40/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [41/60], Batch [0/447], Loss: 2.4741
Epoch [41/60], Batch [10/447], Loss: 3.0472
Epoch [41/60], Batch [20/447], Loss: 1.5903
Epoch [41/60], Batch [30/447], Loss: 2.7726
Epoch [41/60], Batch [40/447], Loss: 2.0683
Epoch [41/60], Batch [50/447], Loss: 2.6075
Epoch [41/60], Batch [60/447], Loss: 2.4037
Epoch [41/60], Batch [70/447], Loss: 2.3656
Epoch [41/60], Batch [80/447], Loss: 2.6275
Epoch [41/60], Batch [90/447], Loss: 2.4375
Epoch [41/60], Batch [100/447], Loss: 2.6894
Epoch [41/60], Batch [110/447], Loss: 2.8832
Epoch [41/60], Batch [120/447], Loss: 2.0720
Epoch [41/60], Batch [130/447], Loss: 2.8497
Epoch [41/60], Batch [140/447], Loss: 2.4770
Epoch [41/60], Batch [150/447], Loss: 3.0212
Epoch [41/60], Batch [160/447], Loss: 1.8610
Epoch [41/60], Batch [170/447], Loss: 2.7562
Epoch [41/60], Batch [180/447], Loss: 3.4931
Epoch [41/60], Batch [190/447], Loss: 2.5585
Epoch [41/60], Batch [200/447], Loss: 1.9126
Epoch [41/60], Batch [210/447], Loss: 2.5439
Epoch [41/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [42/60], Batch [0/447], Loss: 2.0632
Epoch [42/60], Batch [10/447], Loss: 2.1631
Epoch [42/60], Batch [20/447], Loss: 1.9509
Epoch [42/60], Batch [30/447], Loss: 2.3173
Epoch [42/60], Batch [40/447], Loss: 2.1262
Epoch [42/60], Batch [50/447], Loss: 2.1510
Epoch [42/60], Batch [60/447], Loss: 2.4205
Epoch [42/60], Batch [70/447], Loss: 2.5394
Epoch [42/60], Batch [80/447], Loss: 2.0513
Epoch [42/60], Batch [90/447], Loss: 1.8675
Epoch [42/60], Batch [100/447], Loss: 2.8118
Epoch [42/60], Batch [110/447], Loss: 1.2757
Epoch [42/60], Batch [120/447], Loss: 3.0715
Epoch [42/60], Batch [130/447], Loss: 1.0738
Epoch [42/60], Batch [140/447], Loss: 2.7007
Epoch [42/60], Batch [150/447], Loss: 1.9652
Epoch [42/60], Batch [160/447], Loss: 2.3408
Epoch [42/60], Batch [170/447], Loss: 2.7874
Epoch [42/60], Batch [180/447], Loss: 2.4562
Epoch [42/60], Batch [190/447], Loss: 2.5375
Epoch [42/60], Batch [200/447], Loss: 1.6992
Epoch [42/60], Batch [210/447], Loss: 2.6786
Epoch [42/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [43/60], Batch [0/447], Loss: 2.5076
Epoch [43/60], Batch [10/447], Loss: 2.7814
Epoch [43/60], Batch [20/447], Loss: 1.8300
Epoch [43/60], Batch [30/447], Loss: 2.1150
Epoch [43/60], Batch [40/447], Loss: 2.2820
Epoch [43/60], Batch [50/447], Loss: 2.6824
Epoch [43/60], Batch [60/447], Loss: 2.8992
Epoch [43/60], Batch [70/447], Loss: 2.6701
Epoch [43/60], Batch [80/447], Loss: 2.0709
Epoch [43/60], Batch [90/447], Loss: 2.9015
Epoch [43/60], Batch [100/447], Loss: 2.8679
Epoch [43/60], Batch [110/447], Loss: 2.5924
Epoch [43/60], Batch [120/447], Loss: 1.8157
Epoch [43/60], Batch [130/447], Loss: 1.8847
Epoch [43/60], Batch [140/447], Loss: 1.9235
Epoch [43/60], Batch [150/447], Loss: 2.6031
Epoch [43/60], Batch [160/447], Loss: 2.4674
Epoch [43/60], Batch [170/447], Loss: 2.4223
Epoch [43/60], Batch [180/447], Loss: 2.4088
Epoch [43/60], Batch [190/447], Loss: 2.4216
Epoch [43/60], Batch [200/447], Loss: 2.1561
Epoch [43/60], Batch [210/447], Loss: 2.3263
Epoch [43/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [44/60], Batch [0/447], Loss: 2.3754
Epoch [44/60], Batch [10/447], Loss: 2.2534
Epoch [44/60], Batch [20/447], Loss: 2.3533
Epoch [44/60], Batch [30/447], Loss: 2.6340
Epoch [44/60], Batch [40/447], Loss: 3.6024
Epoch [44/60], Batch [50/447], Loss: 2.0394
Epoch [44/60], Batch [60/447], Loss: 2.3846
Epoch [44/60], Batch [70/447], Loss: 2.2492
Epoch [44/60], Batch [80/447], Loss: 2.6214
Epoch [44/60], Batch [90/447], Loss: 2.6114
Epoch [44/60], Batch [100/447], Loss: 2.4028
Epoch [44/60], Batch [110/447], Loss: 1.4650
Epoch [44/60], Batch [120/447], Loss: 2.1738
Epoch [44/60], Batch [130/447], Loss: 2.1625
Epoch [44/60], Batch [140/447], Loss: 1.7619
Epoch [44/60], Batch [150/447], Loss: 2.0676
Epoch [44/60], Batch [160/447], Loss: 2.3592
Epoch [44/60], Batch [170/447], Loss: 2.4964
Epoch [44/60], Batch [180/447], Loss: 1.9692
Epoch [44/60], Batch [190/447], Loss: 2.2973
Epoch [44/60], Batch [200/447], Loss: 2.5507
Epoch [44/60], Batch [210/447], Loss: 2.1773
Epoch [44/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [45/60], Batch [0/447], Loss: 1.9557
Epoch [45/60], Batch [10/447], Loss: 2.5439
Epoch [45/60], Batch [20/447], Loss: 1.4301
Epoch [45/60], Batch [30/447], Loss: 2.0707
Epoch [45/60], Batch [40/447], Loss: 2.1346
Epoch [45/60], Batch [50/447], Loss: 2.6887
Epoch [45/60], Batch [60/447], Loss: 1.9288
Epoch [45/60], Batch [70/447], Loss: 2.2872
Epoch [45/60], Batch [80/447], Loss: 2.3664
Epoch [45/60], Batch [90/447], Loss: 2.4723
Epoch [45/60], Batch [100/447], Loss: 2.5093
Epoch [45/60], Batch [110/447], Loss: 2.3574
Epoch [45/60], Batch [120/447], Loss: 2.4714
Epoch [45/60], Batch [130/447], Loss: 2.7006
Epoch [45/60], Batch [140/447], Loss: 2.4455
Epoch [45/60], Batch [150/447], Loss: 2.8111
Epoch [45/60], Batch [160/447], Loss: 2.0077
Epoch [45/60], Batch [170/447], Loss: 1.9531
Epoch [45/60], Batch [180/447], Loss: 2.0234
Epoch [45/60], Batch [190/447], Loss: 2.2411
Epoch [45/60], Batch [200/447], Loss: 2.1880
Epoch [45/60], Batch [210/447], Loss: 2.2052
Epoch [45/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [46/60], Batch [0/447], Loss: 2.0693
Epoch [46/60], Batch [10/447], Loss: 3.0997
Epoch [46/60], Batch [20/447], Loss: 2.0694
Epoch [46/60], Batch [30/447], Loss: 2.6428
Epoch [46/60], Batch [40/447], Loss: 2.4145
Epoch [46/60], Batch [50/447], Loss: 2.8504
Epoch [46/60], Batch [60/447], Loss: 1.8830
Epoch [46/60], Batch [70/447], Loss: 1.7131
Epoch [46/60], Batch [80/447], Loss: 2.1118
Epoch [46/60], Batch [90/447], Loss: 2.8259
Epoch [46/60], Batch [100/447], Loss: 1.9400
Epoch [46/60], Batch [110/447], Loss: 2.0781
Epoch [46/60], Batch [120/447], Loss: 2.6608
Epoch [46/60], Batch [130/447], Loss: 1.5054
Epoch [46/60], Batch [140/447], Loss: 2.4186
Epoch [46/60], Batch [150/447], Loss: 2.3860
Epoch [46/60], Batch [160/447], Loss: 2.1186
Epoch [46/60], Batch [170/447], Loss: 2.4409
Epoch [46/60], Batch [180/447], Loss: 2.4917
Epoch [46/60], Batch [190/447], Loss: 2.4508
Epoch [46/60], Batch [200/447], Loss: 2.2051
Epoch [46/60], Batch [210/447], Loss: 2.8792
Epoch [46/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [47/60], Batch [0/447], Loss: 2.6898
Epoch [47/60], Batch [10/447], Loss: 2.1880
Epoch [47/60], Batch [20/447], Loss: 2.6744
Epoch [47/60], Batch [30/447], Loss: 1.8943
Epoch [47/60], Batch [40/447], Loss: 2.5334
Epoch [47/60], Batch [50/447], Loss: 2.2716
Epoch [47/60], Batch [60/447], Loss: 1.2876
Epoch [47/60], Batch [70/447], Loss: 1.8509
Epoch [47/60], Batch [80/447], Loss: 2.1788
Epoch [47/60], Batch [90/447], Loss: 2.1214
Epoch [47/60], Batch [100/447], Loss: 2.4998
Epoch [47/60], Batch [110/447], Loss: 2.8009
Epoch [47/60], Batch [120/447], Loss: 1.7694
Epoch [47/60], Batch [130/447], Loss: 2.3405
Epoch [47/60], Batch [140/447], Loss: 3.3313
Epoch [47/60], Batch [150/447], Loss: 1.2865
Epoch [47/60], Batch [160/447], Loss: 2.4129
Epoch [47/60], Batch [170/447], Loss: 2.7087
Epoch [47/60], Batch [180/447], Loss: 2.0438
Epoch [47/60], Batch [190/447], Loss: 2.2692
Epoch [47/60], Batch [200/447], Loss: 2.4990
Epoch [47/60], Batch [210/447], Loss: 1.6407
Epoch [47/60], Batch 

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [48/60], Batch [0/447], Loss: 2.0704
Epoch [48/60], Batch [10/447], Loss: 2.7534
Epoch [48/60], Batch [20/447], Loss: 2.4179
Epoch [48/60], Batch [30/447], Loss: 2.1455
Epoch [48/60], Batch [40/447], Loss: 2.3169
Epoch [48/60], Batch [50/447], Loss: 2.1292
Epoch [48/60], Batch [60/447], Loss: 2.5296
Epoch [48/60], Batch [70/447], Loss: 2.1276
Epoch [48/60], Batch [80/447], Loss: 1.8507
Epoch [48/60], Batch [90/447], Loss: 2.4864
Epoch [48/60], Batch [100/447], Loss: 1.8329
Epoch [48/60], Batch [110/447], Loss: 2.4774
Epoch [48/60], Batch [120/447], Loss: 1.9631
Epoch [48/60], Batch [130/447], Loss: 3.3926
Epoch [48/60], Batch [140/447], Loss: 2.1734
Epoch [48/60], Batch [150/447], Loss: 2.1118
Epoch [48/60], Batch [160/447], Loss: 2.2371
Epoch [48/60], Batch [170/447], Loss: 2.2338
Epoch [48/60], Batch [180/447], Loss: 2.2670
Epoch [48/60], Batch [190/447], Loss: 2.6985
Epoch [48/60], Batch [200/447], Loss: 1.7652
Epoch [48/60], Batch [210/447], Loss: 2.0147
Epoch [48/60], Batch 

[I 2024-12-13 14:34:44,833] Trial 6 pruned. 


Epoch [48/60], Validation Accuracy: 0.7150, Validation Loss: 1.0329
No improvement in validation accuracy for 5 epoch(s).
Early stopping at epoch 48.
Trial early stopped due to lack of improvement.
Starting a new trial...
Trial 7: alpha = 0.6750277604651747
Building the model...


2024-12-13 14:34:45,159 - mmaction - INFO - load model from: https://download.openmmlab.com/mmaction/recognition/csn/ircsn_from_scratch_r50_ig65m_20210617-ce545a37.pth
2024-12-13 14:34:45,160 - mmaction - INFO - load checkpoint from http path: https://download.openmmlab.com/mmaction/recognition/csn/ircsn_from_scratch_r50_ig65m_20210617-ce545a37.pth


Model built successfully!
Starting training...


  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [1/60], Batch [0/447], Loss: 3.9903
Epoch [1/60], Batch [10/447], Loss: 4.0229
Epoch [1/60], Batch [20/447], Loss: 4.0205
Epoch [1/60], Batch [30/447], Loss: 3.9753
Epoch [1/60], Batch [40/447], Loss: 3.9957
Epoch [1/60], Batch [50/447], Loss: 3.9691
Epoch [1/60], Batch [60/447], Loss: 3.9674
Epoch [1/60], Batch [70/447], Loss: 4.0265
Epoch [1/60], Batch [80/447], Loss: 3.9887
Epoch [1/60], Batch [90/447], Loss: 3.9656
Epoch [1/60], Batch [100/447], Loss: 3.9852
Epoch [1/60], Batch [110/447], Loss: 3.9691
Epoch [1/60], Batch [120/447], Loss: 3.9775
Epoch [1/60], Batch [130/447], Loss: 4.0289
Epoch [1/60], Batch [140/447], Loss: 3.9911
Epoch [1/60], Batch [150/447], Loss: 3.9799
Epoch [1/60], Batch [160/447], Loss: 3.9730
Epoch [1/60], Batch [170/447], Loss: 3.9660
Epoch [1/60], Batch [180/447], Loss: 3.9680
Epoch [1/60], Batch [190/447], Loss: 3.9803
Epoch [1/60], Batch [200/447], Loss: 3.9498
Epoch [1/60], Batch [210/447], Loss: 4.0229
Epoch [1/60], Batch [220/447], Loss: 3.8964

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [2/60], Batch [0/447], Loss: 3.8166
Epoch [2/60], Batch [10/447], Loss: 3.9342
Epoch [2/60], Batch [20/447], Loss: 3.8536
Epoch [2/60], Batch [30/447], Loss: 3.8796
Epoch [2/60], Batch [40/447], Loss: 3.9817
Epoch [2/60], Batch [50/447], Loss: 3.8228
Epoch [2/60], Batch [60/447], Loss: 3.9401
Epoch [2/60], Batch [70/447], Loss: 3.8045
Epoch [2/60], Batch [80/447], Loss: 3.6844
Epoch [2/60], Batch [90/447], Loss: 3.8013
Epoch [2/60], Batch [100/447], Loss: 3.8125
Epoch [2/60], Batch [110/447], Loss: 3.7774
Epoch [2/60], Batch [120/447], Loss: 3.8703
Epoch [2/60], Batch [130/447], Loss: 3.9529
Epoch [2/60], Batch [140/447], Loss: 3.9243
Epoch [2/60], Batch [150/447], Loss: 3.7520
Epoch [2/60], Batch [160/447], Loss: 3.9852
Epoch [2/60], Batch [170/447], Loss: 3.8874
Epoch [2/60], Batch [180/447], Loss: 3.9056
Epoch [2/60], Batch [190/447], Loss: 3.8803
Epoch [2/60], Batch [200/447], Loss: 3.8008
Epoch [2/60], Batch [210/447], Loss: 3.5910
Epoch [2/60], Batch [220/447], Loss: 3.6794

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [3/60], Batch [0/447], Loss: 3.5200
Epoch [3/60], Batch [10/447], Loss: 3.6587
Epoch [3/60], Batch [20/447], Loss: 3.8143
Epoch [3/60], Batch [30/447], Loss: 3.9237
Epoch [3/60], Batch [40/447], Loss: 3.8080
Epoch [3/60], Batch [50/447], Loss: 3.6224
Epoch [3/60], Batch [60/447], Loss: 3.8545
Epoch [3/60], Batch [70/447], Loss: 3.8929
Epoch [3/60], Batch [80/447], Loss: 3.6797
Epoch [3/60], Batch [90/447], Loss: 3.6377
Epoch [3/60], Batch [100/447], Loss: 3.5250
Epoch [3/60], Batch [110/447], Loss: 3.6878
Epoch [3/60], Batch [120/447], Loss: 3.9605
Epoch [3/60], Batch [130/447], Loss: 3.5984
Epoch [3/60], Batch [140/447], Loss: 3.6918
Epoch [3/60], Batch [150/447], Loss: 3.7463
Epoch [3/60], Batch [160/447], Loss: 3.7508
Epoch [3/60], Batch [170/447], Loss: 3.8494
Epoch [3/60], Batch [180/447], Loss: 3.5996
Epoch [3/60], Batch [190/447], Loss: 3.5298
Epoch [3/60], Batch [200/447], Loss: 3.5914
Epoch [3/60], Batch [210/447], Loss: 3.7648
Epoch [3/60], Batch [220/447], Loss: 3.7932

  bbx1 = torch.clamp(cx - cut_w // 2, 0, w)
  bby1 = torch.clamp(cy - cut_h // 2, 0, h)
  bbx2 = torch.clamp(cx + cut_w // 2, 0, w)
  bby2 = torch.clamp(cy + cut_h // 2, 0, h)


Epoch [4/60], Batch [0/447], Loss: 3.6099
Epoch [4/60], Batch [10/447], Loss: 3.5379
Epoch [4/60], Batch [20/447], Loss: 3.5813
Epoch [4/60], Batch [30/447], Loss: 3.6037
Epoch [4/60], Batch [40/447], Loss: 3.7958
Epoch [4/60], Batch [50/447], Loss: 3.8730
Epoch [4/60], Batch [60/447], Loss: 3.8491
Epoch [4/60], Batch [70/447], Loss: 3.5983
Epoch [4/60], Batch [80/447], Loss: 3.6245
Epoch [4/60], Batch [90/447], Loss: 3.6914
Epoch [4/60], Batch [100/447], Loss: 3.7384
Epoch [4/60], Batch [110/447], Loss: 3.8332
Epoch [4/60], Batch [120/447], Loss: 3.7592
Epoch [4/60], Batch [130/447], Loss: 3.6376
Epoch [4/60], Batch [140/447], Loss: 3.7105
Epoch [4/60], Batch [150/447], Loss: 3.6235
Epoch [4/60], Batch [160/447], Loss: 3.5160
Epoch [4/60], Batch [170/447], Loss: 3.7314
Epoch [4/60], Batch [180/447], Loss: 3.4608
Epoch [4/60], Batch [190/447], Loss: 3.4440
Epoch [4/60], Batch [200/447], Loss: 3.6412
Epoch [4/60], Batch [210/447], Loss: 3.6969
Epoch [4/60], Batch [220/447], Loss: 3.6859

[W 2024-12-13 14:43:42,968] Trial 7 failed with parameters: {'alpha': 0.6750277604651747} because of the following error: KeyboardInterrupt().
Traceback (most recent call last):
  File "/home/sadat/miniconda3/envs/scrambmix/lib/python3.8/site-packages/optuna/study/_optimize.py", line 197, in _run_trial
    value_or_values = func(trial)
  File "/tmp/ipykernel_102155/3443986128.py", line 110, in objective
    optimizer.step()
  File "/home/sadat/miniconda3/envs/scrambmix/lib/python3.8/site-packages/torch/optim/optimizer.py", line 88, in wrapper
    return func(*args, **kwargs)
  File "/home/sadat/miniconda3/envs/scrambmix/lib/python3.8/site-packages/torch/autograd/grad_mode.py", line 27, in decorate_context
    return func(*args, **kwargs)
  File "/home/sadat/miniconda3/envs/scrambmix/lib/python3.8/site-packages/torch/optim/adam.py", line 141, in step
    F.adam(params_with_grad,
  File "/home/sadat/miniconda3/envs/scrambmix/lib/python3.8/site-packages/torch/optim/_functional.py", line 9

KeyboardInterrupt: 

## Results

In [8]:
# Retrieve all trials and print their parameters
for trial in study.trials:
    print(f"Trial number: {trial.number}")
    print(f"Parameters: {trial.params}")
    print(f"Value (e.g., validation accuracy): {trial.value}")
    print("-" * 30)

Trial number: 0
Parameters: {'alpha': 3.807947176588889}
Value (e.g., validation accuracy): None
------------------------------
Trial number: 1
Parameters: {'alpha': 3.807947176588889}
Value (e.g., validation accuracy): 0.7065359477124183
------------------------------
Trial number: 2
Parameters: {'alpha': 9.51207163345817}
Value (e.g., validation accuracy): 0.7287581699346405
------------------------------
Trial number: 3
Parameters: {'alpha': 7.34674002393291}
Value (e.g., validation accuracy): 0.7261437908496732
------------------------------
Trial number: 4
Parameters: {'alpha': 6.026718993550662}
Value (e.g., validation accuracy): 0.726797385620915
------------------------------
Trial number: 5
Parameters: {'alpha': 1.6445845403801216}
Value (e.g., validation accuracy): 0.7091503267973857
------------------------------
Trial number: 6
Parameters: {'alpha': 1.6443457513284063}
Value (e.g., validation accuracy): 0.7150326797385621
------------------------------
Trial number: 7
Param

In [9]:
best_trial = study.best_trial
print("Best trial number:", best_trial.number)
print("Best parameters:", best_trial.params)
print("Best validation loss:", best_trial.value)

ValueError: Record does not exist.