## Helmet Detection With COCO {with.pt} and Without CBAM


### Importing the Modules


In [1]:
from ultralytics import YOLO
import torch


In [2]:
import torch

print("Torch version:", torch.__version__)
print("CUDA available:", torch.cuda.is_available())

if torch.cuda.is_available():
    print("CUDA version:", torch.version.cuda)
    print("GPU count:", torch.cuda.device_count())
    print("Current device:", torch.cuda.current_device())
    print("GPU name:", torch.cuda.get_device_name(0))
    print("Total VRAM (GB):",
          torch.cuda.get_device_properties(0).total_memory / 1024**3)

    # Simple tensor test on GPU
    x = torch.randn(1000, 1000).cuda()
    y = torch.matmul(x, x)
    print("✅ GPU computation successful")
else:
    print("❌ CUDA NOT working, using CPU")


Torch version: 2.9.1+cu130
CUDA available: True
CUDA version: 13.0
GPU count: 1
Current device: 0
GPU name: NVIDIA GeForce RTX 4060 Laptop GPU
Total VRAM (GB): 7.99560546875
✅ GPU computation successful


In [3]:

# Dataset YAML
data_yaml = r"E:/Helmet-Detection/Helmet-Detection/dataset/data.yaml"

# Load YOLOv8 Nano
model = YOLO("yolov8n.pt")

model.train(
    data=data_yaml,
    epochs=100,
    imgsz=640,          # optimal for accuracy
    batch=16,           # max safe batch for 8GB VRAM
    device=0,
    workers=0,          # notebook safe
    amp=True,           # uses Tensor Cores
    cache=False,        # avoids RAM spikes
    cos_lr=True,
    close_mosaic=10,
    patience=20,
    plots=True,
    name="helmet_yolov8n_coco"
)


New https://pypi.org/project/ultralytics/8.3.239 available  Update with 'pip install -U ultralytics'
Ultralytics 8.3.235  Python-3.12.0 torch-2.9.1+cu130 CUDA:0 (NVIDIA GeForce RTX 4060 Laptop GPU, 8188MiB)
[34m[1mengine\trainer: [0magnostic_nms=False, amp=True, augment=False, auto_augment=randaugment, batch=16, bgr=0.0, box=7.5, cache=False, cfg=None, classes=None, close_mosaic=10, cls=0.5, compile=False, conf=None, copy_paste=0.0, copy_paste_mode=flip, cos_lr=True, cutmix=0.0, data=E:/Helmet-Detection/Helmet-Detection/dataset/data.yaml, degrees=0.0, deterministic=True, device=0, dfl=1.5, dnn=False, dropout=0.0, dynamic=False, embed=None, epochs=100, erasing=0.4, exist_ok=False, fliplr=0.5, flipud=0.0, format=torchscript, fraction=1.0, freeze=None, half=False, hsv_h=0.015, hsv_s=0.7, hsv_v=0.4, imgsz=640, int8=False, iou=0.7, keras=False, kobj=1.0, line_width=None, lr0=0.01, lrf=0.01, mask_ratio=4, max_det=300, mixup=0.0, mode=train, model=yolov8n.pt, momentum=0.937, mosaic=1.0, mu

  attn = (q.transpose(-2, -1) @ k) * self.scale
  x = (v @ attn.transpose(-2, -1)).view(B, C, H, W) + self.pe(v.reshape(B, C, H, W))


[34m[1mAMP: [0mchecks passed 
[34m[1mtrain: [0mFast image access  (ping: 0.00.0 ms, read: 1948.8697.3 MB/s, size: 262.3 KB)
[K[34m[1mtrain: [0mScanning E:\Helmet-Detection\Helmet-Detection\dataset\labels\train.cache... 4000 images, 0 backgrounds, 0 corrupt: 100% ━━━━━━━━━━━━ 4000/4000  0.0s
[34m[1mval: [0mFast image access  (ping: 0.00.0 ms, read: 2237.8530.2 MB/s, size: 265.2 KB)
[K[34m[1mval: [0mScanning E:\Helmet-Detection\Helmet-Detection\dataset\labels\val.cache... 1000 images, 0 backgrounds, 0 corrupt: 100% ━━━━━━━━━━━━ 1000/1000  0.0s
Plotting labels to E:\Helmet-Detection\Helmet-Detection\runs\detect\helmet_yolov8n_coco3\labels.jpg... 
[34m[1moptimizer:[0m 'optimizer=auto' found, ignoring 'lr0=0.01' and 'momentum=0.937' and determining best 'optimizer', 'lr0' and 'momentum' automatically... 
[34m[1moptimizer:[0m AdamW(lr=0.001667, momentum=0.9) with parameter groups 57 weight(decay=0.0), 64 weight(decay=0.0005), 63 bias(decay=0.0)
Image sizes 640 train, 6

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K      1/100       2.1G      1.504      1.712       1.18        146        640: 100% ━━━━━━━━━━━━ 250/250 3.4it/s 1:13<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.4s0.3s
                   all       1000       5087      0.801      0.707      0.787       0.45

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K      2/100      3.05G      1.517      1.244      1.186        148        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K      2/100      3.05G      1.443      1.132      1.158        106        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.835      0.745      0.818      0.476

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K      3/100      3.07G      1.403      1.002      1.157        121        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K      3/100      3.07G      1.455      1.066      1.171        104        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:10<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.856      0.732       0.82      0.488

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K      4/100      3.07G      1.377      1.015      1.195         70        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K      4/100      3.07G      1.409     0.9704      1.157         74        640: 100% ━━━━━━━━━━━━ 250/250 3.3it/s 1:16<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.3s0.3s
                   all       1000       5087      0.876      0.765      0.863      0.499

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K      5/100      3.07G      1.361     0.9202      1.147        103        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K      5/100      3.07G      1.405     0.9374      1.154        167        640: 100% ━━━━━━━━━━━━ 250/250 2.9it/s 1:26<0.6ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 1.1it/s 29.0s0.9ss
                   all       1000       5087      0.883      0.795      0.876      0.527

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K      6/100      3.09G      1.372     0.9976       1.12         57        640: 0% ──────────── 0/250  0.6s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K      6/100      3.09G       1.38     0.8921      1.145        110        640: 100% ━━━━━━━━━━━━ 250/250 1.6it/s 2:38<0.6s
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.0s0.3s
                   all       1000       5087      0.889      0.812      0.884      0.544

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K      7/100      3.09G        1.1     0.8243      1.115         66        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K      7/100      3.09G      1.374     0.8634       1.14         98        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:10<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.1s0.3s
                   all       1000       5087      0.886      0.801       0.88      0.537

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K      8/100      3.09G      1.311     0.9562      1.113         87        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K      8/100      3.09G      1.372      0.843      1.138         93        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.4s0.3s
                   all       1000       5087      0.902      0.821      0.895      0.535

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K      9/100      3.09G      1.434      1.039      1.168        129        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K      9/100      3.09G      1.342     0.8302       1.13        122        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:10<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.889      0.811      0.885      0.549

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     10/100      3.09G      1.244     0.8769      1.124        119        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     10/100      3.09G      1.342     0.8162      1.125         93        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.897      0.807      0.887      0.564

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     11/100      3.09G      1.417     0.8299      1.053        173        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     11/100      3.09G      1.334     0.8017      1.121        106        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:09<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.5s0.3s
                   all       1000       5087      0.882       0.82      0.892      0.554

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     12/100      3.09G      1.352     0.9078      1.097        119        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     12/100      3.09G       1.33     0.7994      1.123         98        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:12<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.3s0.3s
                   all       1000       5087      0.886      0.822      0.891      0.561

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     13/100      3.09G      1.129     0.6384     0.9957         82        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     13/100      3.09G       1.32     0.7731      1.119        114        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:12<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.3s0.3s
                   all       1000       5087        0.9      0.836       0.91      0.564

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     14/100       3.1G      1.348      0.782      1.151         78        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     14/100       3.1G      1.317     0.7692      1.119         93        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:12<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.907       0.83       0.91      0.565

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     15/100      3.11G      1.376     0.8948      1.162        102        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     15/100      3.12G      1.308     0.7694      1.117        122        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.1s0.3s
                   all       1000       5087      0.921       0.84      0.919      0.583

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     16/100      3.12G      1.407     0.8299      1.169         75        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     16/100      3.12G      1.302     0.7483      1.108        104        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:10<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.909      0.846       0.92      0.585

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     17/100      3.12G      1.157     0.6273      1.053        121        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     17/100      3.12G      1.294     0.7558      1.109         81        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.916      0.838      0.914      0.582

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     18/100      3.12G      1.357      1.021       1.25         48        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     18/100      3.12G      1.311      0.749      1.114        167        640: 100% ━━━━━━━━━━━━ 250/250 3.4it/s 1:13<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.6it/s 9.0s0.3s
                   all       1000       5087      0.912       0.86      0.922      0.587

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     19/100      3.12G      1.265     0.7518      1.071        110        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     19/100      3.12G      1.284      0.735      1.103        148        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.906      0.836      0.911      0.578

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     20/100      3.12G      1.239     0.6696      1.041         78        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     20/100      3.12G       1.29     0.7318      1.106        155        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:12<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.3it/s 9.6s0.3s
                   all       1000       5087      0.908      0.855      0.922      0.591

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     21/100      3.12G      1.227     0.6584      1.047        122        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     21/100      3.12G      1.283     0.7211      1.098        134        640: 100% ━━━━━━━━━━━━ 250/250 3.4it/s 1:13<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.3it/s 9.7s0.3s
                   all       1000       5087      0.904      0.851      0.915      0.588

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     22/100      3.12G      1.207     0.7741      1.115         61        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     22/100      3.12G      1.276     0.7201      1.099        103        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.917      0.857      0.926      0.598

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     23/100      3.12G      1.367     0.7092      1.151        101        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     23/100      3.12G       1.27     0.7092      1.094        129        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:10<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.926      0.853      0.926        0.6

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     24/100      3.12G       1.22     0.7325      1.071        160        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     24/100      3.12G      1.283     0.7138        1.1        109        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:10<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.927      0.851      0.926      0.576

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     25/100      3.12G      1.167     0.6424      1.055        122        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     25/100      3.12G      1.266     0.7011      1.097         84        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:10<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.4s0.3s
                   all       1000       5087      0.914      0.855      0.924       0.59

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     26/100      3.12G      1.348     0.7439      1.076        105        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     26/100      3.12G      1.259     0.6965      1.089         85        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.0s0.3s
                   all       1000       5087      0.919      0.854      0.925      0.592

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     27/100      3.12G      1.271     0.6652      1.126         85        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     27/100      3.12G      1.266     0.6994      1.093        118        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:10<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.1s0.3s
                   all       1000       5087      0.909      0.867      0.927      0.598

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     28/100      3.12G      1.353      0.706      1.158         83        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     28/100      3.12G      1.264     0.6875       1.09        113        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:10<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.6it/s 9.0s0.3s
                   all       1000       5087      0.912       0.87       0.93      0.601

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     29/100      3.12G      1.294     0.6496      1.064        144        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     29/100      3.12G      1.248     0.6814       1.08        155        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:10<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.4s0.3s
                   all       1000       5087      0.914      0.877      0.932      0.598

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     30/100      3.12G      1.279     0.6559      1.083        125        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     30/100      3.12G       1.26     0.6815      1.086        107        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.5s0.3s
                   all       1000       5087       0.92      0.856      0.927      0.598

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     31/100      3.12G      1.075     0.6284      1.134         83        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     31/100      3.12G      1.257     0.6752      1.084        113        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:12<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.3s0.3s
                   all       1000       5087      0.932      0.848      0.929      0.603

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     32/100      3.12G      1.384     0.6987      1.139         97        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     32/100      3.12G      1.233     0.6611      1.078         68        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:12<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.3s0.3s
                   all       1000       5087      0.921      0.861      0.928      0.602

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     33/100      3.12G      1.255     0.6776      1.109        107        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     33/100      3.12G      1.235     0.6601      1.081         85        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:10<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.0s0.3s
                   all       1000       5087      0.915      0.866       0.93      0.595

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     34/100      3.14G       1.45     0.7428      1.127        143        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     34/100      3.14G      1.233     0.6604      1.084         92        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:09<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.6it/s 8.8s0.3s
                   all       1000       5087      0.935      0.866      0.934      0.609

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     35/100      3.14G       1.21     0.6294      1.052        121        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     35/100      3.14G      1.241     0.6555      1.082        111        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:10<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.3s0.3s
                   all       1000       5087      0.922      0.868      0.934      0.605

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     36/100      3.14G       1.16     0.5298       1.06        104        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     36/100      3.14G      1.226     0.6451      1.074         98        640: 100% ━━━━━━━━━━━━ 250/250 3.4it/s 1:14<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.927      0.873      0.932      0.608

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     37/100      3.14G      1.185     0.5901      1.058         96        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     37/100      3.14G      1.223     0.6482      1.073        101        640: 100% ━━━━━━━━━━━━ 250/250 3.4it/s 1:13<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087       0.92      0.876      0.935      0.608

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     38/100      3.14G      1.346     0.6909      1.134        105        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     38/100      3.14G      1.227     0.6482      1.074        111        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:12<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.3s0.3s
                   all       1000       5087      0.914      0.874      0.932       0.61

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     39/100      3.14G      1.067     0.6558     0.9932        155        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     39/100      3.14G      1.223     0.6455      1.072        141        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:10<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.1s0.3s
                   all       1000       5087      0.931      0.864      0.934      0.607

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     40/100      3.14G      1.213     0.6031      1.059        112        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     40/100      3.14G      1.209     0.6307      1.067         81        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:10<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.3s0.3s
                   all       1000       5087      0.925      0.873      0.936      0.614

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     41/100      3.14G      1.282     0.6109      1.035        116        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     41/100      3.14G      1.213     0.6374      1.071        141        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.1s0.3s
                   all       1000       5087      0.922      0.868      0.931      0.612

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     42/100      3.14G      1.061     0.5699     0.9833        113        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     42/100      3.14G      1.205     0.6287      1.064         86        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.925      0.873      0.933      0.612

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     43/100      3.14G      1.202     0.6013      1.085        101        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     43/100      3.14G      1.216     0.6263      1.069        130        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.929      0.874      0.936      0.614

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     44/100      3.14G      1.231     0.6348       1.09        135        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     44/100      3.14G      1.204     0.6201      1.067        103        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.3s0.3s
                   all       1000       5087      0.923      0.872      0.933      0.609

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     45/100      3.14G      1.132     0.6087      1.017         97        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     45/100      3.14G      1.197     0.6203      1.062         98        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:12<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.4s0.3s
                   all       1000       5087      0.922      0.874      0.933      0.612

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     46/100      3.14G       1.22     0.6076      1.036        150        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     46/100      3.14G      1.195      0.614      1.059         91        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:12<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.4s0.3s
                   all       1000       5087      0.928      0.871      0.935      0.617

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     47/100      3.14G      1.403     0.6686      1.054        119        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     47/100      3.14G      1.193     0.6144      1.061        109        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.927      0.879      0.935      0.616

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     48/100      3.14G      1.195      0.694      1.092        136        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     48/100      3.14G      1.192     0.6074      1.063         96        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.1s0.3s
                   all       1000       5087      0.924      0.882      0.937      0.616

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     49/100      3.14G      1.203     0.6307      1.029         91        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     49/100      3.14G      1.194     0.6058      1.059        105        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.928      0.878      0.933      0.618

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     50/100      3.14G      1.137     0.6388      1.083         87        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     50/100      3.14G       1.19      0.603      1.065        133        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:10<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.1s0.3s
                   all       1000       5087      0.927      0.879      0.939      0.619

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     51/100      3.14G      1.046     0.5248      1.041        115        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     51/100      3.14G      1.176     0.5913      1.055        111        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:12<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.4s0.3s
                   all       1000       5087      0.927       0.87      0.936      0.618

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     52/100      3.14G      1.138     0.6276       1.01        129        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     52/100      3.14G      1.178     0.5954      1.053         99        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.929      0.875      0.939      0.617

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     53/100      3.14G      1.183     0.5413     0.9966        123        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     53/100      3.14G      1.173     0.5892      1.051        105        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.4s0.3s
                   all       1000       5087      0.928      0.881       0.94      0.616

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     54/100      3.14G      1.152     0.6008      1.019         95        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     54/100      3.14G      1.179      0.592      1.054        110        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.1s0.3s
                   all       1000       5087      0.928      0.881      0.943      0.617

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     55/100      3.14G      1.282     0.6471      1.125        112        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     55/100      3.14G      1.172     0.5873      1.053        125        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.1s0.3s
                   all       1000       5087      0.918      0.883      0.938       0.62

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     56/100      3.14G      1.082     0.5498      1.061        111        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     56/100      3.14G       1.16     0.5772      1.049         71        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.4s0.3s
                   all       1000       5087       0.93      0.881      0.938       0.62

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     57/100      3.14G      1.141     0.5075      1.058        140        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     57/100      3.14G      1.173     0.5835      1.051         72        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:12<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.1s0.3s
                   all       1000       5087      0.924      0.878      0.939      0.625

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     58/100      3.14G      1.154     0.5326      1.016        162        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     58/100      3.14G      1.163     0.5802      1.048         80        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.4it/s 9.4s0.3s
                   all       1000       5087       0.92      0.881      0.939      0.623

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     59/100      3.14G      1.116     0.5653      1.058        119        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     59/100      3.14G      1.154       0.57      1.042         82        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.6it/s 9.0s0.3s
                   all       1000       5087      0.928      0.881       0.94      0.625

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     60/100      3.14G      1.201     0.5948      1.026        105        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     60/100      3.14G      1.157     0.5736      1.044        104        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:11<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.0s0.3s
                   all       1000       5087      0.927      0.882      0.941      0.625

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     61/100      3.14G      1.144     0.6651      1.051        137        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     61/100      3.14G      1.149     0.5656      1.041         77        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:10<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.6it/s 9.0s0.3s
                   all       1000       5087      0.927      0.882      0.942      0.626

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     62/100      3.14G      1.056       0.51      1.044        128        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     62/100      3.14G      1.146     0.5645      1.036        103        640: 100% ━━━━━━━━━━━━ 250/250 3.5it/s 1:10<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.927       0.88      0.938      0.623

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     63/100      3.14G      1.003     0.4899     0.9965         85        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     63/100      3.14G      1.147     0.5619      1.038        125        640: 100% ━━━━━━━━━━━━ 250/250 3.1it/s 1:21<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.929      0.881      0.942      0.628

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     64/100      3.14G      1.062     0.5069      1.006         98        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     64/100      3.14G      1.143     0.5597      1.037        112        640: 100% ━━━━━━━━━━━━ 250/250 3.6it/s 1:09<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.6it/s 8.9s0.3s
                   all       1000       5087      0.915      0.893      0.943      0.624

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     65/100      3.14G      1.247     0.6521      1.089        104        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     65/100      3.14G      1.139     0.5552      1.037        124        640: 100% ━━━━━━━━━━━━ 250/250 2.7it/s 1:32<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.2it/s 14.4s0.4s
                   all       1000       5087      0.933      0.881       0.94      0.626

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     66/100      3.14G      1.149     0.5761       1.06         80        640: 0% ──────────── 0/250  0.5s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     66/100      3.14G      1.139     0.5553      1.033        177        640: 100% ━━━━━━━━━━━━ 250/250 2.3it/s 1:49<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.2it/s 14.8s0.5s
                   all       1000       5087      0.924      0.891      0.942      0.628

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     67/100      3.14G      1.253      0.624     0.9903        158        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     67/100      3.14G      1.123      0.545       1.03        189        640: 100% ━━━━━━━━━━━━ 250/250 2.3it/s 1:50<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.1it/s 14.9s0.5s
                   all       1000       5087      0.932      0.881      0.943      0.627

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     68/100      3.14G      1.142     0.5283      1.023        131        640: 0% ──────────── 0/250  0.5s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     68/100      3.14G      1.123     0.5474      1.027        162        640: 100% ━━━━━━━━━━━━ 250/250 2.3it/s 1:46<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.3it/s 13.7s0.5s
                   all       1000       5087      0.927      0.885      0.945      0.627

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     69/100      3.14G      1.078     0.4946      1.039         50        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     69/100      3.14G      1.122     0.5432      1.027        147        640: 100% ━━━━━━━━━━━━ 250/250 2.4it/s 1:45<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.3it/s 13.7s0.4s
                   all       1000       5087      0.925      0.883      0.942      0.627

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     70/100      3.14G      1.201     0.5704      1.011        127        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     70/100      3.14G      1.128     0.5432      1.031        120        640: 100% ━━━━━━━━━━━━ 250/250 2.4it/s 1:45<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.6s0.4s
                   all       1000       5087      0.927      0.882      0.942      0.627

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     71/100      3.14G      1.236      0.584      1.079        124        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     71/100      3.14G      1.115     0.5355      1.026        101        640: 100% ━━━━━━━━━━━━ 250/250 2.4it/s 1:46<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.6s0.4s
                   all       1000       5087      0.916      0.892       0.94      0.629

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     72/100      3.14G      1.044     0.4692      0.966        121        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     72/100      3.14G      1.123      0.545      1.031        106        640: 100% ━━━━━━━━━━━━ 250/250 3.3it/s 1:15<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.912      0.895      0.943      0.628

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     73/100      3.14G      1.255     0.5952      1.058        109        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     73/100      3.14G      1.116     0.5365      1.024         87        640: 100% ━━━━━━━━━━━━ 250/250 3.1it/s 1:22<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.6s0.4s
                   all       1000       5087      0.918      0.892      0.944      0.629

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     74/100      3.14G      1.058     0.5433     0.9758        109        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     74/100      3.14G      1.106     0.5325      1.019        105        640: 100% ━━━━━━━━━━━━ 250/250 2.5it/s 1:39<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.5s0.4s
                   all       1000       5087      0.922      0.891      0.943      0.626

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     75/100      3.14G      1.147     0.5694      1.067        105        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     75/100      3.14G      1.098     0.5287      1.017        128        640: 100% ━━━━━━━━━━━━ 250/250 2.9it/s 1:26<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.6it/s 9.0s0.3s
                   all       1000       5087      0.918      0.891      0.942      0.627

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     76/100      3.14G      1.086     0.5501      1.028         97        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     76/100      3.14G      1.104      0.533      1.021         70        640: 100% ━━━━━━━━━━━━ 250/250 3.0it/s 1:25<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.2s0.3s
                   all       1000       5087      0.916      0.893      0.941      0.627

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     77/100      3.14G      1.033     0.5209      1.044         83        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     77/100      3.14G      1.106      0.528      1.021        117        640: 100% ━━━━━━━━━━━━ 250/250 3.2it/s 1:17<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.5s0.4s
                   all       1000       5087      0.924      0.884       0.94      0.626

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     78/100      3.14G      1.073     0.4806      1.015        141        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     78/100      3.14G      1.102     0.5251      1.019         84        640: 100% ━━━━━━━━━━━━ 250/250 2.4it/s 1:43<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.3it/s 13.6s0.4s
                   all       1000       5087      0.924      0.891      0.942      0.628

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     79/100      3.14G      1.101     0.5065     0.9879        122        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     79/100      3.14G      1.094     0.5224       1.02        108        640: 100% ━━━━━━━━━━━━ 250/250 2.4it/s 1:43<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.4s0.4s
                   all       1000       5087      0.925      0.886      0.943      0.627

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     80/100      3.14G     0.9915     0.4949     0.9779        103        640: 0% ──────────── 0/250  0.5s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     80/100      3.14G      1.099     0.5222      1.019         95        640: 100% ━━━━━━━━━━━━ 250/250 2.4it/s 1:44<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.5it/s 12.8s0.4s
                   all       1000       5087      0.921      0.896      0.942      0.627

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     81/100      3.14G      1.004     0.4773      1.068         73        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     81/100      3.14G      1.101     0.5218       1.02        133        640: 100% ━━━━━━━━━━━━ 250/250 2.4it/s 1:43<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.1s0.4s
                   all       1000       5087      0.926      0.889      0.943      0.628

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     82/100      3.14G      1.129     0.5254      1.005        137        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     82/100      3.14G      1.089     0.5196      1.014        103        640: 100% ━━━━━━━━━━━━ 250/250 2.4it/s 1:43<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.5s0.4s
                   all       1000       5087      0.926      0.889      0.944      0.628

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     83/100      3.14G     0.9927     0.4919     0.9737        131        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     83/100      3.14G      1.084     0.5152      1.017         99        640: 100% ━━━━━━━━━━━━ 250/250 2.5it/s 1:40<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.5s0.4s
                   all       1000       5087       0.92      0.893      0.943      0.629

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     84/100      3.14G      1.145     0.5169      1.071        113        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     84/100      3.14G      1.088     0.5188      1.015         89        640: 100% ━━━━━━━━━━━━ 250/250 2.4it/s 1:43<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.5s0.4s
                   all       1000       5087      0.923       0.89      0.942      0.627

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     85/100      3.14G      1.098     0.5519      1.004        112        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     85/100      3.14G      1.096      0.522      1.017         83        640: 100% ━━━━━━━━━━━━ 250/250 2.4it/s 1:44<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.6s0.4s
                   all       1000       5087      0.923       0.89      0.942      0.629

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     86/100      3.14G      1.081     0.5563      1.038         84        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     86/100      3.14G       1.08     0.5096      1.008        131        640: 100% ━━━━━━━━━━━━ 250/250 2.4it/s 1:43<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.6s0.4s
                   all       1000       5087      0.928      0.889      0.942      0.629

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     87/100      3.14G     0.9753     0.5001     0.9922        118        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     87/100      3.14G      1.077     0.5118       1.01        105        640: 100% ━━━━━━━━━━━━ 250/250 2.4it/s 1:44<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.3it/s 13.6s0.4s
                   all       1000       5087      0.916      0.896      0.941      0.628

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     88/100      3.14G      1.008     0.4991      1.025         83        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     88/100      3.14G      1.078     0.5085      1.013        109        640: 100% ━━━━━━━━━━━━ 250/250 2.6it/s 1:35<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.8it/s 11.6s0.5s
                   all       1000       5087      0.927      0.886      0.941      0.629

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     89/100      3.14G      1.134     0.5221      1.033        114        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     89/100      3.14G      1.084     0.5116      1.017        159        640: 100% ━━━━━━━━━━━━ 250/250 2.5it/s 1:42<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.4s0.4s
                   all       1000       5087      0.923       0.89      0.941      0.628

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     90/100      3.14G      1.153     0.5346      0.999         99        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     90/100      3.14G      1.081     0.5121       1.01        154        640: 100% ━━━━━━━━━━━━ 250/250 2.4it/s 1:43<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.5s0.4s
                   all       1000       5087      0.923      0.891      0.941      0.628
Closing dataloader mosaic

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     91/100      3.14G      1.053     0.5486      1.042         71        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     91/100      3.14G      1.071      0.462      1.018         58        640: 100% ━━━━━━━━━━━━ 250/250 3.7it/s 1:08<0.2ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.6it/s 9.0s0.3s
                   all       1000       5087      0.923      0.886      0.938      0.622

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     92/100      3.14G      1.023     0.4375      1.007         70        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     92/100      3.14G      1.062     0.4514      1.013         54        640: 100% ━━━━━━━━━━━━ 250/250 3.3it/s 1:16<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 3.5it/s 9.0s0.3s
                   all       1000       5087      0.922      0.885      0.939      0.625

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     93/100      3.14G       1.16     0.4737     0.9993         86        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     93/100      3.14G      1.063     0.4483      1.015         71        640: 100% ━━━━━━━━━━━━ 250/250 3.8it/s 1:05<0.3ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.8it/s 11.6s0.4s
                   all       1000       5087      0.924      0.884      0.941      0.625

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     94/100      3.14G      1.081     0.4268     0.9607         79        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     94/100      3.14G      1.063     0.4484      1.014         98        640: 100% ━━━━━━━━━━━━ 250/250 2.6it/s 1:36<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.3it/s 13.8s0.4s
                   all       1000       5087      0.925      0.886       0.94      0.626

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     95/100      3.14G     0.9422     0.3877      0.995         71        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     95/100      3.14G      1.059     0.4477       1.01         60        640: 100% ━━━━━━━━━━━━ 250/250 2.7it/s 1:33<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.6s0.4s
                   all       1000       5087       0.92       0.89      0.941      0.626

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     96/100      3.14G      1.044     0.4462       1.05         65        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     96/100      3.14G      1.061     0.4477      1.012         83        640: 100% ━━━━━━━━━━━━ 250/250 2.6it/s 1:36<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.4s0.4s
                   all       1000       5087      0.923      0.889       0.94      0.627

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     97/100      3.14G     0.9859     0.4117     0.9916         68        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     97/100      3.14G      1.056     0.4475      1.014         64        640: 100% ━━━━━━━━━━━━ 250/250 2.6it/s 1:36<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.4s0.4s
                   all       1000       5087      0.928      0.885      0.941      0.627

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     98/100      3.14G      1.048      0.428     0.9883         78        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     98/100      3.14G      1.059     0.4473      1.011         54        640: 100% ━━━━━━━━━━━━ 250/250 2.6it/s 1:37<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.6s0.4s
                   all       1000       5087      0.931      0.881      0.941      0.628

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K     99/100      3.14G       1.08     0.4309      1.011         64        640: 0% ──────────── 0/250  0.4s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K     99/100      3.14G      1.057     0.4458      1.013         66        640: 100% ━━━━━━━━━━━━ 250/250 2.6it/s 1:36<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.4it/s 13.2s0.4s
                   all       1000       5087      0.932       0.88      0.941      0.628

      Epoch    GPU_mem   box_loss   cls_loss   dfl_loss  Instances       Size
[K    100/100      3.14G      1.065     0.4104       1.05         70        640: 0% ──────────── 0/250  0.3s

  pred_dist = pred_dist.view(b, a, 4, c // 4).softmax(3).matmul(self.proj.type(pred_dist.dtype))


[K    100/100      3.14G       1.06     0.4444      1.013         86        640: 100% ━━━━━━━━━━━━ 250/250 3.4it/s 1:14<0.4ss
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95): 100% ━━━━━━━━━━━━ 32/32 2.3it/s 13.8s0.4s
                   all       1000       5087      0.931      0.881      0.942      0.628

100 epochs completed in 2.552 hours.
Optimizer stripped from E:\Helmet-Detection\Helmet-Detection\runs\detect\helmet_yolov8n_coco3\weights\last.pt, 6.3MB
Optimizer stripped from E:\Helmet-Detection\Helmet-Detection\runs\detect\helmet_yolov8n_coco3\weights\best.pt, 6.3MB

Validating E:\Helmet-Detection\Helmet-Detection\runs\detect\helmet_yolov8n_coco3\weights\best.pt...
Ultralytics 8.3.235  Python-3.12.0 torch-2.9.1+cu130 CUDA:0 (NVIDIA GeForce RTX 4060 Laptop GPU, 8188MiB)
Model summary (fused): 72 layers, 3,006,038 parameters, 0 gradients, 8.1 GFLOPs
[K                 Class     Images  Instances      Box(P          R      mAP50  mAP50-95

ultralytics.utils.metrics.DetMetrics object with attributes:

ap_class_index: array([0, 1])
box: ultralytics.utils.metrics.Metric object
confusion_matrix: <ultralytics.utils.metrics.ConfusionMatrix object at 0x000001E4C77563C0>
curves: ['Precision-Recall(B)', 'F1-Confidence(B)', 'Precision-Confidence(B)', 'Recall-Confidence(B)']
curves_results: [[array([          0,    0.001001,    0.002002,    0.003003,    0.004004,    0.005005,    0.006006,    0.007007,    0.008008,    0.009009,     0.01001,    0.011011,    0.012012,    0.013013,    0.014014,    0.015015,    0.016016,    0.017017,    0.018018,    0.019019,     0.02002,    0.021021,    0.022022,    0.023023,
          0.024024,    0.025025,    0.026026,    0.027027,    0.028028,    0.029029,     0.03003,    0.031031,    0.032032,    0.033033,    0.034034,    0.035035,    0.036036,    0.037037,    0.038038,    0.039039,     0.04004,    0.041041,    0.042042,    0.043043,    0.044044,    0.045045,    0.046046,    0.047047,
          0.0