In [20]:
# 모듈 import

from mmcv import Config
from mmdet.datasets import build_dataset
from mmdet.models import build_detector
from mmdet.apis import train_detector
from mmdet.datasets import (build_dataloader, build_dataset,
                            replace_ImageToTensor)
from mmdet.utils import get_device
import wandb

In [58]:
# Class names of the trash-detection dataset, in label-id order.
classes = ("General trash", "Paper", "Paper pack", "Metal", "Glass",
           "Plastic", "Styrofoam", "Plastic bag", "Battery", "Clothing")
# Derive the head size from the class tuple so the two can never drift apart.
num_classes = len(classes)

# Load the base config file.
filename = './configs/cascade_rcnn/cascade_rcnn_r50_fpn_1x_coco.py'
cfg = Config.fromfile(filename)
# Basename of the config (e.g. 'cascade_rcnn_r50_fpn_1x_coco.py'); reused for
# the wandb run name and the work directory below.
config_name = filename.split('/')[-1]

root = '../../dataset/'

# Point the train split at the custom dataset.
cfg.data.train.classes = classes
cfg.data.train.img_prefix = root
cfg.data.train.ann_file = root + 'train.json'  # train annotation json
cfg.data.train.pipeline[2]['img_scale'] = (512, 512)  # Resize step

# Point the test split at the custom dataset.
cfg.data.test.classes = classes
cfg.data.test.img_prefix = root
cfg.data.test.ann_file = root + 'test.json'  # test annotation json
cfg.data.test.pipeline[1]['img_scale'] = (512, 512)  # test-time image scale

# Replace the logger hooks: keep the text logger and add the wandb logger.
cfg.log_config.hooks = [
    dict(type='TextLoggerHook'),
    dict(type='MMDetWandbHook',
         init_kwargs={'project': "object_detection",
                      'entity': "cv-2",
                      'name': config_name},
         interval=10,
         log_checkpoint=True,
         log_checkpoint_metadata=True,
         num_eval_images=100)]

cfg.data.samples_per_gpu = 4

cfg.seed = 2022
cfg.gpu_ids = [0]
# Derive the work dir from the config name so that switching `filename` does
# not overwrite another experiment's checkpoints. For the current config this
# evaluates to './work_dirs/cascade_rcnn_r50_fpn_1x_coco'.
cfg.work_dir = './work_dirs/' + config_name.rsplit('.', 1)[0]

# Change the number of predicted classes. Where the class count lives depends
# on the detector family, so dispatch on the selected config file.
cascade_configs = [
    './configs/cascade_rcnn/cascade_rcnn_r50_fpn_1x_coco.py',
    './configs/convnext/cascade_mask_rcnn_convnext-t_p4_w7_fpn_giou_4conv1f_fp16_ms-crop_3x_coco.py',
]
single_head_configs = [
    './configs/swin/retinanet_swin-t-p4-w7_fpn_1x_coco.py',
    './configs/detr/detr_r50_8x2_150e_coco.py',
    './configs/yolox/yolox_tiny_8x8_300e_coco.py',
    './configs/yolo/yolov3_d53_320_273e_coco.py',
]
if filename in cascade_configs:
    # Cascade heads keep one bbox head per refinement stage; update them all.
    # NOTE(review): the cascade *mask* R-CNN config presumably also carries a
    # mask head with its own num_classes, which is left untouched here as in
    # the original -- confirm before training with that config.
    for stage_head in cfg.model.roi_head.bbox_head:
        stage_head.num_classes = num_classes
elif filename in single_head_configs:
    # These detectors expose a single `bbox_head` directly on the model.
    # YOLOX previously had `feat_channels` overwritten (which changes the head
    # width, not the class count) and YOLOv3 was skipped entirely, so both
    # kept their original class count; set `num_classes` for them as well.
    cfg.model.bbox_head.num_classes = num_classes
else:
    # Default: two-stage detector with a single RoI bbox head.
    cfg.model.roi_head.bbox_head.num_classes = num_classes

# Change the number of training epochs.
cfg.runner = dict(type='EpochBasedRunner', max_epochs=10)

cfg.optimizer_config.grad_clip = dict(max_norm=35, norm_type=2)
cfg.checkpoint_config = dict(max_keep_ckpts=3, interval=1)
cfg.device = get_device()

In [59]:
# Build one dataset per configured split; only the train split is used here,
# so `datasets` is a one-element list that later cells index as datasets[0].
datasets = [build_dataset(split_cfg) for split_cfg in (cfg.data.train,)]

loading annotations into memory...
Done (t=0.09s)
creating index...
index created!


In [60]:
# Inspect the training dataset; its repr lists the image count and the
# per-class instance counts.
datasets[0]


CocoDataset Train dataset with number of images 4882, and instance counts: 
+-------------------+-------+---------------+-------+-----------------+-------+-------------+-------+--------------+-------+
| category          | count | category      | count | category        | count | category    | count | category     | count |
+-------------------+-------+---------------+-------+-----------------+-------+-------------+-------+--------------+-------+
| 0 [General trash] | 4205  | 1 [Paper]     | 6349  | 2 [Paper pack]  | 909   | 3 [Metal]   | 936   | 4 [Glass]    | 976   |
| 5 [Plastic]       | 2966  | 6 [Styrofoam] | 1267  | 7 [Plastic bag] | 5182  | 8 [Battery] | 159   | 9 [Clothing] | 461   |
+-------------------+-------+---------------+-------+-----------------+-------+-------------+-------+--------------+-------+

In [61]:
# Build the detector from the config and initialize its weights (the backbone
# is loaded from the pretrained checkpoint named in its init_cfg).
model = build_detector(cfg.model)
model.init_weights()
# Attach the dataset's class names to the model, following the convention of
# MMDetection's tools/train.py, so that they are stored alongside saved
# checkpoints and downstream tooling does not fall back to default labels.
model.CLASSES = datasets[0].CLASSES

2024-01-10 12:45:23,155 - mmcv - INFO - initialize ResNet with init_cfg {'type': 'Pretrained', 'checkpoint': 'torchvision://resnet50'}
2024-01-10 12:45:23,157 - mmcv - INFO - load model from: torchvision://resnet50
2024-01-10 12:45:23,158 - mmcv - INFO - load checkpoint from torchvision path: torchvision://resnet50

unexpected key in source state_dict: fc.weight, fc.bias

2024-01-10 12:45:23,362 - mmcv - INFO - initialize FPN with init_cfg {'type': 'Xavier', 'layer': 'Conv2d', 'distribution': 'uniform'}
2024-01-10 12:45:23,390 - mmcv - INFO - initialize RPNHead with init_cfg {'type': 'Normal', 'layer': 'Conv2d', 'std': 0.01}
2024-01-10 12:45:23,397 - mmcv - INFO - initialize Shared2FCBBoxHead with init_cfg [{'type': 'Normal', 'std': 0.01, 'override': {'name': 'fc_cls'}}, {'type': 'Normal', 'std': 0.001, 'override': {'name': 'fc_reg'}}, {'type': 'Xavier', 'distribution': 'uniform', 'override': [{'name': 'shared_fcs'}, {'name': 'cls_fcs'}, {'name': 'reg_fcs'}]}]
2024-01-10 12:45:23,499 -

In [62]:
# Train the model on the training dataset: single process (non-distributed),
# with no validation pass during training.
train_detector(
    model,
    datasets[0],
    cfg,
    validate=False,
    distributed=False,
)

2024-01-10 12:45:24,290 - mmdet - INFO - Automatic scaling of learning rate (LR) has been disabled.
2024-01-10 12:45:24,294 - mmdet - INFO - Start running, host: root@instance-5032, work_dir: /data/ephemeral/home/level2-objectdetection-cv-02/mmdetection/work_dirs/cascade_rcnn_r50_fpn_1x_coco
2024-01-10 12:45:24,296 - mmdet - INFO - Hooks will be executed in the following order:
before_run:
(VERY_HIGH   ) StepLrUpdaterHook                  
(NORMAL      ) CheckpointHook                     
(VERY_LOW    ) TextLoggerHook                     
(VERY_LOW    ) MMDetWandbHook                     
 -------------------- 
before_train_epoch:
(VERY_HIGH   ) StepLrUpdaterHook                  
(NORMAL      ) NumClassCheckHook                  
(LOW         ) IterTimerHook                      
(VERY_LOW    ) TextLoggerHook                     
(VERY_LOW    ) MMDetWandbHook                     
 -------------------- 
before_train_iter:
(VERY_HIGH   ) StepLrUpdaterHook                  
(LOW        



VBox(children=(Label(value='0.002 MB of 0.002 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

VBox(children=(Label(value='Waiting for wandb.init()...\r'), FloatProgress(value=0.011112567823794153, max=1.0…

2024-01-10 12:46:03,381 - mmdet - INFO - Epoch [1][50/1221]	lr: 1.978e-03, eta: 1:05:58, time: 0.326, data_time: 0.052, memory: 4716, loss_rpn_cls: 0.3896, loss_rpn_bbox: 0.0457, s0.loss_cls: 0.6917, s0.acc: 87.6133, s0.loss_bbox: 0.1012, s1.loss_cls: 0.2878, s1.acc: 89.0273, s1.loss_bbox: 0.0287, s2.loss_cls: 0.1564, s2.acc: 84.4961, s2.loss_bbox: 0.0036, loss: 1.7047, grad_norm: 9.0202
2024-01-10 12:46:17,526 - mmdet - INFO - Epoch [1][100/1221]	lr: 3.976e-03, eta: 1:01:24, time: 0.283, data_time: 0.007, memory: 4716, loss_rpn_cls: 0.1253, loss_rpn_bbox: 0.0322, s0.loss_cls: 0.3287, s0.acc: 93.2861, s0.loss_bbox: 0.1632, s1.loss_cls: 0.0886, s1.acc: 97.1221, s1.loss_bbox: 0.0476, s2.loss_cls: 0.0252, s2.acc: 98.5859, s2.loss_bbox: 0.0071, loss: 0.8179, grad_norm: 2.5197
2024-01-10 12:46:31,662 - mmdet - INFO - Epoch [1][150/1221]	lr: 5.974e-03, eta: 0:59:42, time: 0.283, data_time: 0.007, memory: 4716, loss_rpn_cls: 0.1473, loss_rpn_bbox: 0.0420, s0.loss_cls: 0.3740, s0.acc: 92.4219,

VBox(children=(Label(value='4749.957 MB of 5273.164 MB uploaded\r'), FloatProgress(value=0.9007793549402214, m…

0,1
learning_rate,▃▅██████████████████████████████▁▁▁▁▁▁▁▁
momentum,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
train/grad_norm,▄▇▃▄▇▁▄▂▁▆▁▂▄▄▅▂▂▂▂▄▆▂▃▃▄▂▇█▄▃▄▃▄▂▄▃▂▂▂▃
train/loss,▅▅▄▅█▄▄▅▄▆▃▄▄▄▄▃▃▅▄▄▄▄▄▃▄▂▄▄▄▂▃▂▂▂▃▂▂▂▁▂
train/loss_rpn_bbox,▄▄▆▃█▃▃▆▂▇▂▃▃▄▃▃▂▅▃▃▄▂▃▂▃▂▂▃▅▂▃▃▁▁▂▂▃▁▁▁
train/loss_rpn_cls,▆▅▅▃█▃▃▆▃▆▂▄▃▃▃▃▃▄▃▂▃▂▃▂▃▂▃▃▃▂▃▂▁▁▂▁▁▁▁▁
train/s0.acc,▅▅▆▃▁▅▅▄▅▂▅▅▅▄▅▆▆▃▄▄▄▅▅▆▅▇▅▄▅▇▆▆▆▇▆▆▇▇█▇
train/s0.loss_bbox,█▅▃▅█▄▃▄▃▆▂▃▃▃▃▃▂▅▄▃▄▃▃▂▄▁▃▃▃▂▂▂▂▂▃▂▂▁▁▂
train/s0.loss_cls,▆▅▄▆█▄▅▆▄▆▃▄▄▄▄▃▃▅▄▄▅▄▄▃▄▂▄▅▄▂▃▂▃▂▃▂▂▂▁▂
train/s1.acc,█▅▆▃▁▄▄▄▄▂▄▄▅▄▄▅▅▃▄▄▃▅▅▆▅▆▅▃▄▆▅▆▅▇▅▆▇▇█▇

0,1
learning_rate,0.002
momentum,0.9
train/grad_norm,1.84223
train/loss,0.35801
train/loss_rpn_bbox,0.00949
train/loss_rpn_cls,0.01624
train/s0.acc,96.25977
train/s0.loss_bbox,0.0586
train/s0.loss_cls,0.11848
train/s1.acc,96.79741


10 10 10
