feat(dataset): 自定义微调数据集类，每次返回图像以及64个RoI坐标

zjZSTU · Mar 31, 2020 · 580b10e · 580b10e
1 parent 6d7766d
commit 580b10e
Showing 1 changed file with 114 additions and 0 deletions.
diff --git a/py/utils/data/custom_finetune_dataset.py b/py/utils/data/custom_finetune_dataset.py
@@ -0,0 +1,114 @@
+# -*- coding: utf-8 -*-
+
+"""
+@date: 2020/3/31 下午8:26
+@file: custom_finetune_dataset.py
+@author: zj
+@description: 
+"""
+
+import random
+import cv2
+import os
+import numpy as np
+from torch.utils.data import Dataset
+import torchvision.transforms as transforms
+
+import utils.util as util
+
+
+class CustomFinetuneDataset(Dataset):
+
+    def __init__(self, root_dir, transform):
+        """
+        加载所有的图像以及正负样本边界框
+        """
+        self.transform = transform
+
+        samples = util.parse_car_csv(root_dir)
+
+        jpeg_images = list()
+        annotation_dict = dict()
+        for idx in range(len(samples)):
+            sample_name = samples[idx]
+            img = cv2.imread(os.path.join(root_dir, 'JPEGImages', sample_name + ".jpg"))
+            h, w = img.shape[:2]
+            jpeg_images.append(img)
+
+            positive_annotation_path = os.path.join(root_dir, 'Annotations', sample_name + '_1.csv')
+            positive_annotations = np.loadtxt(positive_annotation_path, dtype=np.float, delimiter=' ')
+            if len(positive_annotations.shape) == 1:
+                positive_annotations = positive_annotations[np.newaxis, :]
+            # print(positive_annotations.shape)
+            positive_annotations[:, 0] /= w
+            positive_annotations[:, 1] /= h
+            positive_annotations[:, 2] /= w
+            positive_annotations[:, 3] /= h
+            # if len(positive_annotations) < 16:
+            #     print(sample_name)
+
+            negative_annotation_path = os.path.join(root_dir, 'Annotations', sample_name + '_0.csv')
+            negative_annotations = np.loadtxt(negative_annotation_path, dtype=np.float, delimiter=' ')
+            negative_annotations[:, 0] /= w
+            negative_annotations[:, 1] /= h
+            negative_annotations[:, 2] /= w
+            negative_annotations[:, 3] /= h
+
+            annotation_dict[str(idx)] = {'positive': positive_annotations, 'negative': negative_annotations}
+
+        self.jpeg_images = jpeg_images
+        self.annotation_dict = annotation_dict
+
+    def __getitem__(self, index: int):
+        """
+        采样图像index中的64个RoI，其中正样本16个，负样本48个
+        :param index:
+        :return:
+        """
+        assert index < len(self.jpeg_images), '当前数据集总数: %d，输入Index：%d' % (len(self.jpeg_images), index)
+
+        image = self.jpeg_images[index]
+        annotation_dict = data_set.annotation_dict[str(index)]
+        positive_annotations = annotation_dict['positive']
+        negative_annotations = annotation_dict['negative']
+
+        positive_num = 16
+        negative_num = 48
+        # 正样本数目有可能小于16个
+        if len(positive_annotations) < positive_num:
+            positive_num = len(positive_annotations)
+            negative_annotations = 64 - positive_num
+
+            positive_array = positive_annotations
+        else:
+            positive_array = positive_annotations[random.sample(range(positive_annotations.shape[0]), positive_num)]
+        negative_array = negative_annotations[random.sample(range(negative_annotations.shape[0]), negative_num)]
+
+        rect_array = np.vstack((positive_array, negative_array))
+        targets = np.hstack((np.ones(positive_num), np.zeros(negative_num)))
+
+        if self.transform:
+            image = self.transform(image)
+
+        return image, targets, rect_array
+
+    def __len__(self) -> int:
+        return len(self.jpeg_images)
+
+
+if __name__ == '__main__':
+    root_dir = '../../data/finetune_car/train'
+    s = 600
+    transform = transforms.Compose([
+        transforms.ToPILImage(),
+        transforms.Resize(s),
+        transforms.ToTensor(),
+        transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))
+    ])
+    data_set = CustomFinetuneDataset(root_dir, transform)
+    print(len(data_set.jpeg_images))
+
+    image, targets, rect_array = data_set.__getitem__(10)
+    print(image.shape)
+    print(targets)
+    print(rect_array.shape)