In [None]:
%load_ext autoreload
%autoreload 2

In [None]:
!nvidia-smi

In [None]:
import os
# Expose only the GPU with index 3 to CUDA for this kernel.
# NOTE(review): this presumably has to run before any CUDA-backed library is
# initialised for it to take effect - keep this cell at the top of the notebook.
os.environ['CUDA_VISIBLE_DEVICES'] = "3"

## Create DATASET

### 1 - Split train test

In [None]:
import json 

In [None]:
# Root folder of the image data; the trailing slash matters because the paths
# below are built by plain string concatenation.
data_path = '/root/data/aquabyte-images/'
# Sub-folder of data_path that holds the COCO annotation files.
coco_file_dir = 'cocofiles'
# A COCO file is selected only if its file name contains every one of these substrings.
targets = ['full', 'clear', 'lateral']

In [None]:
# Select the COCO annotation files whose name contains every keyword in `targets`.
# The listing is sorted because os.listdir() returns entries in arbitrary order
# and the first loaded file (`datas[0]`) is read later on, so the order has to be
# reproducible from one run to the next.
coco_dir = os.path.join(data_path, coco_file_dir)
target_coco_files = [
    file_name for file_name in sorted(os.listdir(coco_dir))
    if all(target in file_name for target in targets)
]

# Load every selected file.
#   datas     : parsed COCO dictionaries, in the same order as target_coco_files
#   size_dict : number of annotations in a file -> full path of that file
size_dict = {}
datas = []
for coco_file in target_coco_files:
    coco_path = os.path.join(coco_dir, coco_file)
    with open(coco_path) as f:
        coco_dict = json.load(f)
    datas.append(coco_dict)
    size = len(coco_dict['annotations'])
    if size in size_dict:
        # size_dict is keyed by annotation count, so two files with the same
        # count cannot both be stored: make the overwrite visible instead of
        # silently dropping a file from the train/test split.
        print('WARNING: {} and {} both contain {} annotations; only the latter is kept in size_dict'
              .format(size_dict[size], coco_path, size))
    size_dict[size] = coco_path

In [None]:
# Inspect the mapping: number of annotations -> path of the COCO file.
size_dict

In [None]:
# Category definitions are read from the first loaded COCO file only
# (raises IndexError if no file matched the targets).
# NOTE(review): presumably every selected file declares the same categories - confirm.
categories_dict = datas[0]['categories']

In [None]:
# Files with fewer than 600 annotations form the test split, all others the train split.
all_sizes = size_dict.keys()
test_coco_sizes = [size for size in all_sizes if size < 600]

# Share of the annotations (not of the files) that ends up in the test split.
test_fraction = float(sum(test_coco_sizes)) / sum(all_sizes)
print('Split is {}'.format(test_fraction))

train_coco_sizes = list(set(all_sizes) - set(test_coco_sizes))
test_coco_files = [size_dict[size] for size in test_coco_sizes]
train_coco_files = [size_dict[size] for size in train_coco_sizes]

### 2 - Datasets

In [None]:
import os
import sys
import random
import math
import re
import time
import numpy as np
import cv2
import matplotlib
import matplotlib.pyplot as plt
import keras

sys.path.insert(0, '../libraries')
from mrcnn.config import Config
import mrcnn.utils as utils
import mrcnn.model as modellib
import mrcnn.visualize as visualize
from mrcnn.model import log
import mcoco.coco as coco
# import mextra.utils as extra_utils
from PIL import ImageFile
ImageFile.LOAD_TRUNCATED_IMAGES = True

%matplotlib inline
%config IPCompleter.greedy=True
# Parent folder of the "weights" and "logs" sub-folders defined below.
BASE_DIR = '/root/data/models/erko/mask_rcnn_instance_segmentation'
# NOTE(review): DATA_DIR is not referenced anywhere else in the visible notebook - confirm it is still needed.
DATA_DIR = '/root/data/erko/'
WEIGHTS_DIR = os.path.join(BASE_DIR, "weights")
# Passed as `model_dir` whenever a MaskRCNN model is built in this notebook.
MODEL_DIR = os.path.join(BASE_DIR, "logs")

# Local path to trained weights file
COCO_MODEL_PATH = os.path.join(WEIGHTS_DIR, "mask_rcnn_coco.h5")
# Download COCO trained weights from Releases if needed
# (only when no file exists at COCO_MODEL_PATH yet).
if not os.path.exists(COCO_MODEL_PATH):
    utils.download_trained_weights(COCO_MODEL_PATH)

In [None]:
def get_ax(rows=1, cols=1, size=8):
    """Create the Matplotlib axes used by the visualizations in this notebook.

    Building every figure through this helper gives one single place
    where the size of the rendered images can be tuned.

    Args:
        rows: number of subplot rows.
        cols: number of subplot columns.
        size: size of one subplot cell; the figure is ``size * cols``
            wide and ``size * rows`` tall.

    Returns:
        The axes object returned by ``plt.subplots`` for the requested grid.
    """
    figure_size = (size * cols, size * rows)
    axes = plt.subplots(rows, cols, figsize=figure_size)[1]
    return axes

In [None]:
# Training set: merge every COCO file assigned to the train split into one dataset.
# NOTE(review): class_ids=[0] presumably restricts loading to category id 0 - confirm in mcoco.coco.
dataset_train = coco.CocoDataset()
for train_file in train_coco_files:
    dataset_train.load_coco(train_file, class_ids=[0])
dataset_train.prepare()

train_image_count = dataset_train.num_images
print("Number of train images: {}".format(train_image_count))

In [None]:
# Validation set: merge every COCO file assigned to the test split into one dataset.
# NOTE(review): class_ids=[0] presumably restricts loading to category id 0 - confirm in mcoco.coco.
dataset_validate = coco.CocoDataset()
for coco_file in test_coco_files:
    dataset_validate.load_coco(coco_file, class_ids=[0])
dataset_validate.prepare()
# The label used to read "train images", which mislabelled the validation count.
print("Number of validation images: {}".format(dataset_validate.num_images))

In [None]:
# Load and display random samples# Load  
image_ids = np.random.choice(dataset_train.image_ids, 4)
for image_id in image_ids:
    image = dataset_train.load_image(image_id)
    mask, class_ids = dataset_train.load_mask(image_id)
    visualize.display_top_masks(image, mask, class_ids, dataset_train.class_names)

## Configuration

In [None]:
# Side length used for both the minimum and the maximum image dimension.
image_size = 512
# Anchor scales are expressed as multiples of 1/16th of the image side.
rpn_anchor_template = (1, 2, 4, 8, 16)
anchor_unit = image_size // 16
rpn_anchor_scales = tuple(anchor_unit * multiple for multiple in rpn_anchor_template)

class FishConfig(Config):
    """Configuration for training Mask R-CNN on the fish segmentation dataset.

    Only the attributes listed here are overridden; every other setting
    keeps the value defined by the base ``Config`` class.
    """
    # name your experiments here
    NAME = "clear_full_lateral"

    # Train on 1 GPU with 1 image per GPU.
    # NOTE(review): the effective batch size is presumably
    # GPU_COUNT * IMAGES_PER_GPU = 1 - confirm in the base Config.
    GPU_COUNT = 1
    IMAGES_PER_GPU = 1

    # Number of classes (including background)
    NUM_CLASSES = 1 + 1  # background + 1 object class

    # Use smaller images for faster training. 
    IMAGE_MAX_DIM = image_size
    IMAGE_MIN_DIM = image_size
    
    # Anchor scales derived from the image size (see rpn_anchor_scales).
    RPN_ANCHOR_SCALES = rpn_anchor_scales

    # NOTE(review): presumably the number of ROIs per image fed to the
    # detection heads during training - confirm in the base Config.
    TRAIN_ROIS_PER_IMAGE = 32

    STEPS_PER_EPOCH = 1000

    VALIDATION_STEPS = 300
    
# Instantiate the configuration and show its values.
config = FishConfig()
config.display()

## Model

In [None]:
# Build the Mask R-CNN model in training mode; MODEL_DIR is handed over as the model directory.
model = modellib.MaskRCNN(mode="training", config=config, model_dir=MODEL_DIR)

In [None]:
# Which weights to start from: "imagenet", "coco" or "last".
# This assignment was commented out, which made the cell fail with a NameError
# on a fresh kernel.
inititalize_weights_with = "coco"

if inititalize_weights_with == "imagenet":
    model.load_weights(model.get_imagenet_weights(), by_name=True)

elif inititalize_weights_with == "coco":
    # The layers listed in `exclude` are not loaded from the COCO checkpoint.
    # NOTE(review): presumably because their shapes depend on NUM_CLASSES - confirm.
    model.load_weights(COCO_MODEL_PATH, by_name=True,
                       exclude=["mrcnn_class_logits", "mrcnn_bbox_fc",
                                "mrcnn_bbox", "mrcnn_mask"])

elif inititalize_weights_with == "last":
    # Load the last model you trained and continue training
    model.load_weights(model.find_last()[1], by_name=True)

else:
    # An unknown value used to fall through silently, leaving the model without
    # any loaded weights.
    raise ValueError(
        'inititalize_weights_with must be "imagenet", "coco" or "last", got {!r}'
        .format(inititalize_weights_with))

## Training

In [None]:
# add more callbacks here if necessary
callbacks = [
    keras.callbacks.TensorBoard(log_dir=model.log_dir,
                                histogram_freq=0, write_graph=True, write_images=False),
    keras.callbacks.ModelCheckpoint(model.checkpoint_path,
                                    verbose=0, save_weights_only=True),
]

In [None]:
# Train all layers at a tenth of the configured learning rate.
fine_tune_learning_rate = config.LEARNING_RATE / 10

# NOTE(review): `epochs` is presumably the index of the last epoch to reach, so
# a resumed model only trains the remaining epochs - confirm in mrcnn.model.
model.train(
    dataset_train,
    dataset_validate,
    learning_rate=fine_tune_learning_rate,
    epochs=50,
    layers="all",
    callback_list=callbacks,
)

## Detection

### 1 - Inference config

In [None]:
# Checkpoint evaluated in the rest of this section: epoch 45 of the
# "clear_full_lateral" run started on 2018-10-03 at 12:35.
# Built from MODEL_DIR rather than repeating the absolute path, so that moving
# BASE_DIR keeps the training logs and this checkpoint path in sync.
model_path = os.path.join(MODEL_DIR,
                          'clear_full_lateral_20181003_12H35',
                          'mask_rcnn_clear_full_lateral_0045.h5')

In [None]:
class InferenceConfig(FishConfig):
    # Same settings as FishConfig, with one image on one GPU so that
    # detection can be run on a single image at a time.
    GPU_COUNT = 1
    IMAGES_PER_GPU = 1

inference_config = InferenceConfig()

# Recreate the model in inference mode
# (this rebinds `model`, replacing the training-mode model built earlier).
model = modellib.MaskRCNN(mode="inference", 
                          config=inference_config,
                          model_dir=MODEL_DIR)

# Load the checkpoint selected in `model_path`.
print("Loading weights from ", model_path)
model.load_weights(model_path, by_name=True)

### 2 - Visualisation of prediction on every image of test set

**Instructions**: Press Enter to move on to the next image. To stop, press Ctrl+C or interrupt the kernel, then press Enter.

In [None]:
try:
    # Cycle through the validation images over and over; the loop only ends
    # when the user interrupts it (KeyboardInterrupt).
    while True:
        for image_id in dataset_validate.image_ids:
            ground_truth = modellib.load_image_gt(
                dataset_validate, inference_config, image_id, use_mini_mask=False)
            original_image, image_meta, gt_class_id, gt_bbox, gt_mask = ground_truth

            # Log a summary of every ground-truth array.
            gt_labels = ("original_image", "image_meta", "gt_class_id", "gt_bbox", "gt_mask")
            for gt_label, gt_array in zip(gt_labels, ground_truth):
                log(gt_label, gt_array)

            # 1. Ground-truth instances.
            visualize.display_instances(
                original_image, gt_bbox, gt_mask, gt_class_id,
                dataset_validate.class_names, figsize=(8, 8))

            # 2. Instances predicted by the model.
            detection = model.detect([original_image], verbose=1)[0]
            visualize.display_instances(
                original_image, detection['rois'], detection['masks'], detection['class_ids'],
                dataset_validate.class_names, detection['scores'], ax=get_ax())

            # 3. Ground truth against prediction.
            visualize.display_differences(
                original_image, gt_bbox, gt_class_id, gt_mask,
                detection['rois'], detection['class_ids'], detection['scores'], detection['masks'],
                dataset_validate.class_names)

            # Wait for the user before showing the next image.
            input('Press enter to continue: ')
except KeyboardInterrupt:
    # Interrupting is the documented way to leave the loop.
    pass

### 3 - Evaluation of prediction on every image of test set

In [None]:
# Override the class descriptions of the validation set: background plus one 'salmon' class.
# NOTE(review): presumably needed so the per-class metrics are reported under the
# name 'salmon' - confirm against mextra.utils.
background_class = {'id': 0, 'name': 'BG', 'source': ''}
salmon_class = {'id': 1, 'name': 'salmon', 'source': 'coco'}
dataset_validate.class_info = [background_class, salmon_class]

#### 3.1 - mAP

In [None]:
from mextra.utils import compute_per_class_precision, compute_multiple_per_class_precision

In [None]:
# Per-class precision values over the validation set at an IoU threshold of 0.5.
predictions = compute_multiple_per_class_precision(
    model, inference_config, dataset_validate, iou_threshold=0.5)

# Report the mean of each class, then the mean over all classes pooled together.
complete_predictions = []
for class_name in predictions:
    class_precisions = predictions[class_name]
    complete_predictions.extend(class_precisions)
    class_summary = "{} ({}): {}".format(
        class_name, len(class_precisions), np.mean(class_precisions))
    print(class_summary)

print("--------")
overall_mean = np.mean(complete_predictions)
print("average: {}".format(overall_mean))

#### 3.2 - Complementary metrics

In [None]:
from mextra.utils import compute_per_class_precision
from mrcnn.utils import compute_recall, compute_precision, compute_overlaps
from tqdm import tqdm

In [None]:
# Per-image instance counts, appended to by the evaluation loop in the next cell:
# number of ground-truth masks and number of predicted masks.
d = {'nb_gt_fish':[], 'nb_pred_fish':[]}
# IoU threshold passed to the recall / precision helpers in the next cell.
iou_threshold = 0.5

In [None]:
# Per-image metrics collected over the whole validation set.
mean_mask_iou = []
mean_precision = []
mean_recall = []
# Reset the histogram lists as well, so that re-running this cell does not
# append a second copy of every count.
d['nb_gt_fish'], d['nb_pred_fish'] = [], []

for image_id in tqdm(dataset_validate.image_ids):
    image, _, gt_class_id, gt_bbox, gt_mask = modellib.load_image_gt(
        dataset_validate, inference_config, image_id, use_mini_mask=False)
    r = model.detect([image], verbose=0)[0]

    # Fill histogram dict: number of instances is the size of the last mask axis
    d['nb_gt_fish'].append(float(gt_mask.shape[-1]))
    d['nb_pred_fish'].append(float(r['masks'].shape[-1]))

    # Recall (first element of the value returned by compute_recall)
    mean_recall.append(
        compute_recall(pred_boxes=r['rois'], gt_boxes=gt_bbox, iou=iou_threshold)[0])

    # Precision
    mean_precision.append(
        compute_precision(pred_boxes=r['rois'], gt_boxes=gt_bbox, iou=iou_threshold))

    # Use the same threshold as recall / precision above; it used to be a
    # hard-coded 0.5 that would not follow a change of `iou_threshold`.
    class_precision_info = compute_per_class_precision(
        gt_bbox, gt_class_id, gt_mask,
        r["rois"], r["class_ids"], r["scores"], r["masks"],
        dataset_validate.class_info, iou_threshold)

    # Compute mask overlap: for every entry of the 'salmon' overlaps keep the
    # largest non-zero value; entries that are entirely zero are skipped.
    for overlap in list(class_precision_info['salmon']['overlaps']):
        nonzero_overlap = overlap[overlap != 0]
        if len(nonzero_overlap) > 0:
            mean_mask_iou.append(float(nonzero_overlap.max()))

In [None]:
# Average each per-image metric over the validation set, then report it.
mask_overlap_avg = sum(mean_mask_iou) / len(mean_mask_iou)
print('Mean Mask overlap: {}'.format(mask_overlap_avg))

precision_avg = sum(mean_precision) / len(mean_precision)
print('Mean precision: {}'.format(precision_avg))

recall_avg = sum(mean_recall) / len(mean_recall)
print('Mean recall: {}'.format(recall_avg))

In [None]:
# Inspect the class names currently exposed by the validation dataset.
dataset_validate.class_names