### The following setup draws from the Mask_RCNN repo by matterport and Deep Learning with Python by Chollet. 

https://github.com/matterport/Mask_RCNN
https://github.com/fchollet/deep-learning-with-python-notebooks

We import our packages, including maskrcnn, which needs to be installed from the github repo. 

We also set up our directories and paths before we organize our data into tensors. 

We subclass the dataset and config classes for our specific dataset

Then, we train the model and test.

TO DO:
- Try to prepare the dataset and see if Keras trains succesfully, with loss decreasing at each step.

- Try data augmentation: image rotation and flipping to increase our training set 6 fold

- Explore data aug options in load_image_gt():  

        augmentation: Optional. An imgaug (https://github.com/aleju/imgaug) augmentation.
        For example, passing imgaug.augmenters.Fliplr(0.5) flips images
        right/left 50% of the time.

- change Config attributes to see if hyperparameters like anchor sizes (size of proposed regions that objects are located in) dramatically impact model training time and performance


In [27]:
import cv2
import os
import sys
import random
import math
import numpy as np
import skimage.io as skio
import matplotlib
import matplotlib.pyplot as plt
import copy
from imgaug import augmenters as iaa
%matplotlib inline

# Import Mask RCNN
from mrcnn import utils
import mrcnn.model as modellib
from mrcnn import visualize
from mrcnn.config import Config
from mrcnn.model import log

# Root directory of the project
ROOT_DIR = os.path.abspath("/home/rave/tana-crunch/waves/deepimagery/data/raw/wv2/")

# Directory to save logs and trained model
MODEL_DIR = os.path.join(ROOT_DIR, "models")

# # Local path to trained weights file
# COCO_MODEL_PATH = os.path.join(MODEL_DIR, "mask_rcnn_coco.h5")
# # Download COCO trained weights from Releases if needed
# if not os.path.exists(COCO_MODEL_PATH):
#     utils.download_trained_weights(COCO_MODEL_PATH)

TRAIN_DIR = os.path.join(ROOT_DIR, 'train')
TEST_DIR = os.path.join(ROOT_DIR, 'test')
MODEL_DIR = os.path.join(ROOT_DIR, 'models')
# Results directory
# Save submission files here
RESULTS_DIR = os.path.join(ROOT_DIR, "results/")

os.chdir(ROOT_DIR)

In [5]:
next(os.walk(TRAIN_DIR))[1]

['ZA0808100',
 'ZA0800513',
 'ZA0964181',
 'ZA0795180',
 'ZA0484201',
 'ZA0158191',
 'ZA0486815',
 'ZA0568743',
 'ZA0568734',
 'ZA0164205',
 'ZA0800519',
 'ZA0802357',
 'ZA0492085',
 'ZA0960464',
 'ZA0798669',
 'ZA0794958',
 'ZA0804428',
 'ZA0162477',
 'ZA0806266',
 'ZA0794952',
 'ZA0804422',
 'ZA0560059',
 'ZA0798663',
 'ZA0117891',
 'ZA0118665',
 'ZA0161610',
 'ZA0809727',
 'ZA0488125',
 'ZA0120210',
 'ZA0494726',
 'ZA0165081',
 'ZA0119437',
 'ZA0495034',
 'ZA0796817',
 'ZA0489439',
 'ZA0560061',
 'ZA0159898',
 'ZA0793314',
 'ZA0567275',
 'ZA0491075',
 'ZA0159892',
 'ZA0564354',
 'ZA0794960',
 'ZA0489444',
 'ZA0121771',
 'ZA0807882',
 'ZA0115607',
 'ZA0795177',
 'ZA0804205',
 'ZA0558646',
 'ZA0488439',
 'ZA0496044',
 'ZA0158188',
 'ZA0492395',
 'ZA0485820',
 'ZA0954877',
 'ZA0488444',
 'ZA0798670',
 'ZA0493717',
 'ZA0483208',
 'ZA0557245',
 'ZA0811574',
 'ZA0159040',
 'ZA0159037',
 'ZA0953007',
 'ZA0492078',
 'ZA0483202',
 'ZA0798885',
 'ZA0562912',
 'ZA0485818',
 'ZA0161609',
 'ZA09

In [10]:
import random
import shutil
random.seed(42)

def train_test_split(train_dir, test_dir, kprop):
    """Takes a sample of folder ids and copies them to a test directory. 
    each sample folder containes an images and corresponding masks folder"""
    
    sample_list = next(os.walk(train_dir))[1]
    k = round(kprop*len(sample_list))
    test_list = random.sample(sample_list,k)
    for test_sample in test_list:
        shutil.copytree(os.path.join(train_dir,test_sample),os.path.join(test_dir,test_sample))
    train_list = list(set(next(os.walk(train_dir))[1]) - set(test_list))
    print(len(train_list))
    print(len(test_list))
    return train_list, test_list
    
train_list, test_list = train_test_split(TRAIN_DIR, TEST_DIR, .1)

715
79


In [21]:
class ImageryConfig(Config):
    """Configuration for training on worldview-2 imagery. 
    Will eventually want to make this a sub-class of a 
    larger Imagery class. Overrides values specific to WV2.
    
    Descriptive documentation for each attribute is at
    https://github.com/matterport/Mask_RCNN/blob/master/mrcnn/config.py"""
    
    def __init__(self, N):
        """Set values of computed attributes. Channel dimension is overriden, 
        replaced 3 with N as per this guideline: https://github.com/matterport/Mask_RCNN/issues/314
        THERE MAY BE OTHER CODE CHANGES TO ACCOUNT FOR 3 vs N channels. See other 
        comments."""
        # https://github.com/matterport/Mask_RCNN/wiki helpful for N channels
        # Effective batch size
        self.BATCH_SIZE = self.IMAGES_PER_GPU * self.GPU_COUNT
        
        IMAGE_RESIZE_MODE = "crop"
        # Input image size
        if self.IMAGE_RESIZE_MODE == "crop":
            self.IMAGE_SHAPE = np.array([self.IMAGE_MIN_DIM, self.IMAGE_MIN_DIM, N])
        else:
            self.IMAGE_SHAPE = np.array([self.IMAGE_MAX_DIM, self.IMAGE_MAX_DIM, N])

        # Image meta data length
        # See compose_image_meta() for details
        self.IMAGE_META_SIZE = 1 + 3 + 3 + 4 + 1 + self.NUM_CLASSES

    # Image mean (RGB)
    # filling with N values, need to compute mean of each channel
    MEAN_PIXEL = np.array([123.7, 116.8, 103.9])
    
    # Give the configuration a recognizable name
    NAME = "wv2-gridded"

    # Batch size is 4 (GPUs * images/GPU).
    # New parralel_model.py allows for multi-gpu
    GPU_COUNT = 1
    IMAGES_PER_GPU = 4

    # Number of classes (including background)
    NUM_CLASSES = 1 + 1  # background + ag

    # Use small images for faster training. Determines the image shape.
    # From build() in model.py
    # Exception("Image size must be dividable by 2 at least 6 times "
                       #     "to avoid fractions when downscaling and upscaling."
                       #    "For example, use 256, 320, 384, 448, 512, ... etc. "
    IMAGE_MIN_DIM = 256
    IMAGE_MAX_DIM = 256

    # Use smaller anchors because our image and objects are small.
    # Setting Large upper scale since some fields take up nearly 
    # whole image
    RPN_ANCHOR_SCALES = (16, 32, 64, 128, 300)  # anchor side in pixels

    # Reduce training ROIs per image because the images are small and have
    # few objects. Aim to allow ROI sampling to pick 33% positive ROIs.
    TRAIN_ROIS_PER_IMAGE = 200

    # Use a small epoch since the data is simple
    STEPS_PER_EPOCH = 1000
    
    #reduces the max number of field instances
    MAX_GT_INSTANCES = 100

    # use small validation steps since the epoch is small
    VALIDATION_STEPS = 50
    
    # Backbone network architecture
    # Supported values are: resnet50, resnet101.
    # You can also provide a callable that should have the signature
    # of model.resnet_graph. If you do so, you need to supply a callable
    # to COMPUTE_BACKBONE_SHAPE as well
    BACKBONE = "resnet50"
    

In [29]:
class ImageryDataset(utils.Dataset):
    """Generates the Imagery dataset."""
    
    def load_image(self, image_id):
        """Load the specified image and return a [H,W,8] Numpy array.
        Channels are ordered [B, G, R, NIR]. This is called by the 
        Keras data_generator function
        """
        # Load image
        image = skio.imread(self.image_info[image_id]['path'])
    
        assert image.shape[-1] == 8
        assert image.ndim == 3
    
        return image
    
    def load_wv2(self, dataset_dir, subset):
        """Load a subset of the nuclei dataset.

        dataset_dir: Root directory of the dataset
        subset: Subset to load.
                * train: stage1_train excluding validation images
                * val: validation images from VAL_IMAGE_IDS
        """
        # Add classes. We have one class.
        # Naming the dataset wv2, and the class agriculture
        self.add_class("wv2", 1, "agriculture")

        assert subset in ["train", "test"]
        dataset_dir = os.path.join(dataset_dir, subset)
        if subset == "test":
            image_ids = test_list
        else:
            image_ids = train_list
        
        # Add images
        for image_id in image_ids:
            self.add_image(
                "wv2",
                image_id=image_id,
                path=os.path.join(dataset_dir, image_id, "image/{}.tif".format(image_id+'_OSGS_ms')))
    
    def load_mask(self, image_id):
        """Generate instance masks for an image.
       Returns:
        masks: A bool array of shape [height, width, instance count] with
            one mask per instance.
        class_ids: a 1D array of class IDs of the instance masks.
        """
        info = self.image_info[image_id]
        # Get mask directory from image path
        mask_dir = os.path.join(os.path.dirname(os.path.dirname(info['path'])), "masks")

        # Read mask files from .png image
        mask = []
        for f in next(os.walk(mask_dir))[2]:
            if f.endswith(".tif"):
                m = skio.imread(os.path.join(mask_dir, f)).astype(np.bool)
                mask.append(m)
        mask = np.stack(mask, axis=-1)
        # Return mask, and array of class IDs of each instance. Since we have
        # one class ID, we return an array of ones
        return mask, np.ones([mask.shape[-1]], dtype=np.int32)
    
    def image_reference(self, image_id):
        """Return the path of the image."""
        info = self.image_info[image_id]
        if info["source"] == "field":
            return info["id"]
        else:
            super(self.__class__, self).image_reference(image_id)

In [14]:
def train(model, dataset_dir, subset):
    """Train the model."""
    # Training dataset.
    dataset_train = ImageryDataset()
    dataset_train.load_wv2(dataset_dir, "train")
    dataset_train.prepare()

    # Validation dataset
    dataset_val = ImageryDataset()
    dataset_val.load_wv2(dataset_dir, "test")
    dataset_val.prepare()

    # Image augmentation
    # http://imgaug.readthedocs.io/en/latest/source/augmenters.html
    augmentation = iaa.SomeOf((0, 2), [
        iaa.Fliplr(0.5),
        iaa.Flipud(0.5),
        iaa.OneOf([iaa.Affine(rotate=90),
                   iaa.Affine(rotate=180),
                   iaa.Affine(rotate=270)]),
        iaa.Multiply((0.8, 1.5)),
        iaa.GaussianBlur(sigma=(0.0, 5.0))
    ])

    # *** This training schedule is an example. Update to your needs ***

    print("Train all layers")
    model.train(dataset_train, dataset_val,
                learning_rate=config.LEARNING_RATE,
                epochs=40,
                augmentation=augmentation,
                layers='all')


############################################################
#  RLE Encoding
############################################################

def rle_encode(mask):
    """Encodes a mask in Run Length Encoding (RLE).
    Returns a string of space-separated values.
    """
    assert mask.ndim == 2, "Mask must be of shape [Height, Width]"
    # Flatten it column wise
    m = mask.T.flatten()
    # Compute gradient. Equals 1 or -1 at transition points
    g = np.diff(np.concatenate([[0], m, [0]]), n=1)
    # 1-based indicies of transition points (where gradient != 0)
    rle = np.where(g != 0)[0].reshape([-1, 2]) + 1
    # Convert second index in each pair to lenth
    rle[:, 1] = rle[:, 1] - rle[:, 0]
    return " ".join(map(str, rle.flatten()))

def rle_decode(rle, shape):
    """Decodes an RLE encoded list of space separated
    numbers and returns a binary mask."""
    rle = list(map(int, rle.split()))
    rle = np.array(rle, dtype=np.int32).reshape([-1, 2])
    rle[:, 1] += rle[:, 0]
    rle -= 1
    mask = np.zeros([shape[0] * shape[1]], np.bool)
    for s, e in rle:
        assert 0 <= s < mask.shape[0]
        assert 1 <= e <= mask.shape[0], "shape: {}  s {}  e {}".format(shape, s, e)
        mask[s:e] = 1
    # Reshape and transpose
    mask = mask.reshape([shape[1], shape[0]]).T
    return mask


def mask_to_rle(image_id, mask, scores):
    "Encodes instance masks to submission format."
    assert mask.ndim == 3, "Mask must be [H, W, count]"
    # If mask is empty, return line with image ID only
    if mask.shape[-1] == 0:
        return "{},".format(image_id)
    # Remove mask overlaps
    # Multiply each instance mask by its score order
    # then take the maximum across the last dimension
    order = np.argsort(scores)[::-1] + 1  # 1-based descending
    mask = np.max(mask * np.reshape(order, [1, 1, -1]), -1)
    # Loop over instance masks
    lines = []
    for o in order:
        m = np.where(mask == o, 1, 0)
        # Skip if empty
        if m.sum() == 0.0:
            continue
        rle = rle_encode(m)
        lines.append("{}, {}".format(image_id, rle))
    return "\n".join(lines)


############################################################
#  Detection
############################################################

def detect(model, dataset_dir, subset):
    """Run detection on images in the given directory."""
    print("Running on {}".format(dataset_dir))

    # Create directory
    if not os.path.exists(RESULTS_DIR):
        os.makedirs(RESULTS_DIR)
    submit_dir = "submit_{:%Y%m%dT%H%M%S}".format(datetime.datetime.now())
    submit_dir = os.path.join(RESULTS_DIR, submit_dir)
    os.makedirs(submit_dir)

    # Read dataset
    dataset = ImageryDataset()
    dataset.load_wv2(dataset_dir, subset)
    dataset.prepare()
    # Load over images
    submission = []
    for image_id in dataset.image_ids:
        # Load image and run detection
        image = dataset.load_image(image_id)
        # Detect objects
        r = model.detect([image], verbose=0)[0]
        # Encode image to RLE. Returns a string of multiple lines
        source_id = dataset.image_info[image_id]["id"]
        rle = mask_to_rle(source_id, r["masks"], r["scores"])
        submission.append(rle)
        # Save image with masks
        visualize.display_instances(
            image, r['rois'], r['masks'], r['class_ids'],
            dataset.class_names, r['scores'],
            show_bbox=False, show_mask=False,
            title="Predictions")
        plt.savefig("{}/{}.png".format(submit_dir, dataset.image_info[image_id]["id"]))

    # Save to csv file
    submission = "ImageId,EncodedPixels\n" + "\n".join(submission)
    file_path = os.path.join(submit_dir, "submit.csv")
    with open(file_path, "w") as f:
        f.write(submission)
    print("Saved to ", submit_dir)

### Train the model, trying without initial weights
need to generate an empty mask for images without fields
or
toss images and masks where there are no fields (probably the worse option, bias)

In [31]:
from IPython.core.debugger import set_trace
config = ImageryConfig(8)
model = modellib.MaskRCNN(mode="training", config=config,
                                  model_dir=MODEL_DIR)
train(model, ROOT_DIR, "train")

Train all layers

Starting at epoch 0. LR=0.001

Checkpoint Path: /home/rave/tana-crunch/waves/deepimagery/data/raw/wv2/models/wv2-gridded20180624T0848/mask_rcnn_wv2-gridded_{epoch:04d}.h5
Selecting layers to train
conv1                  (Conv2D)
bn_conv1               (BatchNorm)
res2a_branch2a         (Conv2D)
bn2a_branch2a          (BatchNorm)
res2a_branch2b         (Conv2D)
bn2a_branch2b          (BatchNorm)
res2a_branch2c         (Conv2D)
res2a_branch1          (Conv2D)
bn2a_branch2c          (BatchNorm)
bn2a_branch1           (BatchNorm)
res2b_branch2a         (Conv2D)
bn2b_branch2a          (BatchNorm)
res2b_branch2b         (Conv2D)
bn2b_branch2b          (BatchNorm)
res2b_branch2c         (Conv2D)
bn2b_branch2c          (BatchNorm)
res2c_branch2a         (Conv2D)
bn2c_branch2a          (BatchNorm)
res2c_branch2b         (Conv2D)
bn2c_branch2b          (BatchNorm)
res2c_branch2c         (Conv2D)
bn2c_branch2c          (BatchNorm)
res3a_branch2a         (Conv2D)
bn3a_branch2a   

  "Converting sparse IndexedSlices to a dense Tensor of unknown shape. "
ERROR:root:Error processing image {'id': 'ZA0565810', 'source': 'wv2', 'path': '/home/rave/tana-crunch/waves/deepimagery/data/raw/wv2/train/ZA0565810/image/ZA0565810_OSGS_ms.tif'}
Traceback (most recent call last):
  File "/opt/anaconda3/envs/maskrcnn/lib/python3.6/site-packages/mask_rcnn-2.1-py3.6.egg/mrcnn/model.py", line 1695, in data_generator
    use_mini_mask=config.USE_MINI_MASK)
  File "/opt/anaconda3/envs/maskrcnn/lib/python3.6/site-packages/mask_rcnn-2.1-py3.6.egg/mrcnn/model.py", line 1218, in load_image_gt
    mask = utils.resize_mask(mask, scale, padding, crop)
  File "/opt/anaconda3/envs/maskrcnn/lib/python3.6/site-packages/mask_rcnn-2.1-py3.6.egg/mrcnn/utils.py", line 513, in resize_mask
    mask = scipy.ndimage.zoom(mask, zoom=[scale, scale, 1], order=0)
  File "/opt/anaconda3/envs/maskrcnn/lib/python3.6/site-packages/scipy/ndimage/interpolation.py", line 606, in zoom
    zoom = _ni_support._normal

RuntimeError: sequence argument must have length equal to input rankERROR:root:Error processing image {'id': 'ZA0159040', 'source': 'wv2', 'path': '/home/rave/tana-crunch/waves/deepimagery/data/raw/wv2/train/ZA0159040/image/ZA0159040_OSGS_ms.tif'}
Traceback (most recent call last):
  File "/opt/anaconda3/envs/maskrcnn/lib/python3.6/site-packages/mask_rcnn-2.1-py3.6.egg/mrcnn/model.py", line 1695, in data_generator
    use_mini_mask=config.USE_MINI_MASK)
  File "/opt/anaconda3/envs/maskrcnn/lib/python3.6/site-packages/mask_rcnn-2.1-py3.6.egg/mrcnn/model.py", line 1218, in load_image_gt
    mask = utils.resize_mask(mask, scale, padding, crop)
  File "/opt/anaconda3/envs/maskrcnn/lib/python3.6/site-packages/mask_rcnn-2.1-py3.6.egg/mrcnn/utils.py", line 513, in resize_mask
    mask = scipy.ndimage.zoom(mask, zoom=[scale, scale, 1], order=0)
  File "/opt/anaconda3/envs/maskrcnn/lib/python3.6/site-packages/scipy/ndimage/interpolation.py", line 606, in zoom
    zoom = _ni_support._normalize_s

Epoch 1/40


ERROR:root:Error processing image {'id': 'ZA0492082', 'source': 'wv2', 'path': '/home/rave/tana-crunch/waves/deepimagery/data/raw/wv2/train/ZA0492082/image/ZA0492082_OSGS_ms.tif'}
Traceback (most recent call last):
  File "/opt/anaconda3/envs/maskrcnn/lib/python3.6/site-packages/mask_rcnn-2.1-py3.6.egg/mrcnn/model.py", line 1758, in data_generator
    batch_images[b] = mold_image(image.astype(np.float32), config)
  File "/opt/anaconda3/envs/maskrcnn/lib/python3.6/site-packages/mask_rcnn-2.1-py3.6.egg/mrcnn/model.py", line 2757, in mold_image
    return images.astype(np.float32) - config.MEAN_PIXEL
ValueError: operands could not be broadcast together with shapes (256,256,8) (3,) 
ERROR:root:Error processing image {'id': 'ZA0158188', 'source': 'wv2', 'path': '/home/rave/tana-crunch/waves/deepimagery/data/raw/wv2/train/ZA0158188/image/ZA0158188_OSGS_ms.tif'}
Traceback (most recent call last):
  File "/opt/anaconda3/envs/maskrcnn/lib/python3.6/site-packages/mask_rcnn-2.1-py3.6.egg/mrcnn/mo

RuntimeError: sequence argument must have length equal to input rank
ERROR:root:Error processing image {'id': 'ZA0558650', 'source': 'wv2', 'path': '/home/rave/tana-crunch/waves/deepimagery/data/raw/wv2/train/ZA0558650/image/ZA0558650_OSGS_ms.tif'}
Traceback (most recent call last):
  File "/opt/anaconda3/envs/maskrcnn/lib/python3.6/site-packages/mask_rcnn-2.1-py3.6.egg/mrcnn/model.py", line 1695, in data_generator
    use_mini_mask=config.USE_MINI_MASK)
  File "/opt/anaconda3/envs/maskrcnn/lib/python3.6/site-packages/mask_rcnn-2.1-py3.6.egg/mrcnn/model.py", line 1218, in load_image_gt
    mask = utils.resize_mask(mask, scale, padding, crop)
  File "/opt/anaconda3/envs/maskrcnn/lib/python3.6/site-packages/mask_rcnn-2.1-py3.6.egg/mrcnn/utils.py", line 513, in resize_mask
    mask = scipy.ndimage.zoom(mask, zoom=[scale, scale, 1], order=0)
  File "/opt/anaconda3/envs/maskrcnn/lib/python3.6/site-packages/scipy/ndimage/interpolation.py", line 606, in zoom
    zoom = _ni_support._normalize_

RuntimeError: sequence argument must have length equal to input rank
ERROR:root:Error processing image {'id': 'ZA0493401', 'source': 'wv2', 'path': '/home/rave/tana-crunch/waves/deepimagery/data/raw/wv2/train/ZA0493401/image/ZA0493401_OSGS_ms.tif'}
Traceback (most recent call last):
  File "/opt/anaconda3/envs/maskrcnn/lib/python3.6/site-packages/mask_rcnn-2.1-py3.6.egg/mrcnn/model.py", line 1758, in data_generator
    batch_images[b] = mold_image(image.astype(np.float32), config)
  File "/opt/anaconda3/envs/maskrcnn/lib/python3.6/site-packages/mask_rcnn-2.1-py3.6.egg/mrcnn/model.py", line 2757, in mold_image
    return images.astype(np.float32) - config.MEAN_PIXEL
ValueError: operands could not be broadcast together with shapes (256,256,8) (3,) 
ERROR:root:Error processing image {'id': 'ZA0804423', 'source': 'wv2', 'path': '/home/rave/tana-crunch/waves/deepimagery/data/raw/wv2/train/ZA0804423/image/ZA0804423_OSGS_ms.tif'}
Traceback (most recent call last):
  File "/opt/anaconda3/envs/

RuntimeError: sequence argument must have length equal to input rank