# Watershed Distance Transform for 2D Data
---
This notebook implements the methods described in the following papers:

[Deep Watershed Transform for Instance Segmentation](http://openaccess.thecvf.com/content_cvpr_2017/papers/Bai_Deep_Watershed_Transform_CVPR_2017_paper.pdf)

[Learn to segment single cells with deep distance estimator and deep cell detector](https://arxiv.org/abs/1803.10829)

In [1]:
import os
import errno

import numpy as np

import deepcell
from tensorflow.python import keras




In [2]:
from deepcell.utils.train_utils import rate_scheduler
from tensorflow.keras.optimizers import SGD

# ---- General training settings ----
n_epoch = 9             # number of training epochs
test_size = 0.10        # fraction of the data saved as test (0.10 = 10%)
norm_method = 'std'     # data normalization method
receptive_field = 81    # should be adjusted for the scale of the data

# Learning-rate schedule and optimizer; both start from a rate of 0.01.
lr_sched = rate_scheduler(lr=0.01, decay=0.99)
optimizer = SGD(lr=0.01, decay=1e-6, momentum=0.9, nesterov=True)

# ---- Sample mode settings ----
batch_size = 64         # number of images per batch (should be 2 ^ n)
# Sample window size; for an odd receptive field, receptive_field == 2 * win + 1.
win = (receptive_field - 1) // 2
balance_classes = True  # sample each class equally
max_class_samples = 1e6  # max number of samples per class

# ---- Transformation settings ----
transform = 'watershed'
# NOTE(review): the watershed model name used in this notebook ends in
# "_5bins" and the recorded training log reports 5 classes, while this value
# is 4 -- confirm which one is intended before re-running.
distance_bins = 4       # number of distance "classes"
erosion_width = 1       # erode edges

In [3]:
# Dataset location and the directories/names used for saved models and logs.
base_name = 'Decidua_Object_Train_Small_Nuclei'
npz_name = '/data/npz_data/' + base_name + ".npz"
MODEL_DIR = '/data/models/' + '20190808_decidua_small_nuclei'

# exist_ok=True creates the directory only when it is missing, without the
# check-then-create race of a separate os.path.isdir() test.
os.makedirs(MODEL_DIR, exist_ok=True)

LOG_DIR = '/data/logs'

# File-name stems for the two models trained in this notebook.
sample_model_name = base_name + "_watershed_81_rf_64_conv_256_dense_300k_5bins"
fgbg_model_name = base_name + "_watershed_fgbg_81_rf_64_conv_256_dense_300k"

### Load the Training Data

In [4]:
# Axis of X that holds the image channels (the last axis of the 4-D array).
CHANNEL_AXIS = 3

# np.load on an .npz archive returns a lazy, file-backed object. Reading the
# arrays inside a `with` block closes the underlying file handle as soon as
# X and y have been loaded. `training_data` is closed after this block; use
# X and y from here on.
with np.load(npz_name) as training_data:
    X, y = training_data["X"], training_data["y"]

print("X.shape: {} & y.shape: {}".format(X.shape, y.shape))
# Uncomment to keep only the first channel of X:
#X = X[:, :, :, 0:1]

X.shape: (5, 1024, 1024, 6) & y.shape: (5, 1024, 1024, 1)


In [4]:
### First, create a foreground/background separation model

#### Instantiate the foreground/background (fgbg) model

In [5]:
# Build the foreground/background (fgbg) network from the DeepCell model zoo.
from deepcell import model_zoo

fgbg_model = model_zoo.bn_feature_net_2D(
    n_features=2,  # two output features: the fgbg training log reports 2 classes
    n_channels=X.shape[CHANNEL_AXIS],  # one input channel per channel in X
    receptive_field=receptive_field)

In [None]:
from deepcell.training import train_model_sample

# Train the foreground/background model in sample mode. The returned model
# replaces the untrained `fgbg_model`.
fgbg_model = train_model_sample(
    # -- model and data --
    model=fgbg_model,
    dataset=npz_name,
    model_name=fgbg_model_name,
    transform='fgbg',
    # -- optimisation --
    # n_epoch and batch_size are given as literals here, so this call does
    # not use the notebook-level n_epoch / batch_size settings.
    optimizer=optimizer,
    lr_sched=lr_sched,
    n_epoch=5,
    batch_size=128,
    # -- sampling --
    test_size=test_size,
    window_size=(win, win),
    balance_classes=balance_classes,
    max_class_samples=1000000,
    # -- augmentation --
    rotation_range=180,
    flip=True,
    shear=False,
    zoom_range=(0.8, 1.2),
    # -- outputs / checkpoints --
    model_dir=MODEL_DIR,
    log_dir=LOG_DIR,
    val_monitor=False,
    save_period=1)

using all data as training data
Using class weights of {0: 1.0, 1: 1.0}
X_train shape: (5, 1024, 1024, 6)
y_train shape: (5, 1024, 1024, 1)
Output Shape: (None, 2)
Number of Classes: 2
Training on 1 GPUs
the max_class_samples per image is 200000
analyzing image 0
the least represented class has 259505 examples
max_class_samples is less than the smalleset class, downsampling all classes
analyzing class 0
downsampling from 259505 examples per class
analyzing class 1
downsampling from 629744 examples per class
analyzing image 1
the least represented class has 226163 examples
max_class_samples is less than the smalleset class, downsampling all classes
analyzing class 0
downsampling from 226163 examples per class
analyzing class 1
downsampling from 663086 examples per class
analyzing image 2
the least represented class has 269108 examples
max_class_samples is less than the smalleset class, downsampling all classes
analyzing class 0
downsampling from 620141 examples per class
analyzing class

#### Instantiate the distance transform model

In [13]:
# Imports are repeated here so this cell can be run without the fgbg cells.
from deepcell.training import train_model_sample
from deepcell import model_zoo

# Build the distance-transform (watershed) network: one output feature per
# distance bin.
watershed_model = model_zoo.bn_feature_net_2D(
    n_features=distance_bins,
    n_channels=X.shape[CHANNEL_AXIS],
    receptive_field=receptive_field,
    n_dense_filters=256,
    n_conv_filters=64)

In [14]:
# Bare expression: being the only statement in the cell, its value (the
# watershed model's name) is echoed as the cell output.
sample_model_name
# Disabled: load previously saved weights into the watershed model before
# training. Uncomment and point at an existing .h5 file to use it.
#watershed_model.load_weights('/data/models/20190606_params/Point1_12_18_3X_interior_border_border_watershed_128_filters_balanced_epoch_40.h5')

'Decidua_Object_Train_Small_Nuclei_watershed_81_rf_64_conv_256_dense_300k_5bins'

#### Train the model

In [None]:
# Train the distance-transform (watershed) model in sample mode. The returned
# model replaces the untrained `watershed_model`.
watershed_model = train_model_sample(
    model=watershed_model,
    dataset=npz_name,
    model_name=sample_model_name,
    test_size=test_size,
    optimizer=optimizer,
    batch_size=batch_size,
    # Use the notebook-level settings instead of repeating their values, so
    # editing the settings cell actually changes this run.
    n_epoch=n_epoch,
    window_size=(win, win),
    transform=transform,
    distance_bins=distance_bins,
    erosion_width=erosion_width,
    balance_classes=balance_classes,
    # Kept as a literal: it differs from the notebook-level max_class_samples
    # (presumably on purpose -- the model name contains "300k"; confirm).
    max_class_samples=300000,
    model_dir=MODEL_DIR,
    log_dir=LOG_DIR,
    lr_sched=lr_sched,
    rotation_range=180,
    flip=True,
    shear=False,
    zoom_range=(0.8, 1.2),
    val_monitor=False,
    save_period=1)

using all data as training data
Using class weights of {0: 1.0, 1: 1.0, 2: 1.0, 3: 1.0, 4: 1.0}
X_train shape: (5, 1024, 1024, 6)
y_train shape: (5, 1024, 1024, 1)
Output Shape: (None, 5)
Number of Classes: 5
Training on 1 GPUs
the max_class_samples per image is 60000
analyzing image 0
the least represented class has 35379 examples
analyzing class 0
downsampling from 489607 examples per class
analyzing class 1
downsampling from 162204 examples per class
analyzing class 2
downsampling from 121323 examples per class
analyzing class 3
downsampling from 80736 examples per class
analyzing class 4
downsampling from 35379 examples per class
analyzing image 1
the least represented class has 36272 examples
analyzing class 0
downsampling from 469630 examples per class
analyzing class 1
downsampling from 172043 examples per class
analyzing class 2
downsampling from 127060 examples per class
analyzing class 3
downsampling from 84244 examples per class
analyzing class 4
downsampling from 36272 exam