In [None]:
# Pick up live edits to imported project modules without restarting the kernel.
%load_ext autoreload
%autoreload 2

In [None]:
import segmentation_models_pytorch as smp
from segmentation_models_pytorch.encoders import get_preprocessing_fn

In [None]:
import os
import wandb
# Uncomment to run wandb in 'dryrun' mode.
#os.environ['WANDB_MODE'] = 'dryrun'
# Name of this notebook, exported for wandb to read from the environment.
os.environ['WANDB_NOTEBOOK_NAME'] = 'data.ipynb'
# The project is passed by keyword: the meaning of wandb.init's first positional
# parameter has changed between wandb releases and, in the releases I know of,
# it is not `project`, so a bare positional string does not select the project.
# NOTE(review): confirm "sky-eye-full" is the intended project name for this run.
wandb.init(project="sky-eye-full")
# Run-level hyperparameter store; every `conf.<name> = ...` below is recorded on it.
conf = wandb.config

In [None]:
from glob import glob
# Root of the xView dataset. It can be overridden with the XVIEW_DATA_ROOT
# environment variable so the notebook is not tied to one container layout;
# when the variable is unset the original hard-coded location is used.
data_root = os.environ.get('XVIEW_DATA_ROOT', '/home/jovyan/work/datasets/xview')
train_dir = f'{data_root}/train'
test_dir = f'{data_root}/test'

In [None]:
from tqdm import tqdm_notebook as tqdm
import numpy as np
import torch
from torch import nn
from xv.util import vis_im_mask
import segmentation_models_pytorch as smp

In [None]:
# Hyperparameters for this run. Everything is stored on the wandb config object
# (`conf`) and read back from it by the cells below.

# Probability passed as `p` to every augmentation in the `augment` pipeline.
conf.aug_prob = .5
# Which heads to train/evaluate: "pre" is the building head, "post" is the
# damage head. train_post also decides whether the damage layer is built at all.
conf.train_pre = True
conf.train_post = False

# Passed as `nclasses` to the damage layer.
conf.n_dmg_classes = 4
# Batch size for both the train and dev loaders.
conf.batch_size = 12
# Side length of the square resolution handed to the datasets.
conf.image_size = 512

# Forwarded to the datasets as `damage_scale_mode`.
conf.damage_scale_mode = 'ordinal'

# Key into `block_types` ('bottleneck' or 'basic') for the damage layer.
conf.blocktype = 'bottleneck'

# Damage-layer geometry, forwarded to DownscaleLayer as blocks / strides / growth_rate.
conf.blocks = [2, 4]
conf.strides = [2, 2]
conf.growth_rate = 1

# When `pretrained_model` is set on the config, the model cell loads the building
# segmenter through get_model(...) instead of segmentation_models_pytorch.
#conf.pretrained_model = 'selimsef_spacenet4_densenet121unet'
#conf.pretrained = True

# Key into `segmentation_types` and the encoder name passed to it.
conf.segmentation_arch = 'Linknet'
conf.encoder = 'efficientnet-b2'

# Product of all strides; handed to the datasets as `dmg_downscale_ratio`.
dmg_downscale=1
for s in conf.strides:
    dmg_downscale *= s
    
conf.dmg_downscale_ratio = dmg_downscale


In [None]:
import albumentations as al

# Augmentation pipeline for the training set. Each entry is a transform class
# plus its extra keyword arguments; all of them are applied with probability
# conf.aug_prob, in the order listed.
_augmentation_specs = [
    (al.HorizontalFlip, {}),
    (al.VerticalFlip, {}),
    (al.RandomRotate90, {}),
    (al.Transpose, {}),
    (al.GridDistortion, {'distort_limit': .2}),
    (al.ShiftScaleRotate, {}),
    (al.RandomBrightnessContrast, {}),
]

augment = al.Compose([
    transform_cls(p=conf.aug_prob, **extra_kwargs)
    for transform_cls, extra_kwargs in _augmentation_specs
])

In [None]:
from xv.nn.solaris.model_io import get_model
from xv.nn.nets import DownscaleLayer, XVNet
from torchvision.models.resnet import BasicBlock, Bottleneck
import segmentation_models_pytorch as smp


# Residual block classes selectable through conf.blocktype.
block_types = dict(bottleneck=Bottleneck, basic=BasicBlock)

# segmentation_models_pytorch architectures selectable through conf.segmentation_arch.
segmentation_types = dict(
    PSPNet=smp.PSPNet,
    FPN=smp.FPN,
    Linknet=smp.Linknet,
    Unet=smp.Unet,
)

# Building segmenter: built from segmentation_models_pytorch unless the config
# names a pretrained model, in which case it is loaded through get_model and no
# encoder-specific preprocessing function is used.
if 'pretrained_model' not in dict(conf):
    segmenter_cls = segmentation_types[conf.segmentation_arch]
    building_seg = segmenter_cls(conf.encoder, classes=1, activation='sigmoid')
    preprocess_fn = get_preprocessing_fn(conf.encoder)
else:
    building_seg = get_model(conf.pretrained_model, 'torch', pretrained=conf.pretrained)
    preprocess_fn = None

# Damage head: only constructed when the post (damage) task is trained.
damage = None
if conf.train_post:
    damage = DownscaleLayer(
        inplanes=building_seg.final_filters,
        blocks=conf.blocks,
        strides=conf.strides,
        block=block_types[conf.blocktype],
        nclasses=conf.n_dmg_classes,
        growth_rate=conf.growth_rate,
    )

# XVNet receives the segmenter and the (possibly absent) damage head; move it to the GPU.
model = XVNet(building_seg, damage).to('cuda')

In [None]:
from xv.nn import dataset
from xv import util
import random

# Fraction of the instances held out as the dev set, and DataLoader worker count.
DEV_FRACTION = .20
NUM_WORKERS = 10

instances = dataset.XViewSegmentationDataset.get_instances(train_dir)

# Seed with the string itself rather than hash(string): Python salts str hashes
# per process, so hash("😂") differs on every kernel restart and the train/dev
# split would silently change between sessions (leaking dev data into training
# when a checkpoint is resumed). random.seed() derives a stable seed from a str.
# NOTE(review): this assumes get_instances returns the instances in a stable
# order; if it follows directory listing order, sort before shuffling.
random.seed("😂")
random.shuffle(instances)

dev_ix = int(len(instances)*DEV_FRACTION)
dev_instances = instances[:dev_ix]
train_instances = instances[dev_ix:]
# The original bare tuple expression was not the last line of the cell, so it
# displayed nothing; print the split sizes explicitly.
print(f'train instances: {len(train_instances)}, dev instances: {len(dev_instances)}')

# Settings shared by the train and dev datasets; only the instances and the
# augmentation differ (the dev set is never augmented).
dataset_kwargs = dict(
    resolution=(conf.image_size, conf.image_size),
    dmg_downscale_ratio=conf.dmg_downscale_ratio,
    damage_scale_mode=conf.damage_scale_mode,
    preprocess_fn=preprocess_fn,
)

train_dataset = dataset.XViewSegmentationDataset(
    instances=train_instances,
    augment=augment,
    **dataset_kwargs,
)

dev_dataset = dataset.XViewSegmentationDataset(
    instances=dev_instances,
    augment=None,
    **dataset_kwargs,
)

loader_kwargs = dict(
    batch_size=conf.batch_size,
    num_workers=NUM_WORKERS,
    pin_memory=True,
)

train_loader = torch.utils.data.DataLoader(train_dataset, shuffle=True, **loader_kwargs)

# Evaluation averages over the whole dev set, so shuffling it buys nothing and
# only makes per-batch behaviour harder to reproduce.
dev_loader = torch.utils.data.DataLoader(dev_dataset, shuffle=False, **loader_kwargs)

In [None]:
from xv.nn.losses import loss_dict, WeightedLoss

# Weight of each loss term; the keys are looked up in xv.nn.losses.loss_dict.
# Candidates that were left switched off in this cell: 'bcewithlogits', 'jaccard'.
conf.loss_weights = dict(dice=1, focal=1)

# Instantiate each selected loss and map the instance to its weight, which is
# the mapping handed to WeightedLoss.
weighted_terms = {
    loss_dict[loss_name](): weight
    for loss_name, weight in conf.loss_weights.items()
}
loss = WeightedLoss(weighted_terms)

In [None]:
import apex

# Optimizer classes selectable through conf.optim.
optims = dict(adam=torch.optim.Adam)

conf.optim = 'adam'
conf.lr = 0.0005

# Look the class up by its configured name, then build it over all model parameters.
optimizer_cls = optims[conf.optim]
optim = optimizer_cls(model.parameters(), lr=conf.lr)

In [None]:
from apex import amp

In [None]:
from apex import amp
# apex amp optimisation level, stored on the run config.
conf.amp_opt_level = 'O1'
# amp.initialize hands back the model and optimizer to use from here on, so both
# notebook-level names are rebound. Run this cell once per kernel session.
model, optim = amp.initialize(
    models=model,
    optimizers=optim,
    opt_level=conf.amp_opt_level,
)

In [None]:
# Hand the model to wandb.watch; the trailing semicolon suppresses the cell's output.
wandb.watch(model);

In [None]:
# Learning-rate schedule settings, stored on the run config.
conf.scheduler_factor = 0.5
conf.scheduler_patience = 5

# The scheduler is stepped with the dev loss once per epoch by the training loop.
plateau_scheduler_cls = torch.optim.lr_scheduler.ReduceLROnPlateau
scheduler = plateau_scheduler_cls(
    optim,
    factor=conf.scheduler_factor,
    patience=conf.scheduler_patience,
)

In [None]:
# Multipliers applied to the building ("pre") and damage ("post") losses in
# train() and evaluate(); when both heads are active the combined loss is
# divided by their sum.
conf.pre_weight = 1.
conf.post_weight = 1.

In [None]:
from collections import defaultdict
def train(model, optim, data, loss_fn, train_pre=True, train_post=True):
    """Run one optimisation pass over `data` and return the mean losses.

    Args:
        model: network called as `model(images)` for the building head and as
            `model(images, downscale=True)` for the damage head.
        optim: optimizer, stepped once per batch; the loss is scaled through
            `amp.scale_loss` before the backward pass.
        data: iterable of batches supporting `len()`. Each batch is a dict with
            'images' ('image' / 'post') and 'masks' ('buildings' / 'damage').
        loss_fn: callable `(prediction, target)` returning a scalar tensor.
        train_pre: include the building loss, weighted by `conf.pre_weight`.
        train_post: include the damage loss, weighted by `conf.post_weight`.

    Returns:
        dict with 'loss', 'loss_pre' and 'loss_post', each averaged over the
        number of batches. The values are detached from the autograd graph;
        the entry of a disabled head is None.

    Raises:
        ValueError: if both `train_pre` and `train_post` are false, since there
            would be nothing to back-propagate.
    """
    if not (train_pre or train_post):
        raise ValueError("train() needs at least one of train_pre / train_post enabled")

    model = model.train()
    loss_sum, loss_pre_sum, loss_post_sum = 0., 0., 0.

    # Iterating the loader directly (not iter(loader)) lets tqdm read its length
    # and show a total.
    for batch in tqdm(data):
        optim.zero_grad()
        loss = 0.

        if train_pre:
            pre_out = model(batch['images']['image'].to('cuda'))
            pre_targets = batch['masks']['buildings'].to('cuda')
            loss_pre = conf.pre_weight*loss_fn(pre_out, pre_targets)
            loss += loss_pre
            # Detach before accumulating: summing the live loss tensors would
            # chain every batch's autograd history into the running total.
            loss_pre_sum += loss_pre.detach()

        if train_post:
            post_out = model(batch['images']['post'].to('cuda'), downscale=True)
            post_targets = batch['masks']['damage'].to('cuda')
            # zip walks the leading dimension of outputs and targets together.
            loss_post = conf.post_weight*sum(
                loss_fn(mask_out, mask) for mask_out, mask in zip(post_out, post_targets)
            )
            loss_post /= post_out.shape[1]
            loss += loss_post
            loss_post_sum += loss_post.detach()

        if train_pre and train_post:
            # Keep the combined loss on the scale of a single weighted term.
            loss /= (conf.pre_weight+conf.post_weight)

        with amp.scale_loss(loss, optim) as scaled_loss:
            scaled_loss.backward()
        optim.step()

        loss_sum += loss.detach()

    return {
        'loss': loss_sum/len(data),
        'loss_pre': loss_pre_sum/len(data) if train_pre else None,
        'loss_post': loss_post_sum/len(data) if train_post else None
    }

def batch_metrics(outputs, targets, threshold=0.5):
    """Average per-sample recall, precision and F1 over a batch.

    Each output is passed through a sigmoid and binarised at `threshold`; each
    target is cast to bool. A sample whose recall or precision is undefined
    (mean over an empty selection, i.e. NaN) scores 1 for that quantity.

    Args:
        outputs: sequence of raw prediction tensors, one per sample.
        targets: sequence of target tensors matching `outputs`.
        threshold: cut-off applied to the sigmoid of each output.

    Returns:
        dict with keys 'recall', 'precision' and 'f1', each the sum over the
        samples divided by `len(outputs)`.
    """
    def _mean_or_one(selected):
        # Mean of the selected booleans; an empty selection yields NaN -> 1.
        value = selected.float().mean()
        return 1. if torch.isnan(value) else value

    recall_total, precision_total, f1_total = 0., 0., 0.
    for prediction, truth in zip(outputs, targets):
        truth_mask = truth.to(torch.bool)
        predicted_mask = prediction.sigmoid() > threshold

        # Recall: share of true pixels that were predicted.
        recall = _mean_or_one(predicted_mask[truth_mask])
        # Precision: share of predicted pixels that are true.
        precision = _mean_or_one(truth_mask[predicted_mask])

        if (precision + recall) > 0.:
            f1 = 2*precision*recall/(precision + recall)
        else:
            f1 = 0.

        precision_total += precision
        recall_total += recall
        f1_total += f1

    n_samples = len(outputs)
    return {
        'recall': recall_total/n_samples,
        'precision': precision_total/n_samples,
        'f1': f1_total/n_samples
    }
    

def evaluate(model, optim, data, loss_fn, threshold=0.5, eval_pre=True, eval_post=True):
    """Evaluate `model` on `data` without gradients and return averaged metrics.

    Args:
        model: network called as `model(images)` for the building head and as
            `model(images, downscale=True)` for the damage head.
        optim: unused; kept so the signature mirrors `train`.
        data: iterable of batches supporting `len()`, laid out as for `train`.
        loss_fn: callable `(prediction, target)` returning a scalar tensor.
        threshold: binarisation threshold forwarded to `batch_metrics`.
        eval_pre: evaluate the building head.
        eval_post: evaluate the damage head.

    Returns:
        dict mapping metric name to its mean over the batches. Always contains
        'loss'. With `eval_pre` it adds 'loss_pre' and 'building_<metric>'.
        With `eval_post` it adds 'loss_post', 'dmg_<class>_<metric>' for every
        entry of `train_dataset.DAMAGE_CLASSES`, and 'dmg_macro_<metric>'.
    """
    model = model.eval()
    metrics = defaultdict(float)

    with torch.no_grad():
        # Iterating the loader directly lets tqdm read its length for the total.
        for batch in tqdm(data):
            loss = 0.

            if eval_pre:
                pre_out = model(batch['images']['image'].to('cuda'))
                pre_targets = batch['masks']['buildings'].to('cuda')
                loss_pre = conf.pre_weight*loss_fn(pre_out, pre_targets)
                metrics['loss_pre'] += loss_pre
                loss += loss_pre
                # Forward the caller's threshold; it used to be silently ignored.
                for k, v in batch_metrics(pre_out, pre_targets, threshold=threshold).items():
                    metrics[f'building_{k}'] += v

            if eval_post:
                post_out = model(batch['images']['post'].to('cuda'), downscale=True)
                post_targets = batch['masks']['damage'].to('cuda')
                loss_post = conf.post_weight*sum(
                    loss_fn(mask_out, mask) for mask_out, mask in zip(post_out, post_targets)
                )
                # Apply the same division by post_out.shape[1] that train() uses,
                # so the train and dev damage losses are on the same scale.
                loss_post = loss_post / post_out.shape[1]
                metrics['loss_post'] += loss_post
                loss += loss_post

                # Per-class metrics on the class's channel, plus their macro average.
                macro_metrics = defaultdict(float)
                for dmg_type, ix in train_dataset.DAMAGE_CLASSES.items():
                    class_metrics = batch_metrics(post_out[:, ix], post_targets[:, ix], threshold=threshold)
                    for k, v in class_metrics.items():
                        metrics[f'dmg_{dmg_type}_{k}'] += v
                        macro_metrics[k] += v
                for k, v in macro_metrics.items():
                    metrics[f'dmg_macro_{k}'] += v/len(train_dataset.DAMAGE_CLASSES)

            if eval_pre and eval_post:
                # Keep the combined loss on the scale of a single weighted term.
                loss /= conf.pre_weight+conf.post_weight

            metrics['loss'] += loss

    return {k: v/len(data) for k, v in metrics.items()}

In [None]:
# Upper bound of the epoch range used by the training loop.
conf.epochs = 140
# Lowest dev loss seen so far; the training loop saves a checkpoint whenever the
# dev loss drops below it.
best_loss = 1e5
# First epoch the training loop will run. It lives in its own cell so the loop
# cell can be re-run to continue from the epoch it last reached; re-running THIS
# cell resets both the epoch counter and best_loss.
epoch = 0

In [None]:
# Main loop. It starts from the current value of `epoch`, so re-running this
# cell continues from the epoch that was last reached.
for epoch in range(epoch, conf.epochs):
    train_stats = train(
        model, optim, train_loader, loss,
        train_pre=conf.train_pre, train_post=conf.train_post,
    )
    dev_stats = evaluate(
        model, optim, dev_loader, loss,
        eval_pre=conf.train_pre, eval_post=conf.train_post,
    )

    # One flat record per epoch: training stats get a 'train_' prefix, dev stats
    # keep their own names.
    metrics = {'epoch': epoch}
    for stat_name, stat_value in train_stats.items():
        metrics[f'train_{stat_name}'] = stat_value
    metrics.update(dev_stats)

    dev_loss = metrics['loss']
    scheduler.step(dev_loss)
    wandb.log(metrics)

    # Keep only the weights of the best epoch so far, inside the wandb run directory.
    if dev_loss < best_loss:
        torch.save(model.state_dict(), os.path.join(wandb.run.dir, "state_dict.pth"))
        best_loss = dev_loss

In [None]:
# Overlay the damage mask of one training sample on its 'post' image.
ix = 1000
i = train_dataset[ix]
images = i['images']
masks = i['masks']
# inverse_transform_image presumably undoes the dataset's image transform so the
# picture can be displayed -- TODO confirm against the dataset class.
image = np.array(train_dataset.inverse_transform_image(images['post']))

util.vis_im_mask(image, masks['damage'], size=(1024, 1024), opacity=.3);

In [None]:
from collections import Counter
# Histogram of the number of 'pre' features per training instance.
feature_counts = (len(instance['pre']['features']) for instance in train_dataset.instances)
counts = Counter(feature_counts)

In [None]:
# Fraction of training instances that have no 'pre' features at all.
counts[0]/sum(counts.values())

In [None]:
# Display the full run configuration, sorted by key.
sorted(dict(conf).items())