In [1]:
import wandb
import pandas as pd
from fastai.vision.all import *
from fastai.callback.wandb import WandbCallback

import params
from utils import get_predictions, create_dice_table

In [2]:
# Fix the random seed up front, before any data loading or model creation,
# so that repeated runs of this notebook are comparable.
# NOTE(review): `reproducible=True` presumably also enables deterministic
# backend settings — confirm against the fastai `set_seed` documentation.
set_seed(42, reproducible=True)

In [3]:
# Hyperparameters for this training run. The namespace is passed to
# `wandb.init(config=...)` so the values are recorded alongside the run.
train_config = SimpleNamespace(
    framework="fastai",
    # size handed to the item-level resize
    img_size=(180, 320),
    # keep small in Colab to be manageable
    batch_size=8,
    # use data augmentation
    augment=True,
    # for brevity, increase for better results :)
    epochs=3,
    lr=2e-3,
    # whether to use pretrained encoder
    pretrained=True,
)

In [4]:
# Open a W&B run with job type "training"; project and entity come from
# `params`, and `train_config` is attached as the run configuration.
run = wandb.init(
    project=params.WANDB_PROJECT,
    entity=params.ENTITY,
    job_type="training",
    config=train_config,
)

[34m[1mwandb[0m: Currently logged in as: [33mdarek[0m. Use [1m`wandb login --relogin`[0m to force relogin


In [5]:
# Declare the ":latest" version of the processed-data artifact as an input of
# this run, so the dependency is attached to the run itself.
processed_data_at = run.use_artifact(f'{params.PROCESSED_DATA_AT}:latest')
# Download the artifact contents and keep the local directory as a Path.
processed_dataset_dir = Path(processed_data_at.download())
# Table describing the dataset split; later cells read its `Stage` and
# `File_Name` columns.
df = pd.read_csv(processed_dataset_dir / 'data_split.csv')

[34m[1mwandb[0m: Downloading large artifact bdd_simple_1k_split:latest, 813.25MB. 4010 files... Done. 0:0:2.4


In [6]:
# Drop the held-out test rows, renumber the index, and add the boolean
# `is_valid` column that marks validation rows.
df = (
    df.loc[df["Stage"] != "test"]
    .reset_index(drop=True)
    .assign(is_valid=lambda frame: frame["Stage"] == "valid")
)

In [7]:
def label_func(fname):
    """Return the mask path that corresponds to an image path.

    The mask is looked up in a `labels` directory that sits next to the
    image's own parent directory, and is named `<image stem>_mask.png`.

    Args:
        fname: path-like object exposing `.parent` and `.stem`
            (e.g. `pathlib.Path`).

    Returns:
        Path to the mask file for `fname`.
    """
    dataset_root = fname.parent.parent
    mask_name = f"{fname.stem}_mask.png"
    return dataset_root / "labels" / mask_name

In [8]:
# Attach full paths: each image lives under `images/` inside the downloaded
# dataset directory, and its mask path is derived with `label_func`.
df["image_fname"] = df["File_Name"].map(
    lambda file_name: processed_dataset_dir/f'images/{file_name}'
)
df["label_fname"] = df["image_fname"].map(label_func)

In [12]:
def get_data(df, bs=4, img_size=(180, 320), augment=True):
    """Build segmentation dataloaders from a dataframe of image/mask paths.

    Args:
        df: table with `image_fname` and `label_fname` columns, which are
            read through `ColReader`. The train/validation split is decided
            by `ColSplitter()` with its default arguments (presumably the
            `is_valid` column — confirm against the fastai docs).
        bs: batch size forwarded to `dataloaders`.
        img_size: size handed to the item-level `Resize`.
        augment: when true, `aug_transforms()` is used as the batch
            transforms; otherwise no batch transforms are set.

    Returns:
        The dataloaders produced by `DataBlock.dataloaders(df, bs=bs)`.
    """
    batch_transforms = aug_transforms() if augment else None
    segmentation_block = DataBlock(
        blocks=(ImageBlock, MaskBlock(codes=params.BDD_CLASSES)),
        get_x=ColReader("image_fname"),
        get_y=ColReader("label_fname"),
        splitter=ColSplitter(),
        item_tfms=Resize(img_size),
        batch_tfms=batch_transforms,
    )
    return segmentation_block.dataloaders(df, bs=bs)

In [13]:
# From here on, hyperparameters are read back through the W&B config object
# rather than from `train_config` directly.
config = wandb.config

In [14]:
# Build the dataloaders using the batch size, image size, and augmentation
# flag stored in the run configuration.
dls = get_data(
    df,
    bs=config.batch_size,
    img_size=config.img_size,
    augment=config.augment,
)

  ret = func(*args, **kwargs)


In [15]:
# U-Net learner on a ResNet-18 architecture, tracking foreground accuracy and
# multi-class Dice; `SaveModelCallback` is attached to the learner itself.
learn = unet_learner(
    dls,
    arch=resnet18,
    pretrained=config.pretrained,
    metrics=[foreground_acc, DiceMulti()],
    cbs=SaveModelCallback(),
)  # optionally chain .to_fp16() here to train in mixed precision

In [16]:
# Train with the one-cycle schedule for the configured number of epochs and
# learning rate. The W&B callback is attached for this fit only, with
# prediction logging off and model logging on.
learn.fit_one_cycle(
    config.epochs,
    config.lr,
    cbs=[WandbCallback(log_preds=False, log_model=True)],
)

epoch,train_loss,valid_loss,foreground_acc,dice_multi,time
0,0.804109,0.750861,0.129264,0.158541,00:50
1,0.470633,0.35229,0.825075,0.359599,00:50
2,0.324693,0.299168,0.870585,0.369735,00:51


Better model found at epoch 0 with valid_loss value: 0.7508609890937805.
Better model found at epoch 1 with valid_loss value: 0.35229042172431946.
Better model found at epoch 2 with valid_loss value: 0.2991684675216675.


In [18]:
# Collect samples, raw outputs, and predictions from the trained learner.
# NOTE(review): `get_predictions` lives in `utils`; which split it evaluates is
# not visible here — confirm against its implementation.
samples, outputs, predictions = get_predictions(learn)
# Build a table from those results and the class list in `params.BDD_CLASSES`
# (presumably per-class Dice scores, going by the helper's name — verify).
table = create_dice_table(samples, outputs, predictions, params.BDD_CLASSES)
# Log the table to the active W&B run under the key "pred_table".
wandb.log({"pred_table":table})

In [19]:
# Close the W&B run; the recorded output below shows the final upload and the
# run summary being printed at this point.
wandb.finish()

VBox(children=(Label(value='126.527 MB of 126.527 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0,…

0,1
dice_multi,▁██
epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
eps_0,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_1,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eps_2,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
foreground_acc,▁██
lr_0,▁▁▂▃▄▅▆▇███████▇▇▇▇▆▆▆▅▅▅▄▄▄▃▃▃▂▂▂▂▁▁▁▁▁
lr_1,▁▁▂▃▄▅▆▇███████▇▇▇▇▆▆▆▅▅▅▄▄▄▃▃▃▂▂▂▂▁▁▁▁▁
lr_2,▁▁▂▃▄▅▆▇███████▇▇▇▇▆▆▆▅▅▅▄▄▄▃▃▃▂▂▂▂▁▁▁▁▁
mom_0,██▇▆▅▄▃▂▁▁▁▁▁▁▁▂▂▂▂▃▃▃▄▄▄▅▅▅▆▆▆▇▇▇▇█████

0,1
dice_multi,0.36974
epoch,3.0
eps_0,1e-05
eps_1,1e-05
eps_2,1e-05
foreground_acc,0.87059
lr_0,0.0
lr_1,0.0
lr_2,0.0
mom_0,0.95
