# Just an exercise


In [1]:
import torch
import torch.nn as nn
import torchvision.transforms.functional as TF


In [2]:
class DoubleConv(nn.Module):
    """Two consecutive 3x3 convolution stages, each with batch norm and ReLU.

    Every convolution uses stride 1 and padding 1 and has no bias term. The
    first stage maps ``in_channels`` to ``out_channels``; the second keeps
    ``out_channels``.
    """

    def __init__(self, in_channels, out_channels):
        super().__init__()
        stages = []
        # Stage 1 consumes the input channels, stage 2 the output of stage 1.
        for stage_in in (in_channels, out_channels):
            stages.append(
                nn.Conv2d(
                    stage_in,
                    out_channels,
                    kernel_size=3,
                    stride=1,
                    padding=1,
                    bias=False,
                )
            )
            stages.append(nn.BatchNorm2d(out_channels))
            stages.append(nn.ReLU(inplace=True))
        self.conv = nn.Sequential(*stages)

    def forward(self, x):
        """Run ``x`` through both convolution stages and return the result."""
        out = self.conv(x)
        return out


In [3]:
class UNET(nn.Module):
    """U-Net style encoder/decoder assembled from ``DoubleConv`` blocks.

    The encoder applies one ``DoubleConv`` per entry in ``features``, each
    followed by a 2x2 max-pool. A bottleneck ``DoubleConv`` doubles the last
    feature count. The decoder then, for each feature count in reverse order,
    upsamples with a stride-2 transposed convolution, concatenates the
    matching encoder output (skip connection) along the channel axis and
    applies another ``DoubleConv``. A final 1x1 convolution maps to
    ``out_channels``.

    Args:
        in_channels: Number of channels of the input tensor.
        out_channels: Number of channels produced by the final 1x1 convolution.
        features: Channel counts of the encoder levels, shallowest first.
            Must be non-empty.
    """

    def __init__(self, in_channels=3, out_channels=1, features=(64, 128, 256, 512)):
        super().__init__()
        # Immutable default plus a private copy: the model never shares or
        # depends on a caller-owned (or default) mutable sequence.
        features = list(features)

        self.ups = nn.ModuleList()
        self.downs = nn.ModuleList()
        self.pool2d = nn.MaxPool2d(kernel_size=2, stride=2)

        # Encoder: each level starts from the previous level's channel count.
        for feature in features:
            self.downs.append(DoubleConv(in_channels, feature))
            in_channels = feature

        # Decoder: self.ups alternates [upsample, DoubleConv, upsample, ...].
        # The DoubleConv takes feature*2 channels because the upsampled map is
        # concatenated with the skip connection of the same width.
        for feature in reversed(features):
            self.ups.append(nn.ConvTranspose2d(
                feature * 2, feature, kernel_size=2, stride=2))
            self.ups.append(DoubleConv(feature * 2, feature))

        self.bottleneck = DoubleConv(features[-1], features[-1] * 2)
        self.finalConv = nn.Conv2d(features[0], out_channels, kernel_size=1)

    def forward(self, x):
        """Return the network output for the batch ``x``.

        ``x`` is indexed as a 4-D tensor (dims 2 and onward are treated as the
        spatial size when aligning skip connections).
        """
        skip_conn = []
        for down in self.downs:
            x = down(x)
            skip_conn.append(x)  # saved before pooling, for the decoder
            x = self.pool2d(x)

        x = self.bottleneck(x)
        # Deepest encoder output first, matching the decoder's order.
        skip_conn = skip_conn[::-1]

        for idx in range(0, len(self.ups), 2):
            x = self.ups[idx](x)
            skip_co = skip_conn[idx // 2]

            # Pooling can drop a row/column when a spatial size is odd, so the
            # upsampled map may not match the skip connection; only the
            # spatial dims matter for that check.
            if x.shape[2:] != skip_co.shape[2:]:
                x = TF.resize(x, size=skip_co.shape[2:])

            concat_skip = torch.cat((skip_co, x), dim=1)
            x = self.ups[idx + 1](concat_skip)

        return self.finalConv(x)


In [4]:
# Smoke test: feed a random single-channel batch through the network and
# check that the prediction has exactly the same shape as the input.
x = torch.randn(3, 1, 16, 16)
model = UNET(out_channels=1, in_channels=1)
preds = model(x)
# Uncomment to inspect the raw tensors:
# print('prediction: {}'.format(preds))
# print("original: {}".format(x))

assert x.shape == preds.shape


# (leftover notebook warning output) return torch.max_pool2d(input, kernel_size, stride, padding, dilation, ceil_mode)


In [5]:
import os
from PIL import Image
from torch.utils.data import Dataset
import numpy as np

In [6]:
class KomatsDataset(Dataset):
    """Dataset of image / binary-mask pairs stored in two directories.

    Every entry of ``img_dir`` is treated as one sample. The mask for an
    image is looked up in ``mask_dir`` under the image's file name with
    ``"rgb"`` replaced by ``"label"``.

    Args:
        img_dir: Directory containing the input images.
        mask_dir: Directory containing the corresponding masks.
        transform: Optional callable invoked as
            ``transform(image=image, mask=mask)``; its result must be
            indexable with ``"image"`` and ``"mask"``.
    """

    def __init__(self, img_dir, mask_dir, transform=None):
        self.img_dir = img_dir
        self.mask_dir = mask_dir
        self.transform = transform
        # os.listdir returns entries in arbitrary order; sort so that a given
        # index always refers to the same sample across runs and platforms.
        self.imgs = sorted(os.listdir(img_dir))

    def __len__(self):
        """Return the number of entries found in ``img_dir``."""
        return len(self.imgs)

    def __getitem__(self, index):
        """Load and return the ``(image, mask)`` pair at ``index``.

        The image is read as RGB into a NumPy array. The mask is read as
        8-bit grayscale into a float32 array and binarised: every non-zero
        pixel becomes 1.0. If a transform was given, both are replaced by
        the transform's ``"image"`` and ``"mask"`` outputs.
        """
        file_name = self.imgs[index]
        img_path = os.path.join(self.img_dir, file_name)
        mask_path = os.path.join(self.mask_dir, file_name.replace("rgb", "label"))

        # Context managers release the underlying file handles promptly
        # instead of leaving that to garbage collection.
        with Image.open(img_path) as img_file:
            image = np.array(img_file.convert("RGB"))
        with Image.open(mask_path) as mask_file:
            mask = np.array(mask_file.convert("L"), dtype=np.float32)
        mask[mask != 0] = 1.0

        if self.transform is not None:
            augmentation = self.transform(image=image, mask=mask)
            image = augmentation["image"]
            mask = augmentation["mask"]

        return image, mask

In [9]:
import albumentations as A
from albumentations.pytorch import ToTensorV2
from tqdm import tqdm 
import torch.optim as optim 
# from utils import (load_checkpoint, save_checkpoint, get_loaders, check_accuracy, save_predictions_as_imgs)


# Hyper Parameters

In [10]:
LEARNING_RATE = 1e-4
# Use the GPU when one is available, otherwise fall back to the CPU.
DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
BATCH_SIZE = 32
NUM_EPOCHS = 10
NUM_WORKERS = 2
IMAGE_HEIGHT = 480
IMAGE_WIDTH = 480
# Original (misspelled) name, kept as an alias so existing references still work.
IMAGE_WIDHT = IMAGE_WIDTH
PIN_MEMORY = True
LOAD_MODEL = True
# Raw strings: "\d" and "\m" are invalid escape sequences in a normal string
# literal (a warning today, an error in future Python versions). The runtime
# value is unchanged. NOTE(review): these are Windows-style relative paths.
TRAIN_IMG_DIR = r".\dataset\multi\multi_plant"
TRAIN_IMG_LABEL = r".\dataset\multi\multi_label"
