In [6]:
import os
import torch
import numpy as np
from torch.utils.data import Dataset, DataLoader
from torchvision import transforms, utils

In [7]:
import torch
import torch.nn as nn
import torchvision.transforms.functional as TF

class DoubleConv(nn.Module):
    def __init__(self, in_channels, out_channels):
        super(DoubleConv, self).__init__()
        self.conv = nn.Sequential(
            nn.Conv2d(in_channels, out_channels, 3, 1, 1, bias=False),
            nn.BatchNorm2d(out_channels),
            nn.ReLU(inplace=True),
            nn.Conv2d(out_channels, out_channels, 3, 1, 1, bias=False),
            nn.BatchNorm2d(out_channels),
            nn.ReLU(inplace=True),
        )

    def forward(self, x):
        return self.conv(x)

class UNET(nn.Module):
    def __init__(
            self, in_channels=3, out_channels=1, features=[64, 128, 256, 512],
    ):
        super(UNET, self).__init__()
        self.ups = nn.ModuleList()
        self.downs = nn.ModuleList()
        self.pool = nn.MaxPool2d(kernel_size=2, stride=2)

        # Down part of UNET
        for feature in features:
            self.downs.append(DoubleConv(in_channels, feature))
            in_channels = feature

        # Up part of UNET
        for feature in reversed(features):
            self.ups.append(
                nn.ConvTranspose2d(
                    feature*2, feature, kernel_size=2, stride=2,
                )
            )
            self.ups.append(DoubleConv(feature*2, feature))

        self.bottleneck = DoubleConv(features[-1], features[-1]*2)
        self.final_conv = nn.Conv2d(features[0], out_channels, kernel_size=1)

    def forward(self, x):
        skip_connections = []

        for down in self.downs:
            x = down(x)
            skip_connections.append(x)
            x = self.pool(x)

        x = self.bottleneck(x)
        skip_connections = skip_connections[::-1]

        for idx in range(0, len(self.ups), 2):
            x = self.ups[idx](x)
            skip_connection = skip_connections[idx//2]

            if x.shape != skip_connection.shape:
                x = TF.resize(x, size=skip_connection.shape[2:])

            concat_skip = torch.cat((skip_connection, x), dim=1)
            x = self.ups[idx+1](concat_skip)

        return self.final_conv(x)

def test():
    x = torch.randn((3, 1, 161, 161))
    model = UNET(in_channels=1, out_channels=1)
    preds = model(x)
    assert preds.shape == x.shape

In [8]:
import os
import pandas as pd
from torchvision.io import read_image

class nails_data(Dataset):
    def __init__(self, img_dir, mask_dir, transform=None, target_transform=None):
        self.img_dir = img_dir
        self.mask_dir = mask_dir
        self.img_paths = os.listdir(img_dir)
        self.mask_paths = os.listdir(mask_dir)
        self.transform = transform
        self.target_transform = target_transform

    def __len__(self):
        return len(self.img_paths)

    def __getitem__(self, idx):
        img_path = os.path.join(self.img_dir, self.img_paths[idx])
        mask_path = os.path.join(self.mask_dir, self.mask_paths[idx])
        image = read_image(img_path)
        mask = read_image(mask_path)
        if self.transform:
            image = self.transform(image)
        if self.target_transform:
            mask = self.target_transform(mask)
        return image, mask

In [9]:
#paths
im_train = r"C:\Users\Alihan\Desktop\segmentation\nails\train"
im_test = r"C:\Users\Alihan\Desktop\segmentation\nails\test"

mask_train = r"C:\Users\Alihan\Desktop\segmentation\target\train"
mask_test = r"C:\Users\Alihan\Desktop\segmentation\target\test"

transform_img = transforms.Compose([
transforms.CenterCrop(500),
transforms.ConvertImageDtype(torch.float)])

transform_mask = transforms.Compose([transforms.Grayscale(num_output_channels=1),
transforms.CenterCrop(500),
transforms.ConvertImageDtype(torch.float)])

In [10]:
X = nails_data(im_train, mask_train, transform_img, transform_mask)
y = nails_data(im_test, mask_test, transform_img, transform_mask)

In [17]:
train_loader = DataLoader(X, batch_size=2, shuffle=True)
test_loader = DataLoader(y, batch_size=2, shuffle=True)
model = UNET(3,1)

In [21]:
optimizer = torch.optim.Adam(model.parameters(), lr=3e-4)
criterion = nn.BCEWithLogitsLoss()

In [23]:
epochs=1
for epoch in range(epochs):
    for i, data in enumerate(train_loader, 0):
        image, mask = data

        print(image.shape, mask.shape)
        optimizer.zero_grad()

        # Compute the forward pass
        outputs = model(image)

        # Compute the loss function
        loss = criterion(outputs, mask)

        # Compute the gradients
        loss.backward()

        # Update the weights
        optimizer.step()

torch.Size([2, 3, 500, 500]) torch.Size([2, 1, 500, 500])
torch.Size([2, 3, 500, 500]) torch.Size([2, 1, 500, 500])
torch.Size([2, 3, 500, 500]) torch.Size([2, 1, 500, 500])
torch.Size([2, 3, 500, 500]) torch.Size([2, 1, 500, 500])
torch.Size([2, 3, 500, 500]) torch.Size([2, 1, 500, 500])
torch.Size([2, 3, 500, 500]) torch.Size([2, 1, 500, 500])
torch.Size([2, 3, 500, 500]) torch.Size([2, 1, 500, 500])
torch.Size([2, 3, 500, 500]) torch.Size([2, 1, 500, 500])
torch.Size([2, 3, 500, 500]) torch.Size([2, 1, 500, 500])
torch.Size([2, 3, 500, 500]) torch.Size([2, 1, 500, 500])
torch.Size([2, 3, 500, 500]) torch.Size([2, 1, 500, 500])
torch.Size([2, 3, 500, 500]) torch.Size([2, 1, 500, 500])
torch.Size([2, 3, 500, 500]) torch.Size([2, 1, 500, 500])
torch.Size([2, 3, 500, 500]) torch.Size([2, 1, 500, 500])
torch.Size([2, 3, 500, 500]) torch.Size([2, 1, 500, 500])
torch.Size([2, 3, 500, 500]) torch.Size([2, 1, 500, 500])
torch.Size([2, 3, 500, 500]) torch.Size([2, 1, 500, 500])
torch.Size([2,