In [1]:
# For plotting
import numpy as np
import matplotlib.pyplot as plt
import matplotlib.image as mpimg
%matplotlib inline
# For conversion
from skimage.color import lab2rgb, rgb2lab, rgb2gray
from skimage import io
# For everything
import torch
import torch.nn as nn
import torch.nn.functional as F
# For our model
import torchvision
import torchvision.models as models
from torchvision import datasets, transforms
from PIL import Image
# For utilities
import os, shutil, time

In [2]:
# Load the TensorBoard notebook extension and open a dashboard that reads
# event files from the local `runs` directory.
%load_ext tensorboard
%tensorboard --logdir=runs

In [26]:
from torch.utils.tensorboard import SummaryWriter
# Shared TensorBoard writer: train() and validate() log their per-epoch
# average loss to it. No log_dir is given, so the library default is used --
# presumably a sub-directory of `runs`, which is where the dashboard cell
# points (TODO confirm).
writer = SummaryWriter()

In [27]:
# Check if GPU is available. Later cells read this flag to decide whether the
# model, the loss and every batch are moved to CUDA.
use_gpu = torch.cuda.is_available()
print(use_gpu)

True


In [29]:
SIZE = 64  # side length, in pixels, that every image is resized to


class LabImageFolder(torch.utils.data.Dataset):
    """Dataset of (grayscale, ab) tensor pairs read from a flat image folder.

    Every regular file directly inside ``paths`` is treated as an image
    (sub-directories are not visited). Each item is opened as RGB, resized to
    ``SIZE x SIZE`` and, for the training split, randomly flipped horizontally.

    Items are returned as ``(img_gray, img_ab)``:

    * ``img_gray`` -- float tensor of shape ``(1, SIZE, SIZE)`` produced by
      ``rgb2gray``.
    * ``img_ab`` -- float tensor of shape ``(2, SIZE, SIZE)`` holding the Lab
      a/b channels encoded as ``(value + 128) / 255``.

    Args:
        paths: directory that contains the image files.
        split: ``'train'`` (resize + random horizontal flip) or ``'val'``
            (resize only).

    Raises:
        ValueError: if ``split`` is neither ``'train'`` nor ``'val'``.
    """

    _VALID_SPLITS = ('train', 'val')

    def __init__(self, paths, split='train'):
        # Fail fast: an unknown split used to leave ``self.transforms`` unset
        # and only surfaced as an AttributeError on the first __getitem__.
        if split not in self._VALID_SPLITS:
            raise ValueError(
                "split must be one of {}, got {!r}".format(self._VALID_SPLITS, split))

        if split == 'train':
            self.transforms = transforms.Compose([
                transforms.Resize((SIZE, SIZE), transforms.InterpolationMode.BICUBIC),
                # Crop size equals the resized image size; kept so the
                # pipeline is unchanged from earlier runs.
                transforms.RandomCrop(SIZE),
                transforms.RandomHorizontalFlip(),
            ])
        else:  # 'val'
            self.transforms = transforms.Compose([
                transforms.Resize((SIZE, SIZE), transforms.InterpolationMode.BICUBIC),
                transforms.RandomCrop(SIZE),
            ])

        self.split = split
        self.size = SIZE
        # os.listdir returns entries in arbitrary order; sorting makes the
        # index -> file mapping (and therefore the saved validation samples)
        # reproducible across machines and runs.
        self.paths = sorted(
            os.path.join(paths, name)
            for name in os.listdir(paths)
            if os.path.isfile(os.path.join(paths, name))
        )

    def __getitem__(self, index):
        """Load image ``index`` and return ``(img_gray, img_ab)`` tensors."""
        img = Image.open(self.paths[index]).convert("RGB")
        img_original = np.asarray(self.transforms(img))

        # Lab conversion; only the two chroma channels are kept as the target.
        img_lab = rgb2lab(img_original)
        img_lab = (img_lab + 128) / 255
        img_ab = img_lab[:, :, 1:3]
        img_ab = torch.from_numpy(img_ab.transpose((2, 0, 1))).float()  # HWC -> CHW

        # NOTE(review): the network input is rgb2gray luminance rather than the
        # Lab L channel, while to_rgb() later treats it as L / 100 -- confirm
        # this approximation is intended.
        img_gray = rgb2gray(img_original)
        img_gray = torch.from_numpy(img_gray).unsqueeze(0).float()
        return img_gray, img_ab

    def __len__(self):
        """Number of image files found in the folder."""
        return len(self.paths)

In [30]:
# Training data: reshuffled every epoch.
batch_size = 128
train_imagefolder = LabImageFolder(
    '../../datasets/dataset/train/colour',
    split='train',
)
train_loader = torch.utils.data.DataLoader(
    train_imagefolder,
    batch_size=batch_size,
    shuffle=True,
)

# Validation data: read from the `test` folder, in fixed order.
val_imagefolder = LabImageFolder(
    '../../datasets/dataset/test/colour',
    split='val',
)
val_loader = torch.utils.data.DataLoader(
    val_imagefolder,
    batch_size=batch_size,
    shuffle=False,
)

In [31]:
# Hyper-parameters shared by every layer of ColorizationNet.
kernel_size = 3
stride_en = 2       # encoder convolutions halve the spatial size
stride_de = 1       # decoder transposed convolutions keep the spatial size
padding = 1
scale_factor = 2    # each Upsample doubles the spatial size
padding_mode = 'zeros'


class ColorizationNet(nn.Module):
    """Small convolutional encoder/decoder mapping 1 channel to 2 channels.

    The encoder is three stride-``stride_en`` convolutions (1 -> 16 -> 32 -> 64
    channels), each followed by ReLU. The decoder is four stride-``stride_de``
    transposed convolutions (64 -> 32 -> 16 -> 8 -> 2 channels) interleaved
    with three ``Upsample`` layers. No activation is applied to the output.

    Args:
        input_size: accepted for compatibility with existing callers; it is
            not read anywhere in this class.
    """

    def __init__(self, input_size=128):
        super().__init__()

        # Local factories so the channel progression below reads at a glance.
        def down(c_in, c_out):
            return nn.Conv2d(c_in, c_out, kernel_size=kernel_size, stride=stride_en,
                             padding=padding, padding_mode=padding_mode)

        def refine(c_in, c_out):
            return nn.ConvTranspose2d(c_in, c_out, kernel_size=kernel_size, stride=stride_de,
                                      padding=padding, padding_mode=padding_mode)

        def grow():
            return nn.Upsample(scale_factor=scale_factor)

        # Layer positions inside each Sequential are part of the checkpoint
        # format (state_dict keys), so the order must not change.
        # BatchNorm after each convolution was tried and is currently disabled.
        self.encoder = nn.Sequential(
            down(1, 16), nn.ReLU(),
            down(16, 32), nn.ReLU(),
            down(32, 64), nn.ReLU(),
        )

        self.decoder = nn.Sequential(
            refine(64, 32), nn.ReLU(), grow(),
            refine(32, 16), nn.ReLU(), grow(),
            refine(16, 8), nn.ReLU(),
            refine(8, 2), grow(),
        )

    def forward(self, input):
        """Encode the grayscale batch, then decode it into two colour channels."""
        features = self.encoder(input)
        return self.decoder(features)

In [32]:
# Instantiate the network with its default arguments (weights are freshly initialised).
model = ColorizationNet()

In [33]:
# Mean squared error between the predicted and the target ab channels.
criterion = nn.MSELoss()

In [34]:
# Adam over all model parameters.
# NOTE(review): in the recorded run the validation loss sits at ~0.0073 from
# epoch 2 onward and never improves; lr=1e-2 may be too aggressive for this
# model -- worth retrying with a smaller value.
optimizer = torch.optim.Adam(model.parameters(), lr=1e-2)

In [35]:
# Move model and loss function to GPU when one is available.
if use_gpu: 
    criterion = criterion.cuda()
    model = model.cuda()

In [36]:
from torchsummary import summary

# Print a per-layer table of output shapes and parameter counts for a
# single-channel 64x64 input.
summary(model, (1, 64, 64))

----------------------------------------------------------------
        Layer (type)               Output Shape         Param #
            Conv2d-1           [-1, 16, 32, 32]             160
              ReLU-2           [-1, 16, 32, 32]               0
            Conv2d-3           [-1, 32, 16, 16]           4,640
              ReLU-4           [-1, 32, 16, 16]               0
            Conv2d-5             [-1, 64, 8, 8]          18,496
              ReLU-6             [-1, 64, 8, 8]               0
   ConvTranspose2d-7             [-1, 32, 8, 8]          18,464
              ReLU-8             [-1, 32, 8, 8]               0
          Upsample-9           [-1, 32, 16, 16]               0
  ConvTranspose2d-10           [-1, 16, 16, 16]           4,624
             ReLU-11           [-1, 16, 16, 16]               0
         Upsample-12           [-1, 16, 32, 32]               0
  ConvTranspose2d-13            [-1, 8, 32, 32]           1,160
             ReLU-14            [-1, 8,

In [37]:
class AverageMeter(object):
    """Running-average tracker (a handy class from the PyTorch ImageNet tutorial).

    Attributes:
        val: the most recent value passed to ``update``.
        sum: weighted sum of all values seen since the last ``reset``.
        count: total weight seen since the last ``reset``.
        avg: ``sum / count``.
    """

    def __init__(self):
        self.reset()

    def reset(self):
        """Set every statistic back to zero."""
        for field in ('val', 'avg', 'sum', 'count'):
            setattr(self, field, 0)

    def update(self, val, n=1):
        """Record ``val`` as observed ``n`` times and refresh the average."""
        self.val = val
        self.sum += val * n
        self.count += n
        self.avg = self.sum / self.count

def to_rgb(grayscale_input, ab_input, save_path=None, save_name=None):
    """Save a grayscale image and its colorized version to disk.

    Args:
        grayscale_input: tensor of shape (1, H, W) with values in [0, 1]; it is
            multiplied by 100 and used as the Lab L channel. ``.numpy()`` is
            called on it directly, so it must live on the CPU.
        ab_input: tensor of shape (2, H, W) holding the a/b channels encoded as
            ``(value + 128) / 255``; same CPU requirement.
        save_path: dict of the form
            ``{'grayscale': '/path/', 'colorized': '/path/'}``. Each directory
            string is concatenated with ``save_name`` as-is, so it must end
            with a path separator.
        save_name: file name (including extension) used for both images.

    Returns:
        None. Nothing is computed or written unless both ``save_path`` and
        ``save_name`` are given.
    """
    # Nothing to write -> skip the Lab->RGB conversion entirely.
    if save_path is None or save_name is None:
        return

    # Stack L and ab into one (3, H, W) array, then move channels last for skimage.
    color_image = torch.cat((grayscale_input, ab_input), 0).numpy()
    color_image = color_image.transpose((1, 2, 0))
    # Undo the training-time encoding: L back to [0, 100], ab back to [-128, 127].
    color_image[:, :, 0:1] = color_image[:, :, 0:1] * 100
    color_image[:, :, 1:3] = color_image[:, :, 1:3] * 255 - 128
    color_image = lab2rgb(color_image.astype(np.float64))

    grayscale_image = grayscale_input.squeeze().numpy()
    # Pin the colour limits to the [0, 1] input range. Without vmin/vmax,
    # imsave rescales to each image's own min/max and the saved grayscale
    # picture is contrast-stretched.
    plt.imsave(arr=grayscale_image, fname='{}{}'.format(save_path['grayscale'], save_name),
               cmap='gray', vmin=0, vmax=1)
    plt.imsave(arr=color_image, fname='{}{}'.format(save_path['colorized'], save_name))

In [38]:
# Output directories for the sample images written during validation.
# The trailing slash matters: to_rgb() joins directory and file name by plain
# string concatenation.
color_imgs = 'outputs/color/'
gray_imgs = 'outputs/gray/'

In [39]:
def validate(val_loader, model, criterion, save_images, epoch):
    """Evaluate ``model`` on ``val_loader`` and return the average loss.

    The model is put in eval mode. Autograd is not disabled here; the callers
    in this notebook wrap the call in ``torch.no_grad()``.

    Args:
        val_loader: iterable yielding ``(gray, ab)`` batches.
        model: network mapping a gray batch to predicted ab channels.
        criterion: loss comparing predicted and target ab.
        save_images: when truthy, up to 10 samples of the first batch are
            written to the ``gray_imgs`` / ``color_imgs`` directories.
        epoch: used in the saved file names; the loss is logged to the global
            TensorBoard ``writer`` as "Loss/test" only when ``epoch >= 0``.

    Returns:
        The sample-weighted average loss over the whole loader.
    """
    loss_meter = AverageMeter()
    model.eval()

    for batch_idx, (gray, ab) in enumerate(val_loader):
        if use_gpu:
            gray = gray.cuda()
            ab = ab.cuda()

        # Forward pass and loss bookkeeping (weighted by batch size).
        output_ab = model(gray)
        loss = criterion(output_ab, ab)
        loss_meter.update(loss.item(), gray.size(0))

        # Only the first batch contributes sample images.
        if save_images and batch_idx == 0:
            save_path = {'grayscale': gray_imgs, 'colorized': color_imgs}
            n_samples = min(len(output_ab), 10)  # save at most 10 images
            for j in range(n_samples):
                save_name = 'img-{}-epoch-{}.jpg'.format(j, epoch)
                to_rgb(gray[j].cpu(), ab_input=output_ab[j].detach().cpu(),
                       save_path=save_path, save_name=save_name)

    print('Validate: Loss {loss.val:.4f} ({loss.avg:.4f})\t'.format(
         loss=loss_meter))
    print('Finished validation.')

    if epoch >= 0:
        writer.add_scalar("Loss/test", loss_meter.avg, epoch)
    return loss_meter.avg

In [41]:
def train(train_loader, model, criterion, optimizer, epoch):
    """Run one optimisation pass over ``train_loader``.

    Args:
        train_loader: iterable yielding ``(gray, ab)`` batches.
        model: network mapping a gray batch to predicted ab channels.
        criterion: loss comparing predicted and target ab.
        optimizer: optimizer stepping the model's parameters.
        epoch: epoch index used in the printed messages; the average loss is
            logged to the global TensorBoard ``writer`` as "Loss/train" only
            when ``epoch >= 0``.

    Returns:
        None.
    """
    print(f'Starting training epoch {epoch}')
    _loss = AverageMeter()
    model.train()

    for gray, ab in train_loader:
        if use_gpu:
            gray = gray.cuda()
            ab = ab.cuda()

        # Standard step: clear old gradients, forward, backward, update.
        optimizer.zero_grad()
        prediction = model(gray)
        batch_loss = criterion(prediction, ab)
        batch_loss.backward()
        optimizer.step()

        # Weight the running average by the number of samples in the batch.
        _loss.update(batch_loss.item(), gray.size(0))

    print(f'Epoch: {epoch}, Loss {_loss.val:.4f} ({_loss.avg:.4f})')
    print(f'Finished training epoch {epoch}')

    if epoch >= 0:
        writer.add_scalar("Loss/train", _loss.avg, epoch)

In [42]:
# Run parameters
epochs = 250
save_images = True
best_losses = 1e10  # sentinel: any real validation loss is smaller
checkpoints = 'checkpoints'

# Make sure every output folder exists before training starts
os.makedirs(checkpoints, exist_ok=True)
os.makedirs(gray_imgs, exist_ok=True)
os.makedirs(color_imgs, exist_ok=True)

In [43]:
# Train model
# `losses` and `best_losses` stay defined after the loop; a later cell reads `losses`.
for epoch in range(epochs):
    # Train for one epoch, then validate
    train(train_loader, model, criterion, optimizer, epoch)
    # Gradients are not needed while evaluating.
    with torch.no_grad():
        losses = validate(val_loader, model, criterion, save_images, epoch)
    # Save a checkpoint whenever the validation loss improves. The epoch number
    # is part of the file name, so each improvement creates a new file and
    # earlier checkpoints are kept.
    if losses < best_losses:
        best_losses = losses
        torch.save(model.state_dict(), '{}/model-epoch-{}-losses-{:.3f}.pth'.format(checkpoints,epoch+1,losses))


    # Always keep the weights of the final epoch, whatever its validation loss.
    if epoch == epochs - 1:
        torch.save(model.state_dict(), '{}/model-epoch-{}-last-losses-{:.3f}.pth'.format(checkpoints,epoch+1,losses))


Starting training epoch 0
Epoch: 0, Loss 0.0112 (0.2320)
Finished training epoch 0
Validate: Loss 0.0108 (0.0108)	
Finished validation.
Starting training epoch 1
Epoch: 1, Loss 0.0076 (0.0100)
Finished training epoch 1
Validate: Loss 0.0082 (0.0083)	
Finished validation.
Starting training epoch 2
Epoch: 2, Loss 0.0070 (0.0078)
Finished training epoch 2
Validate: Loss 0.0072 (0.0073)	
Finished validation.
Starting training epoch 3
Epoch: 3, Loss 0.0071 (0.0076)
Finished training epoch 3
Validate: Loss 0.0071 (0.0073)	
Finished validation.
Starting training epoch 4
Epoch: 4, Loss 0.0071 (0.0076)
Finished training epoch 4
Validate: Loss 0.0071 (0.0073)	
Finished validation.
Starting training epoch 5
Epoch: 5, Loss 0.0072 (0.0076)
Finished training epoch 5
Validate: Loss 0.0072 (0.0073)	
Finished validation.
Starting training epoch 6
Epoch: 6, Loss 0.0074 (0.0076)
Finished training epoch 6
Validate: Loss 0.0072 (0.0074)	
Finished validation.
Starting training epoch 7
Epoch: 7, Loss 0.0077 

Epoch: 59, Loss 0.0076 (0.0076)
Finished training epoch 59
Validate: Loss 0.0072 (0.0073)	
Finished validation.
Starting training epoch 60
Epoch: 60, Loss 0.0076 (0.0076)
Finished training epoch 60
Validate: Loss 0.0072 (0.0074)	
Finished validation.
Starting training epoch 61
Epoch: 61, Loss 0.0077 (0.0076)
Finished training epoch 61
Validate: Loss 0.0072 (0.0073)	
Finished validation.
Starting training epoch 62
Epoch: 62, Loss 0.0062 (0.0076)
Finished training epoch 62
Validate: Loss 0.0072 (0.0073)	
Finished validation.
Starting training epoch 63
Epoch: 63, Loss 0.0079 (0.0076)
Finished training epoch 63
Validate: Loss 0.0071 (0.0073)	
Finished validation.
Starting training epoch 64
Epoch: 64, Loss 0.0064 (0.0076)
Finished training epoch 64
Validate: Loss 0.0071 (0.0073)	
Finished validation.
Starting training epoch 65
Epoch: 65, Loss 0.0077 (0.0076)
Finished training epoch 65
Validate: Loss 0.0073 (0.0074)	
Finished validation.
Starting training epoch 66
Epoch: 66, Loss 0.0083 (0.0

Epoch: 118, Loss 0.0062 (0.0076)
Finished training epoch 118
Validate: Loss 0.0072 (0.0073)	
Finished validation.
Starting training epoch 119
Epoch: 119, Loss 0.0087 (0.0076)
Finished training epoch 119
Validate: Loss 0.0072 (0.0073)	
Finished validation.
Starting training epoch 120
Epoch: 120, Loss 0.0074 (0.0076)
Finished training epoch 120
Validate: Loss 0.0071 (0.0073)	
Finished validation.
Starting training epoch 121
Epoch: 121, Loss 0.0075 (0.0076)
Finished training epoch 121
Validate: Loss 0.0072 (0.0073)	
Finished validation.
Starting training epoch 122
Epoch: 122, Loss 0.0078 (0.0076)
Finished training epoch 122
Validate: Loss 0.0071 (0.0073)	
Finished validation.
Starting training epoch 123
Epoch: 123, Loss 0.0085 (0.0076)
Finished training epoch 123
Validate: Loss 0.0073 (0.0074)	
Finished validation.
Starting training epoch 124
Epoch: 124, Loss 0.0068 (0.0076)
Finished training epoch 124
Validate: Loss 0.0073 (0.0073)	
Finished validation.
Starting training epoch 125
Epoch:

Epoch: 176, Loss 0.0085 (0.0076)
Finished training epoch 176
Validate: Loss 0.0071 (0.0073)	
Finished validation.
Starting training epoch 177
Epoch: 177, Loss 0.0076 (0.0076)
Finished training epoch 177
Validate: Loss 0.0072 (0.0073)	
Finished validation.
Starting training epoch 178
Epoch: 178, Loss 0.0067 (0.0076)
Finished training epoch 178
Validate: Loss 0.0071 (0.0073)	
Finished validation.
Starting training epoch 179
Epoch: 179, Loss 0.0078 (0.0076)
Finished training epoch 179
Validate: Loss 0.0072 (0.0074)	
Finished validation.
Starting training epoch 180
Epoch: 180, Loss 0.0071 (0.0076)
Finished training epoch 180
Validate: Loss 0.0071 (0.0073)	
Finished validation.
Starting training epoch 181
Epoch: 181, Loss 0.0078 (0.0076)
Finished training epoch 181
Validate: Loss 0.0072 (0.0073)	
Finished validation.
Starting training epoch 182
Epoch: 182, Loss 0.0073 (0.0076)
Finished training epoch 182
Validate: Loss 0.0072 (0.0073)	
Finished validation.
Starting training epoch 183
Epoch:

Epoch: 234, Loss 0.0077 (0.0076)
Finished training epoch 234
Validate: Loss 0.0072 (0.0073)	
Finished validation.
Starting training epoch 235
Epoch: 235, Loss 0.0080 (0.0076)
Finished training epoch 235
Validate: Loss 0.0072 (0.0073)	
Finished validation.
Starting training epoch 236
Epoch: 236, Loss 0.0076 (0.0076)
Finished training epoch 236
Validate: Loss 0.0074 (0.0074)	
Finished validation.
Starting training epoch 237
Epoch: 237, Loss 0.0070 (0.0076)
Finished training epoch 237
Validate: Loss 0.0073 (0.0073)	
Finished validation.
Starting training epoch 238
Epoch: 238, Loss 0.0078 (0.0076)
Finished training epoch 238
Validate: Loss 0.0072 (0.0073)	
Finished validation.
Starting training epoch 239
Epoch: 239, Loss 0.0069 (0.0076)
Finished training epoch 239
Validate: Loss 0.0071 (0.0073)	
Finished validation.
Starting training epoch 240
Epoch: 240, Loss 0.0073 (0.0076)
Finished training epoch 240
Validate: Loss 0.0071 (0.0073)	
Finished validation.
Starting training epoch 241
Epoch:

<Figure size 432x288 with 0 Axes>

In [44]:
# Save the current weights once more; relies on `losses` left over from the
# training-loop cell.
# NOTE(review): the name expands to "model-epoch-last-last-losses-<loss>.pth";
# the doubled "last" looks unintentional.
torch.save(model.state_dict(), '{}/model-epoch-{}-last-losses-{:.3f}.pth'.format(checkpoints,"last",losses))

In [None]:
# Validate
# epoch=-1 skips the TensorBoard scalar (validate() only logs when epoch >= 0);
# sample images are written as img-<j>-epoch--1.jpg.
save_images = True
with torch.no_grad():
    validate(val_loader, model, criterion, save_images, -1)

In [None]:
# # Show images (disabled: `best_epoch` is not defined in any cell shown in this notebook)
# image_pairs = []

# for i in range(10):
#     image_pairs.append((f'{color_imgs}img-{i}-epoch-{best_epoch}.jpg', f'{gray_imgs}img-{i}-epoch-{best_epoch}.jpg'))
    
# for c, g in image_pairs:
#   color = mpimg.imread(c)
#   gray  = mpimg.imread(g)
#   f, axarr = plt.subplots(1, 2)
#   f.set_size_inches(15, 15)
#   axarr[0].imshow(gray, cmap='gray')
#   axarr[1].imshow(color)
#   axarr[0].axis('off'), axarr[1].axis('off')
#   plt.show()