#### IMPORT LIBRARIES

In [1]:
import numpy as np
import h5py as h5

import torch
from torchvision import datasets, transforms
import torch.nn.functional as F
import torch.nn as nn
import torch.optim as optim
from torch.autograd import Variable
from torch.utils.tensorboard import SummaryWriter

import matplotlib.pyplot as plt
from importlib import reload, import_module

import glob
import os

import pdb
from PIL import Image as im
import _pickle as pickle


from functions import MyDataset, customTransform, get_variable, get_numpy, compute_gradient, psnr_1

#### DATASET PATH

In [2]:
if os.name == 'nt':
    dataset_file = r"C:\Users\mummu\Documents\Datasets\srinivasan\trainset\h5\8bit.h5"
    test_file    = r"C:\Users\mummu\Documents\Datasets\srinivasan\testset\h5\8bit.h5"
    model_file   = r"model\model.pt"
    network_file = r"network_revised"
    trainwr_file = r"runs\train"
    testwr_file  = r"runs\test"
elif os.name == 'posix':
    raise NotImplementedError

#### BASIC PARAMETERS

In [3]:
patch_size     = 192
batch_size     = 300
minibatch_size = 8
gamma_val      = 0.4
lfsize         = [372, 540, 7, 7]
num_workers    = 0
num_test       = 10
num_minibatch  = batch_size//minibatch_size
batch_affine   = True
num_epochs     = 10000

#### INITIALIZE FUNCTIONS

In [4]:
data_transform = transforms.Compose([transforms.ToTensor(), 
                                     transforms.Lambda(customTransform)])

train_dataset  = MyDataset(dataset_file, lfsize, data_transform)
test_dataset   = MyDataset(test_file, lfsize, data_transform)

train_loader   = torch.utils.data.DataLoader(train_dataset, batch_size=minibatch_size, num_workers=num_workers, shuffle=True)
test_loader    = torch.utils.data.DataLoader(train_dataset, batch_size=minibatch_size, num_workers=num_workers, shuffle=True)

#### LOOKING FOR SAVED MODEL

In [5]:
network_module = import_module(network_file)
reload(network_module)
Net = network_module.Net

net = Net((patch_size, patch_size), minibatch_size, lfsize, batchAffine=batch_affine)
if torch.cuda.is_available():
    print('##converting network to cuda-enabled')
    net.cuda()

try:
    checkpoint = torch.load(model_file)
    
    epoch_id = checkpoint['epoch']
    net.load_state_dict(checkpoint['model'].state_dict())
    print('Model successfully loaded.')
    
except:
    print('No model.')
    epoch_id = 0

##converting network to cuda-enabled
Model successfully loaded.


In [6]:
#def count_parameters(model): return list(name for name, param in model.named_parameters() if param.requires_grad == False)

In [7]:
def count_parameters(model): return sum(p.numel() for p in model.parameters() if p.requires_grad)

In [8]:
count_parameters(net)

1256649

#### TRAINING SETTINGS

In [9]:
criterion1 = nn.L1Loss()
criterion2 = nn.L1Loss()
optimizer = optim.Adam(net.parameters(), lr=0.001, betas=(0.9, 0.999))

In [10]:
def train_epoch():
    costs = []
    psnr_vec = []
            
    for batch_num in range(num_minibatch):
        
        # fetching training batch
        corners, pers, ind = next(iter(train_loader))
        
        # converting to trainable variables
        X_corners = get_variable(corners)
        T_view = get_variable(pers)
        p = get_variable(ind[:,0])
        q = get_variable(ind[:,-1])
                
        optimizer.zero_grad()
        
        # Forward pass
        O_view, _, _ = net(X_corners, p, q)
        
        # Computing batch loss
        batch_loss = criterion1(O_view, T_view) + .5*criterion2(compute_gradient(O_view),
                                                          compute_gradient(T_view))
        
        # Backpropagation
        batch_loss.backward()
        optimizer.step()

        # recording performance
        costs.append(get_numpy(batch_loss))
        net_out = get_numpy(O_view)
        Y = get_numpy(T_view)      
        psnr_vec.append([psnr_1(np.squeeze(net_out[i]), np.squeeze(Y[i])) for i in range(minibatch_size)])
    
        
    return np.mean(costs), np.mean(psnr_vec)

def eval_epoch():
    costs = []
    psnr_vec = []
    
    for batch_num in range(num_test):
        
        # fetching training batch
        corners, pers, ind = next(iter(test_loader))
        
        # converting to trainable variables
        X_corners = get_variable(corners)
        T_view = get_variable(pers)
        p = get_variable(ind[:,0])
        q = get_variable(ind[:,-1])

        with torch.no_grad():
            # Forward pass
            O_view, _, _ = net(X_corners, p, q)
            
            # Computing batch loss
            batch_loss = criterion1(O_view, T_view) + .5*criterion2(compute_gradient(O_view), compute_gradient(T_view))
            
            # recording performance
            costs.append(get_numpy(batch_loss))
            net_out = get_numpy(O_view)
            Y = get_numpy(T_view)
            psnr_vec.append([psnr_1(np.squeeze(net_out[i]), np.squeeze(Y[i])) for i in range(minibatch_size)])

    return np.mean(costs), np.mean(psnr_vec)

In [None]:
valid_accs, train_accs, test_accs = [], [], []

writer_train = SummaryWriter(trainwr_file)
writer_test  = SummaryWriter(testwr_file)

while epoch_id < num_epochs:
    epoch_id += 1
    
    try:   
        net.train()
        train_cost, train_psnr = train_epoch()
        
        net.eval()
        test_cost, test_psnr = eval_epoch()
        
        print("Epoch %d:" % epoch_id)     
        print("Epoch {0:0}, train_cost {1:.2}, psnr {2:.2}".format(epoch_id, train_cost, train_psnr))
        
        writer_train.add_scalar('psnr', train_psnr, epoch_id)
        writer_train.add_scalar('loss', train_cost, epoch_id)
        writer_test.add_scalar('psnr', test_psnr, epoch_id)
        writer_test.add_scalar('loss', test_cost, epoch_id)
        
        torch.save({'model': net, 'epoch': epoch_id}, model_file)
    
    except KeyboardInterrupt:
        print('\nKeyboardInterrupt')
        break



Epoch 302:
Epoch 302, train_cost 0.039, psnr 4e+01


  "type " + obj.__name__ + ". It won't be checked "
  "type " + obj.__name__ + ". It won't be checked "
  "type " + obj.__name__ + ". It won't be checked "
  "type " + obj.__name__ + ". It won't be checked "


Epoch 303:
Epoch 303, train_cost 0.038, psnr 4.1e+01
Epoch 304:
Epoch 304, train_cost 0.037, psnr 4.1e+01
Epoch 305:
Epoch 305, train_cost 0.041, psnr 4e+01
Epoch 306:
Epoch 306, train_cost 0.039, psnr 4.1e+01
Epoch 307:
Epoch 307, train_cost 0.039, psnr 4.1e+01
Epoch 308:
Epoch 308, train_cost 0.041, psnr 4e+01
Epoch 309:
Epoch 309, train_cost 0.039, psnr 4e+01
Epoch 310:
Epoch 310, train_cost 0.04, psnr 4e+01
Epoch 311:
Epoch 311, train_cost 0.044, psnr 4e+01
Epoch 312:
Epoch 312, train_cost 0.039, psnr 4.1e+01
Epoch 313:
Epoch 313, train_cost 0.038, psnr 4.1e+01
Epoch 314:
Epoch 314, train_cost 0.041, psnr 4e+01
Epoch 315:
Epoch 315, train_cost 0.041, psnr 4e+01
Epoch 316:
Epoch 316, train_cost 0.036, psnr 4.1e+01
Epoch 317:
Epoch 317, train_cost 0.04, psnr 4e+01
Epoch 318:
Epoch 318, train_cost 0.04, psnr 4e+01
Epoch 319:
Epoch 319, train_cost 0.04, psnr 4.1e+01
Epoch 320:
Epoch 320, train_cost 0.04, psnr 4e+01
Epoch 321:
Epoch 321, train_cost 0.039, psnr 4e+01
Epoch 322:
Epoch 322

Epoch 460, train_cost 0.039, psnr 4e+01
Epoch 461:
Epoch 461, train_cost 0.037, psnr 4.1e+01
Epoch 462:
Epoch 462, train_cost 0.041, psnr 4e+01
Epoch 463:
Epoch 463, train_cost 0.041, psnr 4e+01
Epoch 464:
Epoch 464, train_cost 0.036, psnr 4.1e+01
Epoch 465:
Epoch 465, train_cost 0.037, psnr 4.1e+01
Epoch 466:
Epoch 466, train_cost 0.038, psnr 4.1e+01
Epoch 467:
Epoch 467, train_cost 0.04, psnr 4.1e+01
Epoch 468:
Epoch 468, train_cost 0.039, psnr 4.1e+01
Epoch 469:
Epoch 469, train_cost 0.04, psnr 4.1e+01
Epoch 470:
Epoch 470, train_cost 0.041, psnr 4e+01
Epoch 471:
Epoch 471, train_cost 0.038, psnr 4.1e+01
Epoch 472:
Epoch 472, train_cost 0.041, psnr 4e+01
Epoch 473:
Epoch 473, train_cost 0.037, psnr 4.1e+01
Epoch 474:
Epoch 474, train_cost 0.04, psnr 4e+01
Epoch 475:
Epoch 475, train_cost 0.041, psnr 4e+01
Epoch 476:
Epoch 476, train_cost 0.041, psnr 4e+01
Epoch 477:
Epoch 477, train_cost 0.038, psnr 4.1e+01
