#### IMPORT LIBRARIES

In [1]:
import numpy as np
import h5py as h5

import torch
from torchvision import datasets, transforms
import torch.nn.functional as F
import torch.nn as nn
import torch.optim as optim
from torch.autograd import Variable
from torch.utils.tensorboard import SummaryWriter

import matplotlib.pyplot as plt
from importlib import reload, import_module

import glob
import os

import pdb
from PIL import Image as im
import _pickle as pickle


from functions import MyDataset, customTransform, get_variable, get_numpy, compute_gradient, psnr_1, sd_to_usd

#### DATASET PATH

In [2]:
if os.name == 'nt':
    dataset_file = r"C:\Users\mummu\Documents\Datasets\srinivasan\trainset\h5\8bit.h5"
    test_file    = r"C:\Users\mummu\Documents\Datasets\srinivasan\testset\h5\8bit.h5"
    model_file   = r"model\model.pt"
    network_file = r"network"
    trainwr_file = r"runs\train"
    testwr_file  = r"runs\test"
elif os.name == 'posix':
    raise NotImplementedError

#### BASIC PARAMETERS

In [3]:
patch_size     = 192
batch_size     = 300
minibatch_size = 8
gamma_val      = 0.4
lfsize         = [372, 540, 7, 7]
num_workers    = 0
num_test       = 10
num_minibatch  = batch_size//minibatch_size
batch_affine   = True
num_epochs     = 10000

#### INITIALIZE FUNCTIONS

In [4]:
data_transform = transforms.Compose([transforms.ToTensor(), 
                                     transforms.Lambda(customTransform)])

train_dataset  = MyDataset(dataset_file, lfsize, data_transform)
test_dataset   = MyDataset(test_file, lfsize, data_transform)

train_loader   = torch.utils.data.DataLoader(train_dataset, batch_size=minibatch_size, num_workers=num_workers, shuffle=True)
test_loader    = torch.utils.data.DataLoader(train_dataset, batch_size=minibatch_size, num_workers=num_workers, shuffle=True)

#### LOOKING FOR SAVED MODEL

In [5]:
network_module = import_module(network_file)
reload(network_module)
Net = network_module.Net

net = Net((patch_size, patch_size), minibatch_size, lfsize, batchAffine=batch_affine)
if torch.cuda.is_available():
    print('##converting network to cuda-enabled')
    net.cuda()

try:
    checkpoint = torch.load(model_file)
    
    epoch_id = checkpoint['epoch']
    net.load_state_dict(checkpoint['model'].state_dict())
    print('Model successfully loaded.')
    
except:
    print('No model.')
    epoch_id = 0

##converting network to cuda-enabled
Model successfully loaded.


In [6]:
#def count_parameters(model): return list(name for name, param in model.named_parameters() if param.requires_grad == False)

In [7]:
def count_parameters(model): return sum(p.numel() for p in model.parameters() if p.requires_grad)

In [8]:
count_parameters(net)

1256649

#### TRAINING SETTINGS

In [9]:
criterion1 = nn.L1Loss()
criterion2 = nn.L1Loss()
optimizer = optim.Adam(net.parameters(), lr=0.001, betas=(0.9, 0.999))

In [10]:
def train_epoch():
    costs = []
    psnr_vec = []
            
    for batch_num in range(num_minibatch):
        
        # fetching training batch
        corners, pers, ind = next(iter(train_loader))
        
        # converting to trainable variables
        X_corners = get_variable(corners)
        T_view = get_variable(pers)
        p = get_variable(ind[:,0])
        q = get_variable(ind[:,-1])
                
        optimizer.zero_grad()
        
        # Forward pass
        O_view, _, _ = net(X_corners, p, q)
        
        # Computing batch loss
        batch_loss = criterion1(O_view, T_view) + .5*criterion2(compute_gradient(O_view),
                                                          compute_gradient(T_view))
        
        # Backpropagation
        batch_loss.backward()
        optimizer.step()

        # recording performance
        costs.append(get_numpy(batch_loss))
        net_out = get_numpy(O_view)
        Y = get_numpy(T_view)      
        psnr_vec.append([psnr_1(sd_to_usd(np.squeeze(net_out[i])), sd_to_usd(np.squeeze(Y[i]))) for i in range(minibatch_size)])
    
        
    return np.mean(costs), np.mean(psnr_vec)

def eval_epoch():
    costs = []
    psnr_vec = []
    
    for batch_num in range(num_test):
        
        # fetching training batch
        corners, pers, ind = next(iter(test_loader))
        
        # converting to trainable variables
        X_corners = get_variable(corners)
        T_view = get_variable(pers)
        p = get_variable(ind[:,0])
        q = get_variable(ind[:,-1])

        with torch.no_grad():
            # Forward pass
            O_view, _, _ = net(X_corners, p, q)
            
            # Computing batch loss
            batch_loss = criterion1(O_view, T_view) + .5*criterion2(compute_gradient(O_view), compute_gradient(T_view))
            
            # recording performance
            costs.append(get_numpy(batch_loss))
            net_out = get_numpy(O_view)
            Y = get_numpy(T_view)
            psnr_vec.append([psnr_1(sd_to_usd(np.squeeze(net_out[i])), sd_to_usd(np.squeeze(Y[i]))) for i in range(minibatch_size)])

    return np.mean(costs), np.mean(psnr_vec)

In [None]:
valid_accs, train_accs, test_accs = [], [], []

writer_train = SummaryWriter(trainwr_file)
writer_test  = SummaryWriter(testwr_file)

while epoch_id < num_epochs:
    epoch_id += 1
    
    try:   
        net.train()
        train_cost, train_psnr = train_epoch()
        
        net.eval()
        test_cost, test_psnr = eval_epoch()
        
        print("Epoch %d:" % epoch_id)     
        print("Epoch {0:0}, train_cost {1:.2}, psnr {2:.2}".format(epoch_id, train_cost, train_psnr))
        
        writer_train.add_scalar('psnr', train_psnr, epoch_id)
        writer_train.add_scalar('loss', train_cost, epoch_id)
        writer_test.add_scalar('psnr', test_psnr, epoch_id)
        writer_test.add_scalar('loss', test_cost, epoch_id)
        
        torch.save({'model': net, 'epoch': epoch_id}, model_file)
    
    except KeyboardInterrupt:
        print('\nKeyboardInterrupt')
        break



Epoch 2018:
Epoch 2018, train_cost 0.037, psnr 4.1e+01


  "type " + obj.__name__ + ". It won't be checked "
  "type " + obj.__name__ + ". It won't be checked "
  "type " + obj.__name__ + ". It won't be checked "
  "type " + obj.__name__ + ". It won't be checked "


Epoch 2019:
Epoch 2019, train_cost 0.041, psnr 4e+01
Epoch 2020:
Epoch 2020, train_cost 0.037, psnr 4.1e+01
Epoch 2021:
Epoch 2021, train_cost 0.04, psnr 4e+01
Epoch 2022:
Epoch 2022, train_cost 0.039, psnr 4.1e+01
Epoch 2023:
Epoch 2023, train_cost 0.039, psnr 4.1e+01
Epoch 2024:
Epoch 2024, train_cost 0.04, psnr 4e+01
Epoch 2025:
Epoch 2025, train_cost 0.04, psnr 4.1e+01
Epoch 2026:
Epoch 2026, train_cost 0.04, psnr 4.1e+01
Epoch 2027:
Epoch 2027, train_cost 0.038, psnr 4.1e+01
Epoch 2028:
Epoch 2028, train_cost 0.04, psnr 4.1e+01
Epoch 2029:
Epoch 2029, train_cost 0.037, psnr 4.1e+01
Epoch 2030:
Epoch 2030, train_cost 0.038, psnr 4.1e+01
Epoch 2031:
Epoch 2031, train_cost 0.038, psnr 4.1e+01
Epoch 2032:
Epoch 2032, train_cost 0.039, psnr 4.1e+01
Epoch 2033:
Epoch 2033, train_cost 0.039, psnr 4.1e+01
Epoch 2034:
Epoch 2034, train_cost 0.037, psnr 4.1e+01
Epoch 2035:
Epoch 2035, train_cost 0.037, psnr 4.1e+01
Epoch 2036:
Epoch 2036, train_cost 0.039, psnr 4.1e+01
Epoch 2037:
Epoch 203

Epoch 2168, train_cost 0.039, psnr 4.1e+01
Epoch 2169:
Epoch 2169, train_cost 0.036, psnr 4.1e+01
Epoch 2170:
Epoch 2170, train_cost 0.037, psnr 4.1e+01
Epoch 2171:
Epoch 2171, train_cost 0.037, psnr 4.1e+01
Epoch 2172:
Epoch 2172, train_cost 0.038, psnr 4.1e+01
Epoch 2173:
Epoch 2173, train_cost 0.038, psnr 4.1e+01
Epoch 2174:
Epoch 2174, train_cost 0.039, psnr 4.1e+01
Epoch 2175:
Epoch 2175, train_cost 0.038, psnr 4.1e+01
Epoch 2176:
Epoch 2176, train_cost 0.037, psnr 4.1e+01
Epoch 2177:
Epoch 2177, train_cost 0.039, psnr 4.1e+01
Epoch 2178:
Epoch 2178, train_cost 0.038, psnr 4.1e+01
Epoch 2179:
Epoch 2179, train_cost 0.04, psnr 4.1e+01
Epoch 2180:
Epoch 2180, train_cost 0.037, psnr 4.1e+01
Epoch 2181:
Epoch 2181, train_cost 0.039, psnr 4.1e+01
Epoch 2182:
Epoch 2182, train_cost 0.036, psnr 4.1e+01
Epoch 2183:
Epoch 2183, train_cost 0.038, psnr 4.1e+01
Epoch 2184:
Epoch 2184, train_cost 0.04, psnr 4.1e+01
Epoch 2185:
Epoch 2185, train_cost 0.037, psnr 4.1e+01
Epoch 2186:
Epoch 2186, 