### 1. Dependencies

In [1]:
import torch
from torch.utils.data import Dataset, DataLoader
from torchvision import transforms
from torch.autograd import Variable
import torch.optim as optim
import torch.nn as nn
import torch.nn.functional as F
from torch.nn import DataParallel

import time
import os
import numpy as np
import json
import cv2
from PIL import Image, ImageOps
import random
from tqdm import tqdm
import operator
import itertools
from scipy.io import  loadmat
import logging
from scipy import signal

from utils import data_transforms
from utils import get_paste_kernel, kernel_map
from utils_logging import setup_logger

### 2. Choose between Recasens or GazeNet

- The two models are interchangeable: to use the Recasens model, import from
`models.recasens`, `dataloader.recasens`, `training.train_recasens`, etc.
- To use GazeNet instead, replace those imports with
`models.gazenet`, `dataloader.gazenet`, `training.train_gazenet`.

In [2]:
from models.gazenet import GazeNet
from models.__init__ import save_checkpoint, resume_checkpoint
from dataloader.gazenet import GooDataset, GazeDataset
from training.train_gazenet import train, test, GazeOptimizer

In [3]:
# Notebook-wide logger. Per the project's convention it saves the training
# and test errors to a .log file (configured here as ./logs/train_gazenet_gooreal_.log).
logger = setup_logger(
    name='first_logger',
    log_dir='./logs/',
    log_file='train_gazenet_gooreal_.log',
    log_format='%(asctime)s %(levelname)s %(message)s',
    verbose=True,
)

### 3. Dataloaders
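- Choose between `GazeDataset` (GazeFollow dataset) and `GooDataset` (GOO-Synth / GOO-Real), and run only the matching dataloader cell below; each cell overwrites the same `train_data_loader` / `test_data_loader` variables.
- Set the paths to the image directories and to the annotation (pickle) files. For GazeFollow, `images_dir` and `test_images_dir` should be the same path: the directory that contains both the train and test folders.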

In [4]:
# Dataloaders for GazeFollow
batch_size = 32
workers = 12
testbatchsize = 16

# Root folder of the GazeFollow data. Set the GAZEFOLLOW_DIR environment
# variable to use a copy stored elsewhere; when it is unset (or empty) the
# original hard-coded location is used, so existing setups keep working.
# os.path.join(root, '') guarantees the trailing separator the original
# directory strings carried.
gazefollow_root = os.path.join(
    os.environ.get('GAZEFOLLOW_DIR') or '/home/eee198/Documents/datasets/GazeFollowData/',
    '',
)

# Train and test images live under the same root; only the annotation
# files differ between the two splits.
images_dir = gazefollow_root
pickle_path = os.path.join(gazefollow_root, 'train_annotations.mat')
test_images_dir = gazefollow_root
test_pickle_path = os.path.join(gazefollow_root, 'test_annotations.mat')

# Training split: shuffled every epoch.
train_set = GazeDataset(images_dir, pickle_path, 'train')
train_data_loader = DataLoader(train_set, batch_size=batch_size, shuffle=True, num_workers=workers)

# Test split: fixed order so evaluation runs are comparable.
val_set = GazeDataset(test_images_dir, test_pickle_path, 'test')
test_data_loader = DataLoader(val_set, batch_size=testbatchsize, shuffle=False, num_workers=workers)

In [4]:
# Dataloaders for GOO-Synth
batch_size = 32
workers = 12
testbatchsize = 32

# Root folder of the GOO-Synth data. Set the GOOSYNTH_DIR environment
# variable to use a copy stored elsewhere; when it is unset (or empty) the
# original hard-coded location is used, so existing setups keep working.
goosynth_root = os.path.join(os.environ.get('GOOSYNTH_DIR') or '/hdd/HENRI/goosynth/', '')

# A trailing '' in os.path.join keeps the trailing separator that the
# original directory strings carried.
images_dir = os.path.join(goosynth_root, '1person', 'GazeDatasets', '')
pickle_path = os.path.join(goosynth_root, 'picklefiles', 'trainpickle2to19human.pickle')
test_images_dir = os.path.join(goosynth_root, 'test', '')
test_pickle_path = os.path.join(goosynth_root, 'picklefiles', 'testpickle120.pickle')

# Training split: shuffled every epoch.
train_set = GooDataset(images_dir, pickle_path, 'train')
train_data_loader = DataLoader(train_set, batch_size=batch_size, shuffle=True, num_workers=workers)

# Test split: fixed order so evaluation runs are comparable.
val_set = GooDataset(test_images_dir, test_pickle_path, 'test')
test_data_loader = DataLoader(val_set, batch_size=testbatchsize, shuffle=False, num_workers=workers)

==> Number of Images: 172800
==> Number of Images: 19200


In [4]:
# Dataloaders for GOO-Real
batch_size = 32
workers = 12
testbatchsize = 32

# Root folder of the GOO-Real data. Set the GOOREAL_DIR environment
# variable to use a copy stored elsewhere; when it is unset (or empty) the
# original hard-coded location is used, so existing setups keep working.
gooreal_root = os.path.join(
    os.environ.get('GOOREAL_DIR') or '/home/eee198/Documents/datasets/GOOReal/',
    '',
)

# Train and test splits read from the same image folder; only the
# annotation pickles differ. The trailing '' keeps the trailing separator
# that the original directory strings carried.
images_dir = os.path.join(gooreal_root, 'finalrealdatasetImgsV2', '')
pickle_path = os.path.join(gooreal_root, 'oneshotrealhumans.pickle')
test_images_dir = os.path.join(gooreal_root, 'finalrealdatasetImgsV2', '')
test_pickle_path = os.path.join(gooreal_root, 'testrealhumans.pickle')

# Training split: shuffled every epoch.
train_set = GooDataset(images_dir, pickle_path, 'train')
train_data_loader = DataLoader(train_set, batch_size=batch_size, shuffle=True, num_workers=workers)

# Test split: fixed order so evaluation runs are comparable.
val_set = GooDataset(test_images_dir, test_pickle_path, 'test')
test_data_loader = DataLoader(val_set, batch_size=testbatchsize, shuffle=False, num_workers=workers)

==> Number of Images: 2451
==> Number of Images: 2156


### 4. Load Model and Set Training Hyperparameters
- For GazeFollow, the model requires the alexnet_places365 pretrained model, provided here: https://urlzs.com/ytKK3
- To resume training (or to evaluate a saved model), set `resume_training` to True and set `resume_path` to the saved checkpoint.
- The `logger` created earlier is passed to `test` here so that the test errors are saved to the log file.

In [5]:
# ---- Training configuration ----
start_epoch = 25
max_epoch = 30
learning_rate = 1e-4

# ---- Resume / evaluate configuration ----
# With the flag on, the checkpoint at resume_path is loaded and evaluated
# right away, so this cell doubles as an "evaluate a saved model" step.
resume_training = True
resume_path = './saved_models/goosynth_pretrain/lian.pth.tar'

# ---- Model (moved to the GPU) ----
net = GazeNet()
net.cuda()

# ---- Optimizer ----
# GazeOptimizer hands out the optimizer for a given epoch.
gaze_opt = GazeOptimizer(net, learning_rate)
optimizer = gaze_opt.getOptimizer(start_epoch)

if resume_training:
    # The third value returned by resume_checkpoint is not needed here.
    net, optimizer, _ = resume_checkpoint(net, optimizer, resume_path)
    scores = test(net, test_data_loader, logger, save_output=True)
    # scores[1] is the L2 distance; uncomment to print it:
    # print('L2 Distance: ', scores[1])

=> loading checkpoint './saved_models/goosynth_pretrain/lian.pth.tar'


  0%|          | 0/68 [00:00<?, ?it/s]

=> loaded checkpoint './saved_models/goosynth_pretrain/lian.pth.tar' (epoch 24)


loss: 0.13326, 0.56249, 0.69574
  1%|▏         | 1/68 [00:09<10:35,  9.48s/it]loss: 0.13666, 0.36980, 0.50646
  3%|▎         | 2/68 [00:09<07:22,  6.71s/it]loss: 0.13475, 0.39274, 0.52748
  4%|▍         | 3/68 [00:10<05:11,  4.79s/it]loss: 0.14008, 0.38407, 0.52415
  6%|▌         | 4/68 [00:10<03:40,  3.44s/it]loss: 0.14128, 0.47111, 0.61239
  7%|▋         | 5/68 [00:10<02:41,  2.56s/it]loss: 0.15968, 0.59962, 0.75929
  9%|▉         | 6/68 [00:11<01:54,  1.85s/it]loss: 0.14161, 0.45249, 0.59410
 10%|█         | 7/68 [00:11<01:23,  1.37s/it]loss: 0.14998, 0.46215, 0.61213
 12%|█▏        | 8/68 [00:11<01:02,  1.04s/it]loss: 0.14828, 0.29334, 0.44162
 13%|█▎        | 9/68 [00:11<00:48,  1.23it/s]loss: 0.15552, 0.55673, 0.71225
 15%|█▍        | 10/68 [00:12<00:39,  1.48it/s]loss: 0.12569, 0.26923, 0.39492
 16%|█▌        | 11/68 [00:12<00:31,  1.82it/s]loss: 0.15978, 0.49965, 0.65943
 18%|█▊        | 12/68 [00:12<00:25,  2.21it/s]loss: 0.14892, 0.53157, 0.68049
 19%|█▉        | 13/68 [00:18

In [6]:
# Evaluate the current model on the test loader and keep the returned scores.
scores = test(net, test_data_loader, logger, save_output=True)

  0%|          | 0/68 [00:00<?, ?it/s]loss: 0.73637, 0.54460, 1.28097
  1%|▏         | 1/68 [00:10<11:45, 10.53s/it]loss: 0.73724, 0.70453, 1.44177
  3%|▎         | 2/68 [00:10<08:14,  7.50s/it]loss: 0.73599, 0.60091, 1.33690
  4%|▍         | 3/68 [00:11<05:46,  5.33s/it]loss: 0.73410, 0.66665, 1.40076
  6%|▌         | 4/68 [00:11<04:04,  3.83s/it]loss: 0.73932, 0.67326, 1.41258
  7%|▋         | 5/68 [00:11<02:54,  2.77s/it]loss: 0.73536, 0.67505, 1.41041
  9%|▉         | 6/68 [00:12<02:05,  2.02s/it]loss: 0.73947, 0.69226, 1.43173
 10%|█         | 7/68 [00:12<01:31,  1.51s/it]loss: 0.73198, 0.49461, 1.22660
 12%|█▏        | 8/68 [00:12<01:07,  1.13s/it]loss: 0.73474, 0.46742, 1.20217
 13%|█▎        | 9/68 [00:12<00:50,  1.18it/s]loss: 0.73281, 0.70513, 1.43794
 15%|█▍        | 10/68 [00:13<00:40,  1.44it/s]loss: 0.73591, 0.79120, 1.52711
 16%|█▌        | 11/68 [00:13<00:31,  1.80it/s]loss: 0.73420, 0.68806, 1.42226
 18%|█▊        | 12/68 [00:13<00:24,  2.27it/s]loss: 0.73605, 0.70345,

### 5. Training the Model
- Decide in which epochs you want to save the model, as you might not want to save it every epoch.
- Training and test errors can be found in the logs directory set up earlier.

In [8]:
# Lowest L2 score seen so far. Only the (currently disabled) checkpointing
# snippet at the bottom of the loop reads or updates it.
best_l2 = float('inf')

# NOTE(review): the epoch bounds are literals and do not use the
# start_epoch / max_epoch hyperparameters set earlier - confirm intended.
for epoch in range(26, 30):
    # Fetch the optimizer for this epoch, then run one training pass.
    optimizer = gaze_opt.getOptimizer(epoch)
    train(net, train_data_loader, optimizer, epoch, logger)

    # Disabled: per-epoch evaluation and saving of the model+optimizer
    # with the best L2 score. Uncomment to enable.
    # scores = test(net, test_data_loader, logger)
    # if scores[1] < best_l2:
    #     best_l2 = scores[1]
    #     save_path = './saved_models/gazenet_gooreal_notrain/'
    #     save_checkpoint(net, optimizer, 420, save_path)

100%|██████████| 77/77 [01:03<00:00,  1.21it/s]
100%|██████████| 77/77 [01:03<00:00,  1.22it/s]
100%|██████████| 77/77 [01:04<00:00,  1.19it/s]
100%|██████████| 77/77 [01:03<00:00,  1.21it/s]


In [9]:
# Final evaluation after training. Left as a bare expression so the
# notebook displays the returned scores (index 1 is the L2 distance).
test(net, test_data_loader, logger, save_output=True)

  0%|          | 0/68 [00:00<?, ?it/s]loss: 0.07214, 0.26543, 0.33757
  1%|▏         | 1/68 [00:10<12:03, 10.80s/it]loss: 0.07447, 0.24349, 0.31796
  3%|▎         | 2/68 [00:11<08:25,  7.66s/it]loss: 0.06412, 0.10938, 0.17350
  4%|▍         | 3/68 [00:11<05:54,  5.45s/it]loss: 0.06933, 0.16028, 0.22961
  6%|▌         | 4/68 [00:11<04:09,  3.89s/it]loss: 0.07046, 0.28990, 0.36037
  7%|▋         | 5/68 [00:11<02:55,  2.79s/it]loss: 0.07077, 0.29707, 0.36783
  9%|▉         | 6/68 [00:12<02:05,  2.02s/it]loss: 0.07177, 0.17802, 0.24980
 10%|█         | 7/68 [00:12<01:30,  1.49s/it]loss: 0.06956, 0.25314, 0.32271
 12%|█▏        | 8/68 [00:12<01:07,  1.12s/it]loss: 0.06615, 0.09999, 0.16614
 13%|█▎        | 9/68 [00:12<00:50,  1.16it/s]loss: 0.07876, 0.36843, 0.44719
 15%|█▍        | 10/68 [00:13<00:39,  1.48it/s]loss: 0.07102, 0.23269, 0.30372
 16%|█▌        | 11/68 [00:13<00:30,  1.87it/s]loss: 0.08862, 0.41587, 0.50448
 18%|█▊        | 12/68 [00:13<00:25,  2.20it/s]loss: 0.07576, 0.29878,

[0.8884825397733727, 0.17205015173593233, 33.337276480865654]