add initial example for homography regression

kornia · Sep 6, 2018 · ce1524d · ce1524d
1 parent 8cbddb5
commit ce1524d
Show file tree

Hide file tree

Showing 3 changed files with 132 additions and 0 deletions.
diff --git a/examples/homography_regression/.gitignore b/examples/homography_regression/.gitignore
@@ -0,0 +1 @@
+data/*
diff --git a/examples/homography_regression/download_data.sh b/examples/homography_regression/download_data.sh
@@ -0,0 +1,11 @@
+#!/bin/bash
+# This script is useful to download the example data
+
+DATA_DIR=./data
+
+mkdir -p $DATA_DIR
+wget http://www.robots.ox.ac.uk/~vgg/research/affine/det_eval_files/img1.ppm -P $DATA_DIR
+wget http://www.robots.ox.ac.uk/~vgg/research/affine/det_eval_files/img2.ppm -P $DATA_DIR
+wget http://www.robots.ox.ac.uk/~vgg/research/affine/det_eval_files/H1to2p -P $DATA_DIR
+
+echo "## Succeded to download files to $DATA_DIR"
diff --git a/examples/homography_regression/main.py b/examples/homography_regression/main.py
@@ -0,0 +1,120 @@
+import argparse
+import os
+import cv2
+import numpy as np
+
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+import torch.optim as optim
+import torchgeometry as dgm
+
+
+def load_homography(file_name):
+    """Loads an homography from text file.
+    """
+    assert os.path.isfile(file_name), "Invalid file {}".format(file_name)
+    return torch.from_numpy(np.loadtxt(file_name)).float()
+
+
+def load_image(file_name):
+    """Loads the image with OpenCV and converts to torch.Tensor
+    """
+    assert os.path.isfile(file_name), "Invalid file {}".format(file_name)
+
+    # load image with OpenCV
+    img = cv2.imread(file_name, cv2.IMREAD_COLOR)
+
+    # convert image to torch tensor
+    tensor = dgm.utils.image_to_tensor(img).float() / 255.
+    tensor = tensor.view(1, *tensor.shape)  # 1xCxHxW
+
+    return tensor, img
+
+
+class MyHomography(nn.Module):
+    def __init__(self):
+        super(MyHomography, self).__init__()
+        self.homo = nn.Parameter(torch.Tensor(3, 3))
+
+        self.reset_parameters()
+
+    def reset_parameters(self, std=1e-1):
+        torch.nn.init.eye_(self.homo)
+        self.homo.data += torch.zeros_like(self.homo).uniform_(-std, std)
+
+    def forward(self):
+        return torch.unsqueeze(self.homo, dim=0)  # 1x3x3
+
+
+def HomographyRegressionApp():
+    # Training settings
+    parser = argparse.ArgumentParser(description='Homography Regression with perception loss.')
+    parser.add_argument('--input-dir', type=str, required=True,
+                        help='the path to the directory with the input data.')
+    parser.add_argument('--output-dir', type=str, required=True,
+                        help='the path to output the results.')
+    parser.add_argument('--num-iterations', type=int, default=1000, metavar='N',
+                        help='number of training iterations (default: 1000)')
+    parser.add_argument('--lr', type=float, default=1e-3, metavar='LR',
+                        help='learning rate (default: 1e-3)')
+    parser.add_argument('--momentum', type=float, default=0.9, metavar='M',
+                        help='SGD momentum (default: 0.9)')
+    parser.add_argument('--cuda', action='store_true', default=False,
+                        help='enables CUDA training')
+    parser.add_argument('--seed', type=int, default=666, metavar='S',
+                        help='random seed (default: 666)')
+    parser.add_argument('--log-interval', type=int, default=10, metavar='N',
+                        help='how many batches to wait before logging training status')
+    args = parser.parse_args()
+
+    # define the device to use for inference
+    use_cuda = args.cuda and torch.cuda.is_available()
+    device = torch.device('cuda' if use_cuda else 'cpu')
+
+    torch.manual_seed(args.seed)
+
+    # load the data
+    img_src, _ = load_image(os.path.join(args.input_dir, 'img1.ppm'))
+    img_dst, _ = load_image(os.path.join(args.input_dir, 'img2.ppm'))
+    dst_homo_src_gt = load_homography(os.path.join(args.input_dir, 'H1to2p'))
+
+    # instantiate the homography worker from `torchgeometry`
+    height, width = img_src.shape[-2:]
+    warper = dgm.HomographyWarper(height, width)
+
+    # create the homography as the parameter to be optimized
+    dst_homo_src = MyHomography().to(device)
+
+    # setup optimizer
+    optimizer = optim.SGD(dst_homo_src.parameters(), lr=args.lr,
+                          momentum=args.momentum)
+
+    # main training loop
+
+    for iter_idx in range(args.num_iterations):
+        # send data to device
+        img_src, img_dst = img_src.to(device), img_dst.to(device)
+
+        # warp the reference image to the destiny with current homography
+        img_src_to_dst = warper(img_src, dst_homo_src())
+        #import ipdb;ipdb.set_trace()
+
+        # compute the photometric loss
+        loss = F.mse_loss(img_src_to_dst, img_dst)
+        #loss = F.smooth_l1_loss(img_src_to_dst, img_dst)
+        #loss = F.l1_loss(img_src_to_dst, img_dst)
+
+        # compute gradient and update optimizer parameters
+        optimizer.zero_grad()
+        loss.backward()
+        optimizer.step()
+
+        if iter_idx % args.log_interval == 0:
+            print('Train Tteration: {}/{}\tLoss: {:.6}'.format(
+                  iter_idx, args.num_iterations, loss.item()))
+            print(dst_homo_src.homo)
+
+
+if __name__ == "__main__":
+     HomographyRegressionApp()