Ensure that TripletEmbeddingTrainer does not introduce NaNs when normalizing input to the unit sphere
JohnVinyard · Aug 30, 2018 · 9741550 · 9741550
1 parent ab80e8c
commit 9741550
Show file tree

Hide file tree

Showing 4 changed files with 59 additions and 2 deletions.
diff --git a/zounds/learn/embedding.py b/zounds/learn/embedding.py
@@ -4,7 +4,7 @@
 from torch import nn
 from torch.optim import Adam
 import torch
-from util import trainable_parameters
+from util import trainable_parameters, batchwise_unit_norm
 
 
 class TripletEmbeddingTrainer(Trainer):
@@ -75,7 +75,7 @@ def _apply_network_and_normalize(self, x):
         by section 4.2 of https://arxiv.org/pdf/1711.02209.pdf
         """
         x = self.network(x)
-        return x / torch.norm(x, dim=1).view(-1, 1)
+        return batchwise_unit_norm(x)
 
     def _select_batch(self, training_set):
         indices = np.random.randint(0, len(training_set), self.batch_size)

diff --git a/zounds/learn/test_embedding.py b/zounds/learn/test_embedding.py
@@ -0,0 +1,21 @@
+import torch
+import unittest2
+from embedding import TripletEmbeddingTrainer
+from torch import nn
+import numpy as np
+
+
+class TripletEmbeddingTrainerTests(unittest2.TestCase):
+    def test_normalization_does_not_cause_nans(self):
+        class Network(nn.Module):
+            def __init__(self):
+                super(Network, self).__init__()
+
+            def forward(self, x):
+                return x
+
+        network = Network()
+        trainer = TripletEmbeddingTrainer(network, 100, 32, slice(None))
+        x = torch.zeros(8, 3)
+        result = trainer._apply_network_and_normalize(x).data.numpy()
+        self.assertFalse(np.any(np.isnan(result)))
diff --git a/zounds/learn/test_util.py b/zounds/learn/test_util.py
@@ -0,0 +1,27 @@
+import unittest2
+import torch
+from util import batchwise_unit_norm
+import numpy as np
+
+
+class BatchwiseUnitNormTests(unittest2.TestCase):
+    def test_all_elements_have_unit_norm(self):
+        t = torch.FloatTensor(100, 5).normal_(0, 1)
+        t = batchwise_unit_norm(t).data.numpy()
+        norms = np.linalg.norm(t, axis=1)
+        np.testing.assert_allclose(norms, 1, rtol=1e-6)
+
+    def test_maintains_correct_shape_2d(self):
+        t = torch.FloatTensor(100, 5).normal_(0, 1)
+        t = batchwise_unit_norm(t).data.numpy()
+        self.assertEqual((100, 5), t.shape)
+
+    def test_maintains_correct_shape_3d(self):
+        t = torch.FloatTensor(100, 5, 3).normal_(0, 1)
+        t = batchwise_unit_norm(t).data.numpy()
+        self.assertEqual((100, 5, 3), t.shape)
+
+    def test_does_not_introduce_nans(self):
+        t = torch.FloatTensor(100, 5, 3).zero_()
+        t = batchwise_unit_norm(t).data.numpy()
+        self.assertFalse(np.any(np.isnan(t)))
diff --git a/zounds/learn/util.py b/zounds/learn/util.py
@@ -126,6 +126,15 @@ def sample_norm(x):
     return original / x.view(-1, 1, x.shape[-1])
 
 
+def batchwise_unit_norm(x, epsilon=1e-8):
+    batch_size = x.shape[0]
+    flattened = x.view(batch_size, -1)
+    norm = torch.norm(flattened, dim=1, keepdim=True)
+    expanded = norm.view(batch_size, *((1,) * (x.dim() - 1)))
+    normed = x / (expanded + epsilon)
+    return normed
+
+
 def feature_map_size(inp, kernel, stride=1, padding=0):
     return ((inp - kernel + (2 * padding)) / stride) + 1