Merged
20 changes: 18 additions & 2 deletions test/test_operations.py
@@ -153,7 +153,10 @@ class XlaTestCase(TestCase):

def assertEqualRel(self, out, expected, rel_err=1e-2, abs_err=1e-5):
try:
nan_mask = torch.isnan(expected)
self.assertTrue(torch.equal(nan_mask, torch.isnan(out)))
diff_tensor = (out - expected).abs().float()
diff_tensor[nan_mask] = 0
max_rel_err = torch.max(out.abs(), expected.abs()).float() * rel_err
# Allow higher relative differences as long as we're still below the
# absolute error.
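For context, a minimal standalone sketch (not part of the PR; tensor values are made up) of what the new NaN handling in assertEqualRel does: NaNs must occur at the same positions in out and expected, and those entries are then excluded from the relative-error check.

import torch

# Toy tensors chosen only to illustrate the check.
out = torch.tensor([1.0, float('nan'), 3.0])
expected = torch.tensor([1.0, float('nan'), 3.0001])

nan_mask = torch.isnan(expected)
assert torch.equal(nan_mask, torch.isnan(out))  # NaNs must be in the same places
diff_tensor = (out - expected).abs().float()
diff_tensor[nan_mask] = 0  # NaN positions no longer contribute to the error
print(diff_tensor)  # only the non-NaN mismatch at index 2 remains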
@@ -733,11 +736,24 @@ def test_fn(a):

self.runAtenTest(torch.zeros([4, 4]), test_fn)

def test_max_throw(self):
def test_reduction_zero_dim(self):
self.runAtenTest(torch.rand(2, 0, 4).bool(), lambda x : torch.all(x))
self.runAtenTest(torch.rand(2, 0, 4).bool(), lambda x : torch.any(x))
self.runAtenTest(torch.rand(2, 0, 4), lambda x : torch.sum(x))
self.runAtenTest(torch.rand(2, 0, 4), lambda x : torch.mean(x))
self.runAtenTest(torch.rand(2, 0, 4), lambda x : torch.prod(x))
# min & max throws
xla_device = xm.xla_device()
xla_a = torch.randn(2, 0, 4, device=xla_device)
a = torch.rand(2, 0, 4)
xla_a = a.to(xla_device)
self.assertRaises(RuntimeError, lambda: torch.max(a, dim=1))
self.assertRaises(RuntimeError, lambda: torch.max(a))
self.assertRaises(RuntimeError, lambda: torch.min(a, dim=1))
self.assertRaises(RuntimeError, lambda: torch.min(a))
self.assertRaises(RuntimeError, lambda: torch.max(xla_a, dim=1))
self.assertRaises(RuntimeError, lambda: torch.max(xla_a))
self.assertRaises(RuntimeError, lambda: torch.min(xla_a, dim=1))
self.assertRaises(RuntimeError, lambda: torch.min(xla_a))
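For reference, a short eager-mode sketch (not part of the PR) of the CPU behavior the test above expects XLA to match; exact error messages can vary across PyTorch versions.

import torch

a = torch.rand(2, 0, 4)
print(torch.sum(a))         # tensor(0.)   - the empty sum is 0
print(torch.prod(a))        # tensor(1.)   - the empty product is 1
print(torch.mean(a))        # tensor(nan)  - dividing by zero elements
print(torch.all(a.bool()))  # tensor(True)
print(torch.any(a.bool()))  # tensor(False)

# min/max have no identity element over an empty dimension, so they raise.
try:
    torch.max(a)
except RuntimeError as e:
    print("max raised:", e)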

def test_writeable_tensors_updates(self):

12 changes: 8 additions & 4 deletions torch_xla/csrc/reduction.cpp
@@ -1,5 +1,7 @@
#include "torch_xla/csrc/reduction.h"

#include <cmath>

#include "tensorflow/compiler/xla/client/lib/arithmetic.h"
#include "tensorflow/compiler/xla/literal_util.h"
#include "tensorflow/compiler/xla/xla_client/debug_macros.h"
@@ -31,7 +33,6 @@ ReductionInfo GetReductionInfo(
rinfo.new_dimensions.push_back(shape.dimensions(i));
}
}
XLA_CHECK_GT(rinfo.element_count, 0);
return rinfo;
}

@@ -73,10 +74,11 @@ xla::XlaOp CreateSummation(
xla::XlaOp result = xla::Reduce(
input, init_value, XlaHelpers::CreateAddComputation(shape.element_type()),
dimensions);
if (scale && rinfo.element_count > 1) {
Collaborator:
Are you sure?
Coming in with count==0 means division by zero below...

Contributor Author (@ailzhang), Sep 5, 2019:
Yeah, NaN is the expected output for this case, in the sense that both NumPy and PyTorch return NaN...

In [1]: import numpy as np

In [2]: import torch

In [3]: a = torch.rand(2, 0, 4)

In [4]: a.mean()
Out[4]: tensor(nan)

In [5]: b = np.random.rand(2, 0, 4)

In [6]: b.mean()
/home/ubuntu/miniconda3/envs/maskrcnn36/bin/ipython:1: RuntimeWarning: Mean of empty slice.
  #!/home/ubuntu/miniconda3/envs/maskrcnn36/bin/python
/home/ubuntu/miniconda3/envs/maskrcnn36/lib/python3.6/site-packages/numpy/core/_methods.py:85: RuntimeWarning: invalid value encountered in double_scalars
  ret = ret.dtype.type(ret / rcount)
Out[6]: nan

Collaborator:
What about the line:

1.0f / static_cast<float>(rinfo.element_count)

?

Contributor Author:
Sorry, I didn't get this - what's the issue with that line? It produces a NaN, which is then multiplied into the result.

Collaborator:
Division by zero is undefined behavior, and what happens often depends on compiler options (whether to SIGFPE or not).
So better not to rely on it returning NaN.

Contributor Author:
Ehh, what's a better way to get NaN in this case?

Contributor:
Not sure what the most reliable way of constructing a NaN in XLA is. I assume ConstantR0 with a NaN float value should work.

Collaborator:
ScalarValue already does that.
I am not sure how XLA "feels" about a NaN uploaded to the TPU device. We can check.
In any case, that should be:

rinfo.element_count > 0 ? 1.0f / static_cast<float>(rinfo.element_count) : NAN
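A hedged Python analogue of the arithmetic being proposed (illustration only; the actual fix below stays in C++): with zero elements the scale becomes NaN, so the zero-valued sum multiplied by it yields NaN, matching what torch.mean returns for an empty tensor.

import math

def scaled_sum(values):
    total = sum(values)  # reduce with identity 0, like the xla::Reduce above
    count = len(values)
    scale = 1.0 / count if count > 0 else math.nan  # mirrors the guarded expression
    return total * scale

print(scaled_sum([1.0, 2.0, 3.0]))  # 2.0
print(scaled_sum([]))               # nan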

if (scale) {
xla::XlaOp scale = XlaHelpers::ScalarValue<float>(
1.0f / static_cast<float>(rinfo.element_count), shape.element_type(),
input.builder());
rinfo.element_count > 0 ? 1.0f / static_cast<float>(rinfo.element_count)
: NAN,
Collaborator:
I'd #include <cmath> and run clang-format.

Contributor Author:
Hmmm, clang-format seems to be happy with this line ;)
Btw, somehow it builds and passes the tests without cmath... but I added it anyway.

Collaborator:
Oh, I know it compiles, but it relies on some other header to transitively pull in the proper include, which is wrong.
If that header stops including cmath, we will suddenly break.

shape.element_type(), input.builder());
result = xla::Mul(result, scale);
}
if (keep_reduced_dimensions) {
@@ -146,6 +148,7 @@ xla::XlaOp BuildMaxInDim(const xla::XlaOp& input, xla::int64 dim,
xla::XlaOp init_value = XlaHelpers::ScalarValue(
min_max.min, shape.element_type(), input.builder());
ReductionInfo rinfo = GetReductionInfo(shape, {dim}, keep_reduced_dimensions);
XLA_CHECK_GT(rinfo.element_count, 0);
xla::XlaOp result = xla::Reduce(
input, init_value, XlaHelpers::CreateMaxComputation(shape.element_type()),
{dim});
@@ -162,6 +165,7 @@ xla::XlaOp BuildMinInDim(const xla::XlaOp& input, xla::int64 dim,
xla::XlaOp init_value = XlaHelpers::ScalarValue(
min_max.max, shape.element_type(), input.builder());
ReductionInfo rinfo = GetReductionInfo(shape, {dim}, keep_reduced_dimensions);
XLA_CHECK_GT(rinfo.element_count, 0);
xla::XlaOp result = xla::Reduce(
input, init_value, XlaHelpers::CreateMinComputation(shape.element_type()),
{dim});