
Commit 63de0b5

Added aten::norm operations.
1 parent 6db4fff commit 63de0b5

File tree (7 files changed: +148 −2 lines)

test/cpp/test_aten_xla_tensor.cpp
torch_xla/csrc/aten_xla_type.cpp
torch_xla/csrc/aten_xla_type.h
torch_xla/csrc/ops/ops.cpp
torch_xla/csrc/ops/ops.h
torch_xla/csrc/tensor.cpp
torch_xla/csrc/tensor.h

test/cpp/test_aten_xla_tensor.cpp

Lines changed: 60 additions & 0 deletions
@@ -831,6 +831,66 @@ TEST_F(AtenXlaTensorTest, TestSumInDimsKeep) {
   });
 }
 
+TEST_F(AtenXlaTensorTest, TestNorm) {
+  at::Tensor a = at::rand({4, 3, 4}, at::TensorOptions(at::kFloat));
+  at::Tensor b = at::norm(a);
+  ForEachDevice([&](const Device& device) {
+    at::Tensor xla_a = bridge::CreateXlaTensor(a, device);
+    at::Tensor xla_b = at::norm(xla_a);
+    AllClose(b, xla_b);
+  });
+}
+
+TEST_F(AtenXlaTensorTest, TestNormInDim) {
+  at::Tensor a = at::rand({4, 3, 4}, at::TensorOptions(at::kFloat));
+  at::Tensor b = at::norm(a, 2, {1}, /*keepdim=*/false);
+  ForEachDevice([&](const Device& device) {
+    at::Tensor xla_a = bridge::CreateXlaTensor(a, device);
+    at::Tensor xla_b = at::norm(xla_a, 2, {1}, /*keepdim=*/false);
+    AllClose(b, xla_b);
+  });
+}
+
+TEST_F(AtenXlaTensorTest, TestNormInDims) {
+  at::Tensor a = at::rand({4, 3, 4}, at::TensorOptions(at::kFloat));
+  at::Tensor b = at::norm(a, 2, {1, 2}, /*keepdim=*/false);
+  ForEachDevice([&](const Device& device) {
+    at::Tensor xla_a = bridge::CreateXlaTensor(a, device);
+    at::Tensor xla_b = at::norm(xla_a, 2, {1, 2}, /*keepdim=*/false);
+    AllClose(b, xla_b);
+  });
+}
+
+TEST_F(AtenXlaTensorTest, TestNormInDimsKeep) {
+  at::Tensor a = at::rand({4, 3, 4}, at::TensorOptions(at::kFloat));
+  at::Tensor b = at::norm(a, 2, {1, 2}, /*keepdim=*/true);
+  ForEachDevice([&](const Device& device) {
+    at::Tensor xla_a = bridge::CreateXlaTensor(a, device);
+    at::Tensor xla_b = at::norm(xla_a, 2, {1, 2}, /*keepdim=*/true);
+    AllClose(b, xla_b);
+  });
+}
+
+TEST_F(AtenXlaTensorTest, TestNormGeneral) {
+  at::Tensor a = at::rand({4, 3, 4}, at::TensorOptions(at::kFloat));
+  at::Tensor b = at::norm(a, 3.5);
+  ForEachDevice([&](const Device& device) {
+    at::Tensor xla_a = bridge::CreateXlaTensor(a, device);
+    at::Tensor xla_b = at::norm(xla_a, 3.5);
+    AllClose(b, xla_b);
+  });
+}
+
+TEST_F(AtenXlaTensorTest, TestNormNuclear) {
+  at::Tensor a = at::rand({4, 3, 4}, at::TensorOptions(at::kFloat));
+  at::Tensor b = at::norm(a, 1);
+  ForEachDevice([&](const Device& device) {
+    at::Tensor xla_a = bridge::CreateXlaTensor(a, device);
+    at::Tensor xla_b = at::norm(xla_a, 1);
+    AllClose(b, xla_b);
+  });
+}
+
 TEST_F(AtenXlaTensorTest, TestProd) {
   at::Tensor a = at::rand({4, 3, 4}, at::TensorOptions(at::kFloat));
   at::Tensor b = at::prod(a);
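For reference, the dim-taking variants reduce only over the listed dimensions. For the (4, 3, 4) input with p = 2, the quantity that TestNormInDims / TestNormInDimsKeep compare against the CPU reference is, per remaining index i (a sketch of standard reduction semantics, not text from the diff):

\[
  \lVert a_i \rVert_2 = \Big( \sum_{j=0}^{2} \sum_{k=0}^{3} a_{ijk}^2 \Big)^{1/2},
\]

yielding a result of shape (4) with keepdim=false and (4, 1, 1) with keepdim=true.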

torch_xla/csrc/aten_xla_type.cpp

Lines changed: 27 additions & 2 deletions
@@ -1039,8 +1039,7 @@ at::Tensor& AtenXlaType::trunc_(at::Tensor& self) const {
 }
 
 at::Tensor AtenXlaType::frac(const at::Tensor& self) const {
-  return bridge::AtenFromXlaTensor(
-      XLATensor::frac(bridge::GetXlaTensor(self)));
+  return bridge::AtenFromXlaTensor(XLATensor::frac(bridge::GetXlaTensor(self)));
 }
 
 at::Tensor& AtenXlaType::frac_(at::Tensor& self) const {
@@ -1365,6 +1364,32 @@ at::Tensor AtenXlaType::dropout(const at::Tensor& input, double p,
       XLATensor::dropout(bridge::GetXlaTensor(input), p));
 }
 
+at::Tensor AtenXlaType::norm(const at::Tensor& self,
+                             c10::optional<at::Scalar> p,
+                             at::ScalarType dtype) const {
+  return bridge::AtenFromXlaTensor(XLATensor::norm(
+      bridge::GetXlaTensor(self), p, dtype, {}, /*keepdim=*/false));
+}
+
+at::Tensor AtenXlaType::norm(const at::Tensor& self, at::Scalar p) const {
+  return bridge::AtenFromXlaTensor(XLATensor::norm(
+      bridge::GetXlaTensor(self), p, c10::nullopt, {}, /*keepdim=*/false));
+}
+
+at::Tensor AtenXlaType::norm(const at::Tensor& self,
+                             c10::optional<at::Scalar> p, at::IntArrayRef dim,
+                             bool keepdim, at::ScalarType dtype) const {
+  return bridge::AtenFromXlaTensor(
+      XLATensor::norm(bridge::GetXlaTensor(self), p, dtype, dim, keepdim));
+}
+
+at::Tensor AtenXlaType::norm(const at::Tensor& self,
+                             c10::optional<at::Scalar> p, at::IntArrayRef dim,
+                             bool keepdim) const {
+  return bridge::AtenFromXlaTensor(XLATensor::norm(
+      bridge::GetXlaTensor(self), p, c10::nullopt, dim, keepdim));
+}
+
 at::Tensor AtenXlaType::log_softmax(const at::Tensor& self, int64_t dim) const {
   return bridge::AtenFromXlaTensor(
       XLATensor::log_softmax(bridge::GetXlaTensor(self), dim));
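To illustrate how the overloads above route into XLATensor::norm, here is a minimal, hypothetical ATen snippet (not part of this commit; it only uses call forms that also appear in the new tests). The comments state the arguments the matching overload forwards, per the implementations above:

#include <ATen/ATen.h>

int main() {
  at::Tensor t = at::rand({4, 3, 4}, at::TensorOptions(at::kFloat));

  // No dim argument: the overloads above pass dim={} and keepdim=false,
  // so the norm is taken over every element of t.
  at::Tensor two_norm = at::norm(t);      // p unset or 2 -> Frobenius norm
  at::Tensor p_norm = at::norm(t, 3.5);   // generic sum(x^p)^(1/p) path

  // dim/keepdim overload: reduce over dims 1 and 2 only, keeping them
  // as size-1 dimensions in the result (dtype stays c10::nullopt).
  at::Tensor kept = at::norm(t, 2, {1, 2}, /*keepdim=*/true);
  return 0;
}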

torch_xla/csrc/aten_xla_type.h

Lines changed: 9 additions & 0 deletions
@@ -427,6 +427,15 @@ class AtenXlaType : public AtenXlaTypeBase {
   at::Tensor dropout(const at::Tensor& input, double p,
                      bool train) const override;
 
+  at::Tensor norm(const at::Tensor& self, c10::optional<at::Scalar> p,
+                  at::ScalarType dtype) const override;
+  at::Tensor norm(const at::Tensor& self, at::Scalar p) const override;
+  at::Tensor norm(const at::Tensor& self, c10::optional<at::Scalar> p,
+                  at::IntArrayRef dim, bool keepdim,
+                  at::ScalarType dtype) const override;
+  at::Tensor norm(const at::Tensor& self, c10::optional<at::Scalar> p,
+                  at::IntArrayRef dim, bool keepdim) const override;
+
   at::Tensor log_softmax(const at::Tensor& self, int64_t dim) const override;
   at::Tensor _log_softmax(const at::Tensor& self, int64_t dim,
                           bool half_to_float) const override;

torch_xla/csrc/ops/ops.cpp

Lines changed: 37 additions & 0 deletions
@@ -14,6 +14,7 @@
 #include "torch_xla/csrc/ops/arithmetic_ir_ops.h"
 #include "torch_xla/csrc/ops/constant.h"
 #include "torch_xla/csrc/ops/infer_output_shape.h"
+#include "torch_xla/csrc/ops/sum.h"
 #include "torch_xla/csrc/pooling.h"
 #include "torch_xla/csrc/tensor_util.h"
 #include "torch_xla/csrc/xla_lower_util.h"
@@ -415,6 +416,42 @@ NodePtr BroadcastTensors(tensorflow::gtl::ArraySlice<const Value> tensors) {
       std::move(lower_fn), /*num_outputs=*/tensors.size());
 }
 
+NodePtr Norm(const Value& input, c10::optional<at::Scalar> p,
+             c10::optional<at::ScalarType> dtype, at::IntArrayRef dim,
+             bool keepdim) {
+  std::vector<xla::int64> dimensions(dim.begin(), dim.end());
+  if (dimensions.empty()) {
+    dimensions = xla::util::Iota<xla::int64>(input.shape().rank());
+  }
+  if (!p.has_value() || p->toDouble() == 2.0) {
+    NodePtr square = input * input;
+    NodePtr result = MakeNode<Sum>(square, dimensions, keepdim, dtype);
+    return Sqrt(result);
+  }
+  double norm_value = p->toDouble();
+  if (norm_value == 1.0) {
+    // Contrary to documentation, norm(p=1) has nothing to do with traces and
+    // standard mathematical definitions of nuclear norms:
+    //
+    // >>> import torch
+    // >>> x = torch.randn(4, 4)
+    // >>> print(torch.norm(x, 1))
+    // tensor(11.9437)
+    // >>> print(torch.trace(x.abs()))
+    // tensor(3.1235)
+    // >>> print(x.abs().sum())
+    // tensor(11.9437)
+    return MakeNode<Sum>(Abs(input), dimensions, keepdim, dtype);
+  }
+  // Generic sum(x^p)^(1/p) norms.
+  NodePtr norm_exp = ScalarOp(norm_value, input.shape().element_type());
+  NodePtr norm_exp_inv =
+      ScalarOp(1.0 / norm_value, input.shape().element_type());
+  NodePtr exp = Pow(input, norm_exp);
+  NodePtr result = MakeNode<Sum>(exp, dimensions, keepdim, dtype);
+  return Pow(result, norm_exp_inv);
+}
+
 }  // namespace ops
 }  // namespace ir
 }  // namespace torch_xla
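In formulas, the Norm lowering above picks one of three reductions over the dimension set D (every dimension when dim is empty); this summary restates the code paths and is not part of the diff:

\[
  \mathrm{Norm}(x; p, D) =
  \begin{cases}
    \sqrt{\sum_{D} x^2} & \text{if } p \text{ is unset or } p = 2, \\
    \sum_{D} \lvert x \rvert & \text{if } p = 1, \\
    \bigl( \sum_{D} x^{p} \bigr)^{1/p} & \text{otherwise},
  \end{cases}
\]

with keepdim deciding whether the reduced dimensions are retained as size 1, and dtype forwarded to the underlying Sum node.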

torch_xla/csrc/ops/ops.h

Lines changed: 4 additions & 0 deletions
@@ -142,6 +142,10 @@ NodePtr ARange(const at::Scalar& start, const at::Scalar& end,
 
 NodePtr BroadcastTensors(tensorflow::gtl::ArraySlice<const Value> tensors);
 
+NodePtr Norm(const Value& input, c10::optional<at::Scalar> p,
+             c10::optional<at::ScalarType> dtype, at::IntArrayRef dim,
+             bool keepdim);
+
 }  // namespace ops
 }  // namespace ir
 }  // namespace torch_xla

torch_xla/csrc/tensor.cpp

Lines changed: 7 additions & 0 deletions
@@ -1037,6 +1037,13 @@ XLATensor XLATensor::dropout(const XLATensor& input, double p) {
       ir::MakeNode<ir::ops::Dropout>(input.GetIrValue(), p));
 }
 
+XLATensor XLATensor::norm(const XLATensor& input, c10::optional<at::Scalar> p,
+                          c10::optional<at::ScalarType> dtype,
+                          at::IntArrayRef dim, bool keepdim) {
+  return input.CreateFrom(
+      ir::ops::Norm(input.GetIrValue(), p, dtype, dim, keepdim));
+}
+
 XLATensor XLATensor::neg(const XLATensor& input) {
   return input.CreateFrom(ir::ops::Neg(input.GetIrValue()));
 }

torch_xla/csrc/tensor.h

Lines changed: 4 additions & 0 deletions
@@ -302,6 +302,10 @@ class XLATensor {
 
   static XLATensor dropout(const XLATensor& input, double p);
 
+  static XLATensor norm(const XLATensor& input, c10::optional<at::Scalar> p,
+                        c10::optional<at::ScalarType> dtype,
+                        at::IntArrayRef dim, bool keepdim);
+
   static XLATensor neg(const XLATensor& input);
   static void neg_(XLATensor& input);