@@ -1,6 +1,5 @@
 #include "torch_xla/csrc/convolution.h"
 
-#include "tensorflow/compiler/tf2xla/kernels/conv_op_helpers.h"
 #include "tensorflow/compiler/xla/client/lib/constants.h"
 #include "torch_xla/csrc/helpers.h"
 #include "torch_xla/csrc/runtime/debug_macros.h"
@@ -33,10 +32,8 @@ namespace {
  * - grad_input: conv(grad_output, weight^T) (with padding etc)
  * - grad_weight: conv(input^T, grad_output)
  *
- * XLA provides the following wrappers instead of calling into raw
- * ConvGeneralDilated.
+ * The helpers below are inspired by the TF2XLA implementation of convolution:
  * https://github.com/tensorflow/tensorflow/blob/master/tensorflow/compiler/tf2xla/kernels/conv_op_helpers.cc
- * - MakeXlaForwardConvOp (not used in our lowering, see below)
  * - MakeXlaBackpropInputConvOp
  * - MakeXlaBackpropFilterConvOp
  *
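For intuition, here is a minimal scalar reference for the two backward formulas in the comment above, using a 1-D, stride-1, unpadded convolution. This is an illustration only, not part of the patch; the function names and the 1-D simplification are assumptions.

#include <vector>

// forward: out[i] = sum_k in[i + k] * w[k], so out has size In - K + 1.
// grad_input scatters grad_output back through the kernel, which is the
// "conv(grad_output, weight^T)" of the comment above (a full correlation
// with the flipped kernel).
std::vector<float> ConvBackwardInput(const std::vector<float>& grad_out,
                                     const std::vector<float>& w,
                                     int input_size) {
  std::vector<float> grad_in(input_size, 0.f);
  for (int i = 0; i < static_cast<int>(grad_out.size()); ++i)
    for (int k = 0; k < static_cast<int>(w.size()); ++k)
      grad_in[i + k] += grad_out[i] * w[k];
  return grad_in;
}

// grad_weight correlates the input with grad_output, i.e. the
// "conv(input^T, grad_output)" of the comment above.
std::vector<float> ConvBackwardWeight(const std::vector<float>& grad_out,
                                      const std::vector<float>& in,
                                      int kernel_size) {
  std::vector<float> grad_w(kernel_size, 0.f);
  for (int k = 0; k < kernel_size; ++k)
    for (int i = 0; i < static_cast<int>(grad_out.size()); ++i)
      grad_w[k] += grad_out[i] * in[i + k];
  return grad_w;
}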
@@ -74,10 +71,9 @@ namespace {
  * depthwise convolution, there's no need to do additional reshapes to match to
  * XLA expected format. This is also why we use raw ConvGeneralDilated instead
  * of MakeXlaForwardConvOp in forward graph. For code simplicity we still want
- * to use the MakeXlaBackpropInputConvOp and MakeXlaBackpropFilterConvOp given
- * they have many useful steps that we don't want to duplicate here, we simply
- * enforce depthwise = false inside those functions, so that we skip the reshape
- * steps XLA has with a [Hker, Wker, Cin, M] input.
+ * to use MakeXlaBackpropInputConvOp and MakeXlaBackpropFilterConvOp; we simply
+ * enforce depthwise = false inside those functions, so that we skip the
+ * reshape steps XLA has with a [Hker, Wker, Cin, M] input.
  *
  * forward: (conv with groups = G)
  * - input: [N, Hin, Win, Cin]
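The forward lowering the comment describes, grouped convolution sent straight through raw ConvGeneralDilated, could look roughly like the sketch below. This is a hedged illustration, not the helper in this file: the function name, the NCHW dimension assignments (matching the FORMAT_NCHW used later in this file), and the parameter plumbing are all assumptions.

// Hypothetical sketch only: grouped forward conv lowered directly through
// xla::ConvGeneralDilated, mapping PyTorch's `groups` onto XLA's
// feature_group_count, so no depthwise reshape is needed.
xla::XlaOp GroupedForwardConv(
    xla::XlaOp input, xla::XlaOp kernel, absl::Span<const int64_t> stride,
    absl::Span<const std::pair<int64_t, int64_t>> padding,
    absl::Span<const int64_t> dilation, int64_t groups) {
  xla::ConvolutionDimensionNumbers dnums;
  dnums.set_input_batch_dimension(0);            // N
  dnums.set_input_feature_dimension(1);          // Cin
  dnums.set_output_batch_dimension(0);           // N
  dnums.set_output_feature_dimension(1);         // Cout
  dnums.set_kernel_output_feature_dimension(0);  // Cout
  dnums.set_kernel_input_feature_dimension(1);   // Cin / G
  for (int i = 0; i < static_cast<int>(stride.size()); ++i) {
    dnums.add_input_spatial_dimensions(2 + i);
    dnums.add_output_spatial_dimensions(2 + i);
    dnums.add_kernel_spatial_dimensions(2 + i);
  }
  // No input (lhs) dilation in the forward pass; kernel (rhs) dilation
  // carries PyTorch's dilation attribute.
  std::vector<int64_t> ones(stride.size(), 1);
  return xla::ConvGeneralDilated(input, kernel, stride, padding,
                                 /*lhs_dilation=*/ones,
                                 /*rhs_dilation=*/dilation, dnums,
                                 /*feature_group_count=*/groups);
}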
@@ -121,16 +117,15 @@ xla::XlaOp PadInputFromOutputSize(xla::XlaOp input,
   return PadToSize(input, expected_input_sizes);
 }
 
-// Create a TF convolution metadata structure out of PyTorch convolution
-// attributes.
-tensorflow::ConvOpAttrs MakeConvOpAttrs(
-    absl::Span<const int64_t> spatial_stride,
-    absl::Span<const int64_t> spatial_padding,
-    absl::Span<const int64_t> spatial_dilation, bool depthwise) {
+// Create a ConvOpAttrs structure out of PyTorch convolution attributes.
+ConvOpAttrs MakeConvOpAttrs(absl::Span<const int64_t> spatial_stride,
+                            absl::Span<const int64_t> spatial_padding,
+                            absl::Span<const int64_t> spatial_dilation,
+                            bool depthwise) {
   int num_spatial_dims = spatial_stride.size();
   XLA_CHECK_EQ(spatial_padding.size(), num_spatial_dims);
   XLA_CHECK_EQ(spatial_dilation.size(), num_spatial_dims);
-  tensorflow::ConvOpAttrs conv_op_attrs;
+  ConvOpAttrs conv_op_attrs;
   conv_op_attrs.depthwise = depthwise;
   conv_op_attrs.num_spatial_dims = num_spatial_dims;
   // Stride, dilation and padding must be set for the batch and feature in the
@@ -142,15 +137,15 @@ tensorflow::ConvOpAttrs MakeConvOpAttrs(
   conv_op_attrs.strides = {1, 1};
   std::copy(spatial_stride.begin(), spatial_stride.end(),
             std::back_inserter(conv_op_attrs.strides));
-  conv_op_attrs.padding = tensorflow::Padding::EXPLICIT;
+  conv_op_attrs.padding = Padding::EXPLICIT;
   // https://github.com/tensorflow/tensorflow/blob/ec81825aaf7e848d9f8ddffdf1e0d20aebe9172c/tensorflow/core/util/padding.cc#L40
   // explicit_paddings must have (spatial_dims + 2) * 2 elements
   conv_op_attrs.explicit_paddings.resize(4);
   for (int spatial_dim = 0; spatial_dim < num_spatial_dims; ++spatial_dim) {
     conv_op_attrs.explicit_paddings.push_back(spatial_padding[spatial_dim]);
     conv_op_attrs.explicit_paddings.push_back(spatial_padding[spatial_dim]);
   }
-  conv_op_attrs.data_format = tensorflow::TensorFormat::FORMAT_NCHW;
+  conv_op_attrs.data_format = TensorFormat::FORMAT_NCHW;
   return conv_op_attrs;
 }
 
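As a concrete illustration (not part of the patch) of what MakeConvOpAttrs produces, consider a 2-D convolution; the dilations field is populated by code elided between the hunks above and is omitted here.

// Illustrative only: expected contents for a 2-D conv.
ConvOpAttrs attrs = MakeConvOpAttrs(/*spatial_stride=*/{2, 2},
                                    /*spatial_padding=*/{1, 1},
                                    /*spatial_dilation=*/{1, 1},
                                    /*depthwise=*/false);
// attrs.strides           == {1, 1, 2, 2}              // batch, feature, H, W
// attrs.explicit_paddings == {0, 0, 0, 0, 1, 1, 1, 1}  // (spatial_dims + 2) * 2 entries
// attrs.data_format       == TensorFormat::FORMAT_NCHW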
@@ -218,13 +213,13 @@ xla::XlaOp BuildConvBackwardInput(xla::XlaOp grad_output, xla::XlaOp kernel,
                                   absl::Span<const int64_t> spatial_padding,
                                   absl::Span<const int64_t> spatial_dilation,
                                   int64_t groups) {
-  tensorflow::ConvOpAttrs conv_op_attrs =
+  ConvOpAttrs conv_op_attrs =
       MakeConvOpAttrs(spatial_stride, spatial_padding, spatial_dilation, false);
   xla::XlaOp kernel_transposed =
       xla::Transpose(kernel, FilterTransposePermutation(input_shape.rank()));
-  return ConsumeValue(tensorflow::MakeXlaBackpropInputConvOp(
-      "conv_backward_input", input_shape, kernel_transposed, grad_output,
-      conv_op_attrs));
+  return ConsumeValue(MakeXlaBackpropInputConvOp("conv_backward_input",
+                                                 input_shape, kernel_transposed,
+                                                 grad_output, conv_op_attrs));
 }
 
 // Computes the kernel gradient for a convolution.
@@ -234,14 +229,14 @@ xla::XlaOp BuildConvBackwardWeight(xla::XlaOp grad_output, xla::XlaOp input,
                                    absl::Span<const int64_t> spatial_padding,
                                    absl::Span<const int64_t> spatial_dilation,
                                    int64_t groups) {
-  tensorflow::ConvOpAttrs conv_op_attrs =
+  ConvOpAttrs conv_op_attrs =
       MakeConvOpAttrs(spatial_stride, spatial_padding, spatial_dilation, false);
   auto transpose_permutation = FilterTransposePermutation(kernel_shape.rank());
   auto inv_transpose_permutation =
       xla::InversePermutation(transpose_permutation);
   xla::Shape transposed_weight_shape =
       xla::ShapeUtil::PermuteDimensions(transpose_permutation, kernel_shape);
-  xla::XlaOp conv = ConsumeValue(tensorflow::MakeXlaBackpropFilterConvOp(
+  xla::XlaOp conv = ConsumeValue(MakeXlaBackpropFilterConvOp(
       "conv_backward_weight", input, transposed_weight_shape, grad_output,
       conv_op_attrs));
 
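Finally, a hedged usage sketch for the two builders above. The middle parameters (input_shape / kernel_shape and spatial_stride) are elided in the hunks and assumed from the surrounding bodies; the variables are presumed in scope, and all names and sizes are illustrative.

// Hypothetical call sites (parameter order assumed from the signatures above;
// grad_output, kernel, input, input_shape and kernel_shape are assumed in scope).
xla::XlaOp grad_input = BuildConvBackwardInput(
    grad_output, kernel, input_shape,
    /*spatial_stride=*/{1, 1}, /*spatial_padding=*/{0, 0},
    /*spatial_dilation=*/{1, 1}, /*groups=*/1);
xla::XlaOp grad_weight = BuildConvBackwardWeight(
    grad_output, input, kernel_shape,
    /*spatial_stride=*/{1, 1}, /*spatial_padding=*/{0, 0},
    /*spatial_dilation=*/{1, 1}, /*groups=*/1);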