pytorch · yhl48 · Apr 4, 2023 · Apr 4, 2023 · Apr 13, 2023 · Apr 13, 2023
diff --git a/aten/src/ATen/functorch/BatchRulesLoss.cpp b/aten/src/ATen/functorch/BatchRulesLoss.cpp
@@ -25,12 +25,14 @@ at::Tensor flatten_logical(const Tensor& tensor, optional<int64_t> bdim) {
   }
 }
 
-std::tuple<at::Tensor,optional<int64_t>>
-mse_loss_batch_rule(const at::Tensor& self, optional<int64_t> self_bdim, const at::Tensor& target,
-          optional<int64_t> target_bdim, int64_t reduction) {
+// Shared batch-rule body for losses: calls `loss_fn` with Reduction::None on the flattened inputs, then handles `reduction` itself.
+static std::tuple<at::Tensor,optional<int64_t>>
+loss_batch_rule_helper(const at::Tensor& self, optional<int64_t> self_bdim, const at::Tensor& target,
+          optional<int64_t> target_bdim, int64_t reduction,
+          std::function<at::Tensor(const at::Tensor&, const at::Tensor&, int64_t)> loss_fn) {
   auto self_ = flatten_logical(self, self_bdim);
   auto target_ = flatten_logical(target, target_bdim);
-  auto result = at::mse_loss(self_, target_, Reduction::None);
+  auto result = loss_fn(self_, target_, Reduction::None);
   if (result.dim() == 1) {
     return std::make_tuple(result, 0);
   } else if (reduction == Reduction::None) {
@@ -46,6 +48,24 @@ mse_loss_batch_rule(const at::Tensor& self, optional<int64_t> self_bdim, const a
   TORCH_INTERNAL_ASSERT(false);
 };
 
+// vmap batch rule for mse_loss: delegates to loss_batch_rule_helper with at::mse_loss as the loss callback.
+std::tuple<at::Tensor,optional<int64_t>> mse_loss_batch_rule(
+    const at::Tensor& self, optional<int64_t> self_bdim,
+    const at::Tensor& target, optional<int64_t> target_bdim, int64_t reduction) {
+  // The helper decides which reduction is handed to the callback; `red` is forwarded to at::mse_loss unchanged.
+  const auto loss = [](const at::Tensor& a, const at::Tensor& b, int64_t red) { return at::mse_loss(a, b, red); };
+  return loss_batch_rule_helper(self, self_bdim, target, target_bdim, reduction, loss);
+}
+
+// vmap batch rule for smooth_l1_loss: delegates to loss_batch_rule_helper, binding `beta` into the loss callback.
+std::tuple<at::Tensor,optional<int64_t>> smooth_l1_loss_batch_rule(
+    const at::Tensor& self, optional<int64_t> self_bdim, const at::Tensor& target,
+    optional<int64_t> target_bdim, int64_t reduction, double beta) {
+  // The helper decides which reduction is handed to the callback; `beta` is captured by value and passed through unchanged.
+  const auto loss = [beta](const at::Tensor& a, const at::Tensor& b, int64_t red) { return at::smooth_l1_loss(a, b, red, beta); };
+  return loss_batch_rule_helper(self, self_bdim, target, target_bdim, reduction, loss);
+}
+
 static Tensor apply_loss_reduction(const at::Tensor& unreduced, int64_t reduction) {
   if (reduction == at::Reduction::Mean) {
     return unreduced.mean();
@@ -283,6 +303,7 @@ TORCH_LIBRARY_IMPL(aten, FuncTorchBatched, m) {
   m.impl("nll_loss2d_backward", nll_loss_backward_decomposition);
   VMAP_SUPPORT(mse_loss, mse_loss_batch_rule);
   // mse_loss_backwards uses a decomposition for its batch rule
+  VMAP_SUPPORT(smooth_l1_loss, smooth_l1_loss_batch_rule);
   m.impl("binary_cross_entropy", binary_cross_entropy_plumbing);
   m.impl("binary_cross_entropy_backward", binary_cross_entropy_backward_plumbing);
 }

diff --git a/test/functorch/test_vmap.py b/test/functorch/test_vmap.py
@@ -3684,7 +3684,6 @@ def test_vmap_exhaustive(self, device, dtype, op):
         xfail('nn.functional.triplet_margin_loss', ''),
         xfail('nn.functional.pdist', ''),
         xfail('scatter_reduce', 'sum'),
-        xfail('nn.functional.smooth_l1_loss', ''),
         xfail('scatter_reduce', 'amax'),
         xfail('nn.functional.max_unpool1d', 'grad'),
         xfail('nn.functional.multi_margin_loss', ''),