From e153d2175170c61dd217ebfb6d00d0a9b66137a7 Mon Sep 17 00:00:00 2001
From: Deepak Cherian
Date: Thu, 13 Nov 2025 21:07:29 -0700
Subject: [PATCH 1/2] Optimize padding for coarsening.
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Pad once instead of padding serially, once per dimension being coarsened.

```
| Before [6a7a11b5] | After [873f7ce6] | Ratio | Benchmark (Parameter)                        |
|-------------------|------------------|-------|----------------------------------------------|
| 856M              | 727M             | 0.85  | coarsen.Coarsen.peakmem_coarsen_with_padding |
| 59.7±1ms          | 49.9±0.4ms       | 0.84  | coarsen.Coarsen.time_coarsen_with_padding    |
| 729M              | 597M             | 0.82  | coarsen.Coarsen.peakmem_coarsen_no_padding   |
| 55.2±0.4ms        | 39.5±0.1ms       | 0.71  | coarsen.Coarsen.time_coarsen_no_padding      |
```

Co-authored-by: Claude
---
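Note (after the `---`, so not part of the commit message): the change batches the
per-dimension pad widths and issues a single pad call, instead of allocating a
freshly padded copy of the array for each dimension. A minimal NumPy sketch of the
idea, with illustrative names, array shape, and window sizes mirroring the benchmark;
this is not the actual xarray internals, which go through `Variable.pad`:

```python
import numpy as np

arr = np.ones((4003, 4007))  # neither dimension is a multiple of the window
windows = {0: 10, 1: 10}     # axis -> window size (covers every axis, in order)

# Old approach: pad each axis separately; every np.pad call allocates
# a new full-size intermediate array.
padded = arr
for axis, window in windows.items():
    widths = [(0, 0)] * padded.ndim
    widths[axis] = (0, -padded.shape[axis] % window)
    padded = np.pad(padded, widths, mode="constant")

# New approach: collect all pad widths first, then pad once,
# allocating a single output array.
widths = [(0, -arr.shape[axis] % window) for axis, window in windows.items()]
padded_once = np.pad(arr, widths, mode="constant")

assert padded.shape == padded_once.shape == (4010, 4010)
```

With both dimensions needing padding, the serial path materializes one intermediate
per dimension, which is roughly where the peak-memory saving in the table above
comes from.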
 asv_bench/benchmarks/coarsen.py | 47 +++++++++++++++++++++++++++++++++
 xarray/core/variable.py         | 11 ++++----
 2 files changed, 53 insertions(+), 5 deletions(-)
 create mode 100644 asv_bench/benchmarks/coarsen.py

diff --git a/asv_bench/benchmarks/coarsen.py b/asv_bench/benchmarks/coarsen.py
new file mode 100644
index 00000000000..8ece4550b3e
--- /dev/null
+++ b/asv_bench/benchmarks/coarsen.py
@@ -0,0 +1,47 @@
+import numpy as np
+
+import xarray as xr
+
+from . import randn
+
+# Sizes chosen to test padding optimization
+nx_padded = 4003  # Not divisible by 10 - requires padding
+ny_padded = 4007  # Not divisible by 10 - requires padding
+
+nx_exact = 4000  # Divisible by 10 - no padding needed
+ny_exact = 4000  # Divisible by 10 - no padding needed
+
+window = 10
+
+
+class Coarsen:
+    def setup(self, *args, **kwargs):
+        # Case 1: Requires padding on both dimensions
+        self.da_padded = xr.DataArray(
+            randn((nx_padded, ny_padded)),
+            dims=("x", "y"),
+            coords={"x": np.arange(nx_padded), "y": np.arange(ny_padded)},
+        )
+
+        # Case 2: No padding required
+        self.da_exact = xr.DataArray(
+            randn((nx_exact, ny_exact)),
+            dims=("x", "y"),
+            coords={"x": np.arange(nx_exact), "y": np.arange(ny_exact)},
+        )
+
+    def time_coarsen_with_padding(self):
+        """Coarsen 2D array where both dimensions require padding."""
+        self.da_padded.coarsen(x=window, y=window, boundary="pad").mean()
+
+    def time_coarsen_no_padding(self):
+        """Coarsen 2D array where dimensions are exact multiples (no padding)."""
+        self.da_exact.coarsen(x=window, y=window, boundary="pad").mean()
+
+    def peakmem_coarsen_with_padding(self):
+        """Peak memory for coarsening with padding on both dimensions."""
+        self.da_padded.coarsen(x=window, y=window, boundary="pad").mean()
+
+    def peakmem_coarsen_no_padding(self):
+        """Peak memory for coarsening without padding."""
+        self.da_exact.coarsen(x=window, y=window, boundary="pad").mean()
diff --git a/xarray/core/variable.py b/xarray/core/variable.py
index 72a3fbb9402..12bea89e1e0 100644
--- a/xarray/core/variable.py
+++ b/xarray/core/variable.py
@@ -2280,6 +2280,7 @@ def coarsen_reshape(self, windows, boundary, side):
                 )
 
         variable = self
+        pad_widths = {}
         for d, window in windows.items():
             # trim or pad the object
             size = variable.shape[self._get_axis_num(d)]
@@ -2300,16 +2301,16 @@ def coarsen_reshape(self, windows, boundary, side):
                 pad = window * n - size
                 if pad < 0:
                     pad += window
-                if side[d] == "left":
-                    pad_width = {d: (0, pad)}
-                else:
-                    pad_width = {d: (pad, 0)}
-                variable = variable.pad(pad_width, mode="constant")
+                elif pad == 0:
+                    continue
+                pad_widths[d] = (0, pad) if side[d] == "left" else (pad, 0)
             else:
                 raise TypeError(
                     f"{boundary[d]} is invalid for boundary. Valid option is 'exact', "
                    "'trim' and 'pad'"
                 )
+        if pad_widths:
+            variable = variable.pad(pad_widths, mode="constant")
 
         shape = []
         axes = []

From 9dca97ac2283edb5afdc9220028d0deecfe8ae79 Mon Sep 17 00:00:00 2001
From: Deepak Cherian
Date: Fri, 14 Nov 2025 10:27:27 -0700
Subject: [PATCH 2/2] Add whats-new

---
 doc/whats-new.rst | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/doc/whats-new.rst b/doc/whats-new.rst
index 6dcbdd1062b..cc61a0eebf6 100644
--- a/doc/whats-new.rst
+++ b/doc/whats-new.rst
@@ -51,6 +51,8 @@ Performance
 - Speedup and reduce memory usage of :py:func:`concat`. Magnitude of improvement scales
   with size of the concatenation dimension.
   By `Deepak Cherian `_. :issue:`10864` :pull:`10866`.
+- Speedup and reduce memory usage when coarsening along multiple dimensions.
+  By `Deepak Cherian `_. :pull:`10921`.
 
 Documentation
 ~~~~~~~~~~~~~