Towards linear optimization (dual problem, sensitivity problem, output gradient) #1110

Merged: 38 commits, merged on Dec 4, 2020
Commits
1209196
add interface methods for dual model, sensitivities and gradient of o…
Oct 1, 2020
b58d6f2
add implementation for dual model, sensitivities and gradient of outp…
Oct 1, 2020
f05189e
add a simple demo script for linear optimization.
Oct 1, 2020
75c901a
edit AUTHORS
Oct 1, 2020
b5d1e03
[models] adjust interface to new _compute methods
Oct 20, 2020
7618fa2
[models] adjust StationaryModel to new _compute methods
Oct 20, 2020
b37ffb0
[models] a more pythonic way for the dual model
Oct 20, 2020
4b657f1
fix docs
Oct 20, 2020
bcbde26
[docs] add a reference
Oct 26, 2020
dde4b3a
add dual_rhs and dual_operator to StationaryModel
Oct 26, 2020
581d174
refactor d_mu computations in Model and StationaryModel
Oct 26, 2020
6b68d09
[pymordemos] also test the standard derivative without adjoint approach
Oct 26, 2020
02ac555
[models] properly cite the reference
Oct 27, 2020
aecfe12
[models] remove the "dual" of a model but keep dual_operator
Nov 2, 2020
ab65902
[model] also remove dual_operator
Nov 13, 2020
00fbe40
[models] fix docs warning
Nov 28, 2020
16a9143
[pymordemos] adapt demo to typer
Nov 28, 2020
925ed07
small fix in demo
Nov 28, 2020
8f13951
[pymordemos] last update of demo
Nov 29, 2020
0799165
[pymordemos] update demo
Nov 30, 2020
a6606c4
[models] some updates for d_mu
Nov 30, 2020
8873740
[models] some change for solve_d_mu
Nov 30, 2020
aaae7f9
[models] minor updates from requested changes
Dec 1, 2020
f262e95
[models] generalize output_d_mu for vector valued functionals and int…
Dec 2, 2020
ea0d9d6
[operators.blocks] implement d_mu for BlockOperators
Dec 2, 2020
768027c
[pymordemos] update demo
Dec 2, 2020
62571dc
[pymortests] test output_d_mu for complex and vector valued cases
Dec 2, 2020
05f0439
[models] include return_array to the compute method to avoid second f…
Dec 2, 2020
c0b41fb
[models] drop BlockOperatorBase assumption and fix some things
Dec 2, 2020
3265154
[models] avoid loop over d in output_d_mu
Dec 2, 2020
e661030
[pymordemos] remove sensitivity case since it is also tested in mu_de…
Dec 2, 2020
5267b66
[models] correct shape for the gradient
Dec 3, 2020
59b890b
[pymortest] add an example with another parameter
Dec 3, 2020
30503b0
[pymordemos] small typo
Dec 3, 2020
289330b
[models] fix doc strings
Dec 4, 2020
5e6ad6d
[pymortest] reduce computational time
Dec 4, 2020
02fc4ff
[models] change default for use_adjoint
Dec 4, 2020
6abf6dd
[pymordemos] partly align the printout
Dec 4, 2020
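Below is a minimal usage sketch of the interface this PR adds (`solve_d_mu`, `output_d_mu`). It is illustrative only: the thermal-block setup, the parameter name `'diffusion'`, and the chosen parameter values are assumptions based on pyMOR's standard demos, not part of this diff.

```python
from pymor.basic import thermal_block_problem, discretize_stationary_cg

# assumed setup: a 2x2 thermal block, discretized with linear finite elements
problem = thermal_block_problem(num_blocks=(2, 2))
fom, _ = discretize_stationary_cg(problem, diameter=1/10)

mu = fom.parameters.parse([1.0, 0.5, 0.5, 1.0])

# partial derivative of the solution w.r.t. the first component of 'diffusion'
u_d_mu = fom.solve_d_mu('diffusion', 0, mu=mu)

# gradient of the output functional w.r.t. all parameters (requires the model
# to define an output_functional, which the plain thermal block does not):
# grad = fom.output_d_mu(mu=mu, return_array=True)
```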
3 changes: 2 additions & 1 deletion AUTHORS.md
@@ -12,9 +12,10 @@
## pyMOR 2020.2

* Tim Keil, tim.keil@uni-muenster.de
* Energy product in elliptic discretizer
* energy product in elliptic discretizer
* rename estimate --> estimate_error and estimator -> error_estimator
* avoid nested Product and Lincomb Functionals and Functions
* linear optimization (dual solution, sensitivities, output gradient)

* Hendrik Kleikamp, hendrik.kleikamp@uni-muenster.de
* artificial neural networks for instationary problems
4 changes: 4 additions & 0 deletions docs/source/bibliography.rst
@@ -91,6 +91,10 @@ Bibliography
Hierarchical Approximate Proper Orthogonal Decomposition,
SIAM J. Sci. Comput. 40, A3267-A3292, 2018.

.. [HPUU09] M. Hinze, R. Pinnau, M. Ulbrich, S. Ulbrich,
Optimization with PDE constraints,
Springer Netherlands, 2009.

.. [HU18] J. Hesthaven, S. Ubbiali,
Non-intrusive reduced order modeling of nonlinear problems using neural networks,
Journal of Computational Physics, 363, pp. 55-78, 2018.
63 changes: 63 additions & 0 deletions src/pymor/models/basic.py
@@ -2,8 +2,11 @@
# Copyright 2013-2020 pyMOR developers and contributors. All rights reserved.
# License: BSD 2-Clause License (http://opensource.org/licenses/BSD-2-Clause)

import numpy as np

from pymor.algorithms.timestepping import TimeStepper
from pymor.models.interface import Model
from pymor.operators.block import BlockOperatorBase
from pymor.operators.constructions import IdentityOperator, VectorOperator, ZeroOperator
from pymor.vectorarrays.interface import VectorArray
from pymor.vectorarrays.numpy import NumpyVectorSpace
@@ -84,6 +87,66 @@ def __str__(self):
def _compute_solution(self, mu=None, **kwargs):
return self.operator.apply_inverse(self.rhs.as_range_array(mu), mu=mu)

def _compute_solution_d_mu_single_direction(self, parameter, index, solution, mu):
lhs_d_mu = self.operator.d_mu(parameter, index).apply(solution, mu=mu)
rhs_d_mu = self.rhs.d_mu(parameter, index).as_range_array(mu)
rhs = rhs_d_mu - lhs_d_mu
return self.operator.jacobian(solution, mu=mu).apply_inverse(rhs)

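For reference (standard sensitivity calculus, not part of the diff): with the state equation A(μ)[u(μ)] = f(μ), the method above solves the linearized equation

```latex
\partial_u A(\mu)[u(\mu)]\; \partial_{\mu_i} u(\mu)
  \;=\; \partial_{\mu_i} f(\mu) \;-\; \partial_{\mu_i} A(\mu)[u(\mu)],
```

where for a linear operator the Jacobian ∂_u A(μ)[u] is A(μ) itself, which is why `jacobian(solution, mu).apply_inverse(...)` is used.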
_compute_allowed_kwargs = frozenset({'use_adjoint'})

def _compute_output_d_mu(self, solution, mu, return_array=False, use_adjoint=None):
"""compute the gradient of the output functional w.r.t. the parameters

Parameters
----------
solution
Internal model state for the given |Parameter value|
mu
|Parameter value| for which to compute the gradient
return_array
if `True`, return the output gradient as a |NumPy array|.
Otherwise, return a dict of gradients for each |Parameter|.
use_adjoint
if `None` use standard approach, if `True`, use
the adjoint solution for a more efficient way of computing the gradient.
See Section 1.6.2 in [HPUU09]_ for more details.
So far, the adjoint approach is only valid for linear models.

Returns
-------
The gradient as a |NumPy array| or a dict of |NumPy arrays|.
"""
if use_adjoint is None:
use_adjoint = True if (self.output_functional.linear and self.operator.linear) else False
if not use_adjoint:
return super()._compute_output_d_mu(solution, mu, return_array)
else:
assert self.output_functional is not None
assert self.operator.linear
assert self.output_functional.linear
dual_solutions = self.operator.range.empty()
for d in range(self.output_functional.range.dim):
dual_problem = self.with_(operator=self.operator.H, rhs=self.output_functional.H.as_range_array(mu)[d])
dual_solutions.append(dual_problem.solve(mu))
gradients = [] if return_array else {}
for (parameter, size) in self.parameters.items():
array = np.empty(shape=(size,self.output_functional.range.dim))
for index in range(size):
output_partial_dmu = self.output_functional.d_mu(parameter, index).apply(solution,
mu=mu).to_numpy()[0]
lhs_d_mu = self.operator.d_mu(parameter, index).apply2(dual_solutions, solution, mu=mu)[:,0]
rhs_d_mu = self.rhs.d_mu(parameter, index).apply_adjoint(dual_solutions, mu=mu).to_numpy()[:,0]
array[index] = output_partial_dmu + rhs_d_mu - lhs_d_mu
if return_array:
gradients.extend(array)
else:
gradients[parameter] = array
if return_array:
return np.array(gradients)
else:
return gradients

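The adjoint shortcut implemented above can be checked on a tiny dense example. The following NumPy sketch (not pyMOR code; all names are invented for illustration) reproduces the formula from Section 1.6.2 of [HPUU09]: for A(μ)u = f(μ) and a linear output j(u) = lᵀu, the gradient is pᵀ(∂_μ f − ∂_μ A u) with the dual solution Aᵀp = l. The parameter-explicit part of the output functional is omitted here for brevity.

```python
import numpy as np

mu = 2.0
A = lambda m: np.array([[2.0 + m, 1.0], [1.0, 3.0 * m]])   # parametric operator
dA = np.array([[1.0, 0.0], [0.0, 3.0]])                    # dA/dmu
f = lambda m: np.array([1.0, m])                           # parametric rhs
df = np.array([0.0, 1.0])                                  # df/dmu
l = np.array([1.0, 2.0])                                   # linear output functional

u = np.linalg.solve(A(mu), f(mu))            # primal solution
p = np.linalg.solve(A(mu).T, l)              # dual (adjoint) solution
grad_adjoint = p @ (df - dA @ u)

# cross-check with the forward (sensitivity) approach used when use_adjoint=False
u_d_mu = np.linalg.solve(A(mu), df - dA @ u)
grad_forward = l @ u_d_mu
assert np.isclose(grad_adjoint, grad_forward)
```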

class InstationaryModel(Model):
"""Generic class for models of instationary problems.
174 changes: 167 additions & 7 deletions src/pymor/models/interface.py
@@ -48,9 +48,9 @@ def __init__(self, products=None, error_estimator=None, visualizer=None,

self.__auto_init(locals())

def _compute(self, solution=False, output=False,
def _compute(self, solution=False, output=False, solution_d_mu=False, output_d_mu=False,
solution_error_estimate=False, output_error_estimate=False,
mu=None, **kwargs):
output_d_mu_return_array=False, mu=None, **kwargs):
return {}

def _compute_solution(self, mu=None, **kwargs):
@@ -109,6 +109,86 @@ def _compute_output(self, solution, mu=None, **kwargs):
else:
return self.output_functional.apply(solution, mu=mu).to_numpy()

def _compute_solution_d_mu_single_direction(self, parameter, index, solution, mu=None, **kwargs):
"""Compute the partial derivative of the solution w.r.t. a parameter index

Parameters
----------
parameter
parameter for which to compute the sensitivity
index
parameter index for which to compute the sensitivity
solution
Internal model state for the given |Parameter value|.
mu
|Parameter value| for which to solve

Returns
-------
The sensitivity of the solution as a |VectorArray|.
"""
raise NotImplementedError

def _compute_solution_d_mu(self, solution, mu=None, **kwargs):
"""Compute all partial derivative of the solution w.r.t. a parameter index

Parameters
----------
solution
Internal model state for the given |Parameter value|.
mu
|Parameter value| for which to solve

Returns
-------
A dict of all partial sensitivities of the solution.
"""
sensitivities = {}
for (parameter, size) in self.parameters.items():
sens_for_param = self.solution_space.empty()
for l in range(size):
sens_for_param.append(self._compute_solution_d_mu_single_direction(
parameter, l, solution, mu))
sensitivities[parameter] = sens_for_param
return sensitivities

def _compute_output_d_mu(self, solution, mu=None, return_array=False, **kwargs):
"""compute the gradient w.r.t. the parameter of the output functional

Parameters
----------
solution
Internal model state for the given |Parameter value|.
mu
|Parameter value| for which to compute the gradient
return_array
if `True`, return the output gradient as a |NumPy array|.
Otherwise, return a dict of gradients for each |Parameter|.

Returns
-------
The gradient as a |NumPy array| or a dict of |NumPy arrays|.
"""
assert self.output_functional is not None
U_d_mus = self._compute_solution_d_mu(solution, mu)
gradients = [] if return_array else {}
for (parameter, size) in self.parameters.items():
array = np.empty(shape=(size,self.output_functional.range.dim))
for index in range(size):
output_partial_dmu = self.output_functional.d_mu(parameter, index).apply(
solution, mu=mu).to_numpy()[0]
U_d_mu = U_d_mus[parameter][index]
array[index] = output_partial_dmu + self.output_functional.jacobian(
solution, mu).apply(U_d_mu, mu).to_numpy()[0]
if return_array:
gradients.extend(array)
else:
gradients[parameter] = array
if return_array:
return np.array(gradients)
else:
return gradients

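For reference, the default assembly above is the chain rule for the output J(μ) = j(u(μ), μ): the first term is the explicit parameter derivative of the output functional, the second applies its Jacobian to the solution sensitivity (a standard identity, not part of the diff):

```latex
\partial_{\mu_i} J(\mu)
  \;=\; \partial_{\mu_i} j(u(\mu), \mu)
  \;+\; \partial_u j(u(\mu), \mu)\bigl[\partial_{\mu_i} u(\mu)\bigr]
```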
def _compute_solution_error_estimate(self, solution, mu=None, **kwargs):
"""Compute an error estimate for the computed internal state.

@@ -179,9 +259,9 @@ def _compute_output_error_estimate(self, solution, mu=None, **kwargs):

_compute_allowed_kwargs = frozenset()

def compute(self, solution=False, output=False,
solution_error_estimate=False, output_error_estimate=False, *,
mu=None, **kwargs):
def compute(self, solution=False, output=False, solution_d_mu=False, output_d_mu=False,
solution_error_estimate=False, output_error_estimate=False,
output_d_mu_return_array=False, *, mu=None, **kwargs):
"""Compute the solution of the model and associated quantities.

This method computes the output of the model, its internal state
@@ -205,10 +285,19 @@ def compute(self, solution=False, output=False,
If `True`, return the model's internal state.
output
If `True`, return the model output.
solution_d_mu
If not `False`, either `True` to return the derivative of the model's
internal state w.r.t. all parameter components or a tuple `(parameter, index)`
to return the derivative of a single parameter component.
output_d_mu
If `True`, return the gradient of the model output w.r.t. the |Parameter|.
solution_error_estimate
If `True`, return an error estimate for the computed internal state.
output_error_estimate
If `True`, return an error estimate for the computed output.
output_d_mu_return_array
if `True`, return the output gradient as a |NumPy array|.
Otherwise, return a dict of gradients for each |Parameter|.
mu
|Parameter values| for which to compute the values.
kwargs
@@ -235,12 +324,14 @@

# first call _compute to give subclasses more control
data = self._compute(solution=solution, output=output,
solution_d_mu=solution_d_mu, output_d_mu=output_d_mu,
solution_error_estimate=solution_error_estimate,
output_error_estimate=output_error_estimate,
mu=mu, **kwargs)

if (solution or output or solution_error_estimate or output_error_estimate) and \
'solution' not in data:
if (solution or output or solution_error_estimate or
output_error_estimate or solution_d_mu or output_d_mu) \
and 'solution' not in data:
retval = self.cached_method_call(self._compute_solution, mu=mu, **kwargs)
if isinstance(retval, dict):
assert 'solution' in retval
@@ -257,6 +348,29 @@
else:
data['output'] = retval

if solution_d_mu and 'solution_d_mu' not in data:
if isinstance(solution_d_mu, tuple):
retval = self._compute_solution_d_mu_single_direction(
solution_d_mu[0], solution_d_mu[1], data['solution'], mu=mu, **kwargs)
else:
retval = self._compute_solution_d_mu(data['solution'], mu=mu, **kwargs)
# retval is always a dict
if isinstance(retval, dict) and 'solution_d_mu' in retval:
data.update(retval)
else:
data['solution_d_mu'] = retval

if output_d_mu and 'output_d_mu' not in data:
# TODO use caching here (requires skipping args in key generation)
retval = self._compute_output_d_mu(data['solution'], mu=mu,
return_array=output_d_mu_return_array,
**kwargs)
# retval is always a dict
if isinstance(retval, dict) and 'output_d_mu' in retval:
data.update(retval)
else:
data['output_d_mu'] = retval

if solution_error_estimate and 'solution_error_estimate' not in data:
# TODO use caching here (requires skipping args in key generation)
retval = self._compute_solution_error_estimate(data['solution'], mu=mu, **kwargs)
@@ -349,6 +463,52 @@ def output(self, mu=None, return_error_estimate=False, **kwargs):
else:
return data['output']

def solve_d_mu(self, parameter, index, mu=None, **kwargs):
"""Solve for the partial derivative of the solution w.r.t. a parameter index

Parameters
----------
parameter
parameter for which to compute the sensitivity
index
parameter index for which to compute the sensitivity
mu
|Parameter value| for which to solve

Returns
-------
The sensitivity of the solution as a |VectorArray|.
"""
data = self.compute(
solution_d_mu=(parameter, index),
mu=mu,
**kwargs
)
return data['solution_d_mu']

def output_d_mu(self, mu=None, return_array=False, **kwargs):
"""compute the gradient w.r.t. the parameter of the output functional

Parameters
----------
mu
|Parameter value| for which to compute the gradient
return_array
if `True`, return the output gradient as a |NumPy array|.
Otherwise, return a dict of gradients for each |Parameter|.

Returns
-------
The gradient as a |NumPy array| or a dict of |NumPy arrays|.
"""
data = self.compute(
output_d_mu=True,
mu=mu,
output_d_mu_return_array=return_array,
**kwargs
)
return data['output_d_mu']

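The extended `compute` interface can also be called directly to obtain several of these quantities in one pass. A hedged sketch, reusing the assumed `fom`, `mu`, and parameter name `'diffusion'` from the example after the commit list (and assuming the model defines an `output_functional`):

```python
data = fom.compute(solution=True,
                   solution_d_mu=('diffusion', 0),   # single direction, or True for all
                   output_d_mu=True,
                   output_d_mu_return_array=True,
                   mu=mu)
u = data['solution']
u_d_mu = data['solution_d_mu']
grad = data['output_d_mu']   # NumPy array, one row per parameter index
```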
def estimate_error(self, mu=None, **kwargs):
"""Estimate the error for the computed internal state.

6 changes: 6 additions & 0 deletions src/pymor/operators/block.py
@@ -119,6 +119,12 @@ def process_col(col, space):
blocks = [process_col(col, space) for col, space in zip(self.blocks.T, subspaces)]
return self.source.make_array(blocks) if self.blocked_source else blocks[0]

def d_mu(self, parameter, index=0):
blocks = np.empty(self.blocks.shape, dtype=object)
for (i, j) in np.ndindex(self.blocks.shape):
blocks[i, j] = self.blocks[i, j].d_mu(parameter, index)
return self.with_(blocks=blocks)

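A small illustrative sketch of the new blockwise `d_mu` (the operators and parameter functional below are invented for illustration; only `d_mu` on the block operator itself comes from this PR). Each block is differentiated individually, and non-parametric blocks differentiate to zero operators:

```python
import numpy as np
from pymor.operators.block import BlockOperator
from pymor.operators.constructions import LincombOperator
from pymor.operators.numpy import NumpyMatrixOperator
from pymor.parameters.functionals import ProjectionParameterFunctional

A = NumpyMatrixOperator(np.eye(2))
B = NumpyMatrixOperator(np.ones((2, 2)))
theta = ProjectionParameterFunctional('mu', size=1, index=0)

# parametric (0, 0)-block, non-parametric remaining blocks
block_op = BlockOperator([[LincombOperator([A], [theta]), B],
                          [B, A]])

block_op_d_mu = block_op.d_mu('mu', 0)   # blockwise derivatives, same block structure
```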

class BlockOperator(BlockOperatorBase):
"""A matrix of arbitrary |Operators|.