ENH: add standard benchmarking features to Results
- Run time
- Objective evaluations
- An array of contraction evaluation counts, one per objective evaluation.

This also enhances progress displays in line with the additional information being collected. Closes #2.
jeffgortmaker committed May 3, 2018
1 parent 72cdd41 commit 1980abb
Showing 5 changed files with 107 additions and 55 deletions.
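As a usage sketch, the new benchmarking attributes added here could be read off a Results object like this (assuming an already-configured Problem named `problem` and starting values `sigma`; the attribute names follow the diff below, everything else is illustrative):

    results = problem.solve(sigma, universal_display=False)
    print(results.run_time)                       # seconds the optimization routine ran
    print(results.objective_evaluations)          # number of GMM objective evaluations
    print(results.contraction_evaluations)        # ndarray of counts, one per objective evaluation
    print(results.contraction_evaluations.sum())  # total contraction evaluations in the step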
93 changes: 58 additions & 35 deletions pyblp/problem.py
@@ -187,7 +187,7 @@ def __init__(self, product_data, agent_data=None, integration=None, nonlinear_pr
self.MS = 0

def solve(self, sigma, pi=None, sigma_bounds=None, pi_bounds=None, delta=None, WD=None, WS=None, steps=2,
optimization=None, custom_display=True, error_behavior='revert', error_punishment=1, iteration=None,
optimization=None, universal_display=True, error_behavior='revert', error_punishment=1, iteration=None,
linear_fp=True, linear_costs=True, center_moments=True, se_type='robust', processes=1):
r"""Solve the problem.
@@ -250,10 +250,11 @@ def solve(self, sigma, pi=None, sigma_bounds=None, pi_bounds=None, delta=None, W
:class:`Optimization` configuration for how to solve the optimization problem in each GMM step. By default,
``Optimization('l-bfgs-b')`` is used. Routines that do not support bounds will ignore `sigma_bounds` and
`pi_bounds`. Choosing a routine that does not use analytic gradients will slow down estimation.
custom_display : `bool, optional`
Whether to output a custom display of optimization progress. If this is ``False``, the default display for
the routine configured by `optimization` will be used. Default displays may contain some extra information,
but compared to other output will look very different, so the default is ``True``.
universal_display : `bool, optional`
Whether to format optimization progress such that the display looks similar for all `optimization` routines.
Specifically, information will be displayed for each objective evaluation. If this is ``False``, the default
display for the routine configured by `optimization` will be used. Default displays may contain some extra
information, but compared to other output will look very different.
error_behavior : `str, optional`
How to handle errors when computing the objective. For example, it is common to encounter overflow when
computing :math:`\delta(\hat{\theta})` at a large :math:`\hat{\theta}`. The following behaviors are
@@ -407,16 +408,22 @@ def solve(self, sigma, pi=None, sigma_bounds=None, pi_bounds=None, delta=None, W
# define the objective function for the optimization routine, which will also store optimization progress
def objective_function(new_theta):
info = compute_step_info(new_theta, objective_function.last_info, optimization._compute_gradient)
if custom_display:
output(info.format_progress(objective_function.iterations, objective_function.smallest))
objective_function.iterations += 1
objective_function.smallest = min(objective_function.smallest, info.objective)
objective_function.objective_evaluations += 1
objective_function.contraction_evaluations.append(info.contraction_evaluations)
if universal_display:
output(info.format_progress(
step,
objective_function.objective_evaluations,
objective_function.smallest_objective
))
objective_function.smallest_objective = min(objective_function.smallest_objective, info.objective)
objective_function.last_info = info
return (info.objective, info.gradient) if optimization._compute_gradient else info.objective

# initialize optimization progress
objective_function.iterations = 1
objective_function.smallest = np.inf
objective_function.objective_evaluations = 0
objective_function.contraction_evaluations = []
objective_function.smallest_objective = np.inf
objective_function.last_info = ObjectiveInfo(
self, parameter_info, WD, WS, theta, delta, jacobian, tilde_costs
)
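The counters above live as attributes on the objective function object itself, so a stateless optimization routine can call it repeatedly while progress accumulates between calls. A minimal self-contained sketch of the same pattern, with illustrative names and a stand-in objective:

    import numpy as np

    def make_objective():
        def objective(theta):
            value = float(np.sum(np.asarray(theta) ** 2))  # stand-in for the real GMM objective
            objective.objective_evaluations += 1  # state persists across calls
            objective.smallest_objective = min(objective.smallest_objective, value)
            return value

        # initialize progress state once, before the optimizer starts calling
        objective.objective_evaluations = 0
        objective.smallest_objective = np.inf
        return objective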
@@ -426,16 +433,24 @@ def objective_function(new_theta):
output("")
start_time = time.time()
bounds = [p.bounds for p in parameter_info.unfixed]
verbose = options.verbose and not custom_display
verbose = options.verbose and not universal_display
theta = optimization._optimize(objective_function, theta, bounds, verbose=verbose)
end_time = time.time()
run_time = end_time - start_time
output("")
output(f"Completed step {step} after {output.format_seconds(end_time - start_time)}.")
output(f"Completed step {step} after {output.format_seconds(run_time)}.")

# use objective information computed at the optimal theta to compute results for the step
output(f"Computing step {step} results ...")
step_info = compute_step_info(theta, objective_function.last_info, compute_gradient=True)
results = step_info.to_results(step, center_moments, se_type)
results = step_info.to_results(
step,
run_time,
objective_function.objective_evaluations,
objective_function.contraction_evaluations,
center_moments,
se_type
)
delta = step_info.delta
jacobian = step_info.jacobian
tilde_costs = step_info.tilde_costs
@@ -466,17 +481,19 @@ def _compute_objective_info(self, parameter_info, WD, WS, error_behavior, error_
last_delta_t = last_objective_info.delta[self.products.market_ids.flat == t]
mapping[t] = [market_t, last_delta_t, parameter_info, iteration, linear_fp, compute_gradient]

# store any error classes
# store any error classes and the total number of contraction evaluations
errors = set()
contraction_evaluations = 0

# fill delta and its Jacobian market-by-market (the Jacobian will be null if the gradient isn't being computed)
delta = np.zeros((self.N, 1), dtype=options.dtype)
jacobian = np.zeros((self.N, theta.size), dtype=options.dtype)
with ParallelItems(ProblemMarket.solve, mapping, processes) as items:
for t, (delta_t, jacobian_t, errors_t) in items:
for t, (delta_t, jacobian_t, errors_t, contraction_evaluations_t) in items:
delta[self.products.market_ids.flat == t] = delta_t
jacobian[self.products.market_ids.flat == t] = jacobian_t
errors |= errors_t
contraction_evaluations += contraction_evaluations_t

# replace invalid elements in delta and its Jacobian with their last values
invalid_delta_indices = ~np.isfinite(delta)
@@ -557,8 +574,8 @@ def _compute_objective_info(self, parameter_info, WD, WS, error_behavior, error_

# structure the objective information
return ObjectiveInfo(
self, parameter_info, WD, WS, theta, delta, jacobian, tilde_costs, beta, gamma, xi, omega, objective,
gradient
self, parameter_info, WD, WS, theta, delta, jacobian, tilde_costs, beta, gamma, xi,
omega, objective, gradient, contraction_evaluations
)


@@ -802,8 +819,10 @@ class ObjectiveInfo(object):
"""Structured information about a completed iteration of the optimization routine."""

def __init__(self, problem, parameter_info, WD, WS, theta, delta, jacobian, tilde_costs, beta=None, gamma=None,
xi=None, omega=None, objective=None, gradient=None):
"""Initialize objective information. Optional parameters will not be specified in the first iteration."""
xi=None, omega=None, objective=None, gradient=None, contraction_evaluations=None):
"""Initialize objective information. Optional parameters will not be specified when preparing for the first
objective evaluation.
"""
self.problem = problem
self.parameter_info = parameter_info
self.WD = WD
@@ -818,26 +837,29 @@ def __init__(self, problem, parameter_info, WD, WS, theta, delta, jacobian, tild
self.omega = omega
self.objective = objective
self.gradient = gradient
self.contraction_evaluations = contraction_evaluations

def format_progress(self, iterations, smallest_objective):
def format_progress(self, step, objective_evaluations, smallest_objective):
"""Format optimization progress as a string. The first iteration will include the progress table header. The
smallest_objective is the smallest objective value encountered so far during optimization.
"""
lines = []
header1 = ["Objective", "Objective", "Objective", "Largest Gradient"]
header2 = ["Evaluations", "Value", "Improvement", "Magnitude"]
widths = [max(len(header1[0]), len(header2[0]))]
widths.extend([max(len(k1), len(k2), options.digits + 6) for k1, k2 in list(zip(header1, header2))[1:]])
header1 = ["GMM", "Objective", "Contraction", "Objective", "Objective", "Largest Gradient"]
header2 = ["Step", "Evaluations", "Evaluations", "Value", "Improvement", "Magnitude"]
widths = [max(len(k1), len(k2)) for k1, k2 in list(zip(header1, header2))[:3]]
widths.extend([max(len(k1), len(k2), options.digits + 6) for k1, k2 in list(zip(header1, header2))[3:]])
formatter = output.table_formatter(widths)

# if this is the first iteration, include the header
if iterations == 1:
if objective_evaluations == 1:
lines.extend([formatter(header1), formatter(header2), formatter.lines()])

# include the progress update
improved = np.isfinite(smallest_objective) and self.objective < smallest_objective
lines.append(formatter([
iterations,
step,
objective_evaluations,
self.contraction_evaluations,
output.format_number(self.objective),
output.format_number(smallest_objective - self.objective) if improved else "",
output.format_number(None if self.gradient is None else np.abs(self.gradient).max())
@@ -846,10 +868,10 @@ def format_progress(self, iterations, smallest_objective):
# combine the lines into one string
return "\n".join(lines)
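With these changes, the universal progress display looks something like the following (values are illustrative, and exact column widths depend on output.table_formatter and options.digits):

    GMM   Objective    Contraction  Objective     Objective     Largest Gradient
    Step  Evaluations  Evaluations  Value         Improvement   Magnitude
    ----  -----------  -----------  ------------  ------------  ----------------
    1     1            152          +8.34E+02                   +2.17E+01
    1     2            147          +7.91E+02     +4.30E+01     +1.65E+01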

def to_results(self, step, center_moments, se_type):
def to_results(self, step, run_time, objective_evaluations, contraction_evaluations, center_moments, se_type):
"""Convert this information about an iteration of the optimization routine into full results."""
from .results import Results
return Results(self, step, center_moments, se_type)
return Results(self, step, run_time, objective_evaluations, contraction_evaluations, center_moments, se_type)


class ProblemMarket(Market):
@@ -858,8 +880,8 @@ class ProblemMarket(Market):
def solve(self, initial_delta, parameter_info, iteration, linear_fp, compute_gradient):
"""Compute the mean utility for this market that equates market shares to observed values by solving a fixed
point problem. Then, if compute_gradient is True, compute its Jacobian with respect to theta. Finally, return a
set of any errors encountered during computation. If necessary, replace null elements in delta with their last
values before computing its Jacobian.
set of any errors encountered during computation and the number of contraction evaluations. If necessary,
replace null elements in delta with their last values before computing its Jacobian.
"""

# configure numpy to identify floating point errors
@@ -880,11 +902,11 @@ def log(x):
if linear_fp:
log_shares = log(self.products.shares)
contraction = lambda d: d + log_shares - log(self.compute_probabilities(d) @ self.agents.weights)
delta, converged = iteration._iterate(contraction, initial_delta)
delta, converged, contraction_evaluations = iteration._iterate(contraction, initial_delta)
else:
compute_probabilities = functools.partial(self.compute_probabilities, mu=np.exp(self.mu), linear=False)
contraction = lambda d: d * self.products.shares / (compute_probabilities(d) @ self.agents.weights)
exp_delta, converged = iteration._iterate(contraction, np.exp(initial_delta))
exp_delta, converged, contraction_evaluations = iteration._iterate(contraction, np.exp(initial_delta))
delta = log(exp_delta)
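# both branches apply the standard BLP contraction (additively on delta in the
# linear formulation, multiplicatively on exp(delta) otherwise); the third value
# now returned by _iterate counts how many times the contraction was evaluated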

# identify whether the fixed point converged
Expand All @@ -893,7 +915,8 @@ def log(x):

# return a null Jacobian if the gradient isn't being computed
if not compute_gradient:
return delta, np.full((self.J, parameter_info.P), np.nan, dtype=options.dtype), errors
jacobian = np.full((self.J, parameter_info.P), np.nan, dtype=options.dtype)
return delta, jacobian, errors, contraction_evaluations

# replace invalid values in delta with the last computed values before computing the Jacobian
valid_delta = delta.copy()
Expand All @@ -902,7 +925,7 @@ def log(x):

# compute the Jacobian of delta with respect to theta
jacobian = self.compute_delta_by_theta_jacobian(valid_delta, parameter_info)
return delta, jacobian, errors
return delta, jacobian, errors, contraction_evaluations
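The three-value returns used above reflect the new convention for Iteration._iterate: (value, converged, evaluations). A self-contained sketch of a counting fixed-point iterator under that convention (not the actual pyblp Iteration implementation):

    import numpy as np

    def iterate(contraction, x0, tol=1e-14, max_evaluations=5000):
        """Apply a contraction mapping until convergence, counting evaluations."""
        x, evaluations = np.asarray(x0, dtype=float), 0
        while evaluations < max_evaluations:
            x_next = contraction(x)
            evaluations += 1
            if np.max(np.abs(x_next - x)) < tol:
                return x_next, True, evaluations  # converged
            x = x_next
        return x, False, evaluations  # hit the evaluation limit

    # for example, the contraction x <- (x + 2 / x) / 2 converges to sqrt(2)
    root, converged, evaluations = iterate(lambda x: (x + 2.0 / x) / 2.0, np.array([1.0]))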

def compute_delta_by_theta_jacobian(self, delta, parameter_info):
"""Compute the Jacobian of delta with respect to theta."""
38 changes: 28 additions & 10 deletions pyblp/results.py
@@ -21,6 +21,13 @@ class Results(object):
The BLP :class:`Problem` that created these results.
step : `int`
The GMM step that created these results.
run_time : `float`
The number of seconds it took the optimization routine to finish during the GMM step that created these results.
objective_evaluations : `int`
The number of times the GMM objective was evaluated during the GMM step that created these results.
contraction_evaluations : `ndarray`
For each objective evaluation during the GMM step that created these results, the total number of times across
all markets the contraction used to compute :math:`\delta(\hat{\theta})` was evaluated.
theta : `ndarray`
Estimated unknown nonlinear parameters, :math:`\hat{\theta}`.
sigma : `ndarray`
@@ -82,7 +89,8 @@ class Results(object):
"""

def __init__(self, objective_info, step, center_moments, se_type):
def __init__(self, objective_info, step, run_time, objective_evaluations, contraction_evaluations, center_moments,
se_type):
"""Compute estimated standard errors and update weighting matrices."""
self.problem = objective_info.problem
self.WD = objective_info.WD
@@ -97,6 +105,9 @@ def __init__(self, objective_info, step, center_moments, se_type):
self.objective = objective_info.objective
self.gradient = objective_info.gradient
self.step = step
self.run_time = run_time
self.objective_evaluations = objective_evaluations
self.contraction_evaluations = np.asarray(contraction_evaluations)
self._parameter_info = objective_info.parameter_info

# construct an array of unique and sorted market IDs
@@ -125,15 +136,22 @@ def __str__(self):
sections = []

# construct a table of values
header1 = ["Objective", "Largest Gradient"]
header2 = ["Value", "Magnitude"]
widths = [max(len(k1), len(k2), options.digits + 6) for k1, k2 in zip(header1, header2)]
header1 = ["GMM", "Objective", "Total Contraction", "Objective", "Largest Gradient"]
header2 = ["Step", "Evaluations", "Evaluations", "Value", "Magnitude"]
widths = [max(len(k1), len(k2)) for k1, k2 in list(zip(header1, header2))[:3]]
widths.extend([max(len(k1), len(k2), options.digits + 6) for k1, k2 in list(zip(header1, header2))[3:]])
formatter = output.table_formatter(widths)
sections.append([
formatter(header1),
formatter(header2),
formatter.lines(),
formatter([output.format_number(self.objective), output.format_number(np.abs(self.gradient).max())])
formatter([
self.step,
self.objective_evaluations,
self.contraction_evaluations.sum(),
output.format_number(self.objective),
output.format_number(np.abs(self.gradient).max())
])
])

# construct a table of linear estimates
@@ -857,12 +875,12 @@ def solve_merger(self, firms_index, iteration, costs, prices=None):
ownership = self.get_ownership_matrix(firms_index)
jacobian = self.compute_utilities_by_prices_jacobian()
contraction = lambda p: costs + self.compute_zeta(ownership, jacobian, costs, p)
prices, converged = iteration._iterate(contraction, self.products.prices if prices is None else prices)
prices, converged = iteration._iterate(contraction, self.products.prices if prices is None else prices)[:2]

# store whether the fixed point converged
if not converged:
errors.add(exceptions.ChangedPricesConvergenceError)
return prices, errors
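Since `_iterate` now returns a third value, call sites such as `solve_merger` that need only the computed prices and the convergence flag take the first two elements with `[:2]`.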

def compute_shares(self, prices):
"""Market-specific computation for Results.compute_shares."""
