ENH: support different micro chunking for different market IDs
jeffgortmaker committed Mar 10, 2023
1 parent 9d30295 commit 64e1817
Showing 2 changed files with 15 additions and 4 deletions.
12 changes: 10 additions & 2 deletions pyblp/markets/market.py
@@ -1733,9 +1733,17 @@ def generate_micro_chunks(
             probabilities_tangent_mapping: Optional[Dict[int, Array]] = None) -> (
             Iterator[Tuple[Optional[Array], Optional[Array], Optional[Dict[int, Array]]]]):
         """Generate chunks of agents for micro computations to reduce memory usage."""
+        chunks = options.micro_computation_chunks
+        if isinstance(chunks, dict):
+            chunks = chunks.get(self.t, 1)
+        if not isinstance(chunks, int) or chunks < 1:
+            raise TypeError(
+                "micro_computation_chunks must be a positive int or a dict mapping market IDs to positive ints."
+            )
+
         agent_indices_chunks = [None]
-        if options.micro_computation_chunks > 1:
-            agent_indices_chunks = np.array_split(np.arange(self.I), options.micro_computation_chunks)
+        if chunks > 1:
+            agent_indices_chunks = np.array_split(np.arange(self.I), chunks)
 
         probabilities_chunk = probabilities
         probabilities_tangent_mapping_chunk = probabilities_tangent_mapping
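For intuition, here is a minimal standalone sketch of the per-market resolution logic above. It mirrors the committed code but is not pyblp's internal API; `t`, `I`, and the market ID are illustrative placeholders:

import numpy as np

# Hypothetical option value and market state, mirroring the committed logic.
micro_computation_chunks = {'big_market': 3}
t = 'big_market'  # ID of the market currently being processed
I = 10            # number of agents in this market

chunks = micro_computation_chunks
if isinstance(chunks, dict):
    chunks = chunks.get(t, 1)  # markets absent from the dict default to one chunk

agent_indices_chunks = [None]
if chunks > 1:
    # Partition agent indices into roughly equal groups, so per-chunk arrays
    # (e.g., choice probabilities) are about 1/chunks the size.
    agent_indices_chunks = np.array_split(np.arange(I), chunks)

print([c.tolist() for c in agent_indices_chunks])
# [[0, 1, 2, 3], [4, 5, 6], [7, 8, 9]]

Because markets missing from the dictionary fall back to a single chunk, leaving the option at its default changes no estimation results.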
7 changes: 5 additions & 2 deletions pyblp/options.py
@@ -108,14 +108,17 @@
     of memory, one option is to temporarily reduce the number of markets, observations, or agents to cut down on memory
     while debugging one's code to see which micro moments are collinear with one another.
-micro_computation_chunks : `int`
+micro_computation_chunks : `int or dict`
     How finely to break up micro moment computation within each market. Computation is broken up by groups of agents
     within each market. This can help reduce the amount of memory being used by micro moments when there are a large
     number of agents and products, and especially when second choice micro moments are being used.
     By default, micro moment computation is done in one chunk for each market. To reduce memory usage without changing
     any estimation results, for example by splitting up computation into 10 chunks, use
-    ``pyblp.options. micro_computation_chunks = 10``.
+    ``pyblp.options.micro_computation_chunks = 10``.
+    If a dictionary, this should map market IDs to the number of chunks to use. For example, to only chunk computation
+    in market ID ``'big_market'``, use ``pyblp.options.micro_computation_chunks = {'big_market': 10}``.
 drop_product_fields : `bool`
     Whether to conserve memory by dropping product data fields that are not needed for market-level computation when
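Taken together, a short usage sketch of both supported forms of the option (``'big_market'`` is a hypothetical market ID that should match a value in one's product data):

import pyblp

# Split micro moment computation into 10 chunks in every market:
pyblp.options.micro_computation_chunks = 10

# Or, with this commit, chunk only one large market; all other
# markets stay in a single chunk:
pyblp.options.micro_computation_chunks = {'big_market': 10}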
