pantsbuild · cosmicexplorer · Jan 23, 2019 · Jan 23, 2019 · jsirois · Jan 23, 2019
diff --git a/src/python/pants/backend/jvm/tasks/jvm_compile/rsc/rsc_compile.py b/src/python/pants/backend/jvm/tasks/jvm_compile/rsc/rsc_compile.py
@@ -182,7 +182,6 @@ def register_options(cls, register):
       ]
     )
 
-  # TODO: allow @memoized_method to convert lists into tuples so they can be hashed!
   @memoized_property
   def _nailgunnable_combined_classpath(self):
     """Register all of the component tools of the rsc compile task as a "combined" jvm tool.

diff --git a/src/python/pants/util/BUILD b/src/python/pants/util/BUILD
@@ -88,6 +88,7 @@ python_library(
   name = 'memo',
   sources = ['memo.py'],
   dependencies = [
+      '3rdparty/python/twitter/commons:twitter.common.collections',
       ':meta'
   ],
 )

diff --git a/src/python/pants/util/memo.py b/src/python/pants/util/memo.py
@@ -8,6 +8,8 @@
 import inspect
 from contextlib import contextmanager
 
+from twitter.common.collections import OrderedSet
+
 from pants.util.meta import classproperty, staticproperty
 
 
@@ -24,6 +26,44 @@ def equal_args(*args, **kwargs):
   return key
 
 
+def coercing_arg_normalizer(type_coercions, base_normalizer, args, kwargs):
+  """Build a key with `base_normalizer`, then apply any specified coercions to its elements.
+
+  :param dict type_coercions: Map of type -> 1-arg function. An element of the base key whose
+                              exact type (subclasses do not match) is in this map is replaced
+                              by the result of calling the mapped function on it.
+  :param func base_normalizer: A key factory like `equal_args`. It is called with `*args` and
+                               `**kwargs`; only the top-level elements of its result are coerced.
+  :rtype: tuple
+  """
+  args_key = base_normalizer(*args, **kwargs)
+  coerced = []
+  for arg in args_key:
+    arg_type = type(arg)
+    coercing_function = type_coercions.get(arg_type, None)
+    if coercing_function:
+      arg = coercing_function(arg)
+    coerced.append(arg)
+  return tuple(coerced)
+
+
+collection_coercions = {  # type -> coercion used by the coerce_collections* key factories.
+  list: tuple,
+  OrderedSet: tuple,
+}
+
+
+def coerce_collections(*args, **kwargs):
+  """Generate a key based off of arguments like `equal_args`, coercing ordered collections to tuple.
+
+  `list` and `OrderedSet` are mutable, so Python does not allow them to be hashed. Because this
+  key factory converts arguments of those types to tuple (a hashable type) before they are entered
+  in the cache, memoized functions using it can accept a greater range of inputs.
+  """
+  return coercing_arg_normalizer(type_coercions=collection_coercions, base_normalizer=equal_args,
+                                 args=args, kwargs=kwargs)
+
+
 class InstanceKey(object):
   """An equality wrapper for an arbitrary object instance.
 
@@ -58,6 +98,12 @@ def per_instance(*args, **kwargs):
   return equal_args(*instance_and_rest, **kwargs)
 
 
+def coerce_collections_per_instance(*args, **kwargs):
+  """Like `coerce_collections`, but uses `per_instance` to build the base key."""
+  return coercing_arg_normalizer(type_coercions=collection_coercions, base_normalizer=per_instance,
+                                 args=args, kwargs=kwargs)
+
+
 def memoized(func=None, key_factory=equal_args, cache_factory=dict):
   """Memoizes the results of a function call.
 

diff --git a/tests/python/pants_test/util/test_memo.py b/tests/python/pants_test/util/test_memo.py
@@ -4,12 +4,16 @@
 
 from __future__ import absolute_import, division, print_function, unicode_literals
 
+import re
 import unittest
 from builtins import object
 
-from pants.util.memo import (memoized, memoized_classmethod, memoized_classproperty,
-                             memoized_method, memoized_property, memoized_staticmethod,
-                             memoized_staticproperty, per_instance, testable_memoized_property)
+from twitter.common.collections import OrderedSet
+
+from pants.util.memo import (coerce_collections, coerce_collections_per_instance, memoized,
+                             memoized_classmethod, memoized_classproperty, memoized_method,
+                             memoized_property, memoized_staticmethod, memoized_staticproperty,
+                             per_instance, testable_memoized_property)
 
 
 class MemoizeTest(unittest.TestCase):
@@ -354,3 +358,48 @@ def calls(self):
 
     self.assertEqual(4, foo2.calls)
     self.assertEqual(4, foo2.calls)
+
+  def test_collection_coercion(self):
+    @memoized
+    def f(x):
+      return sum(x)
+    with self.assertRaisesRegexp(TypeError, re.escape("unhashable type: 'list'")):
+      f([3, 4])
+
+    g_called = self._Called(increment=1)
+    @memoized(key_factory=coerce_collections)
+    def g(x):
+      g_called._called()
+      return sum(x)
+    x = [3, 4]
+    # coerce_collections keys the list x as a tuple, so these two calls invoke g only once.
+    self.assertEqual(7, g(tuple(x)))
+    self.assertEqual(7, g(x))
+    x[0] = 2  # The mutated list maps to a new tuple key, so the next call invokes g again.
+    self.assertEqual(6, g(x))
+    # An OrderedSet with the same elements coerces to the same tuple key as the previous call,
+    # so this should not increase the call count.
+    self.assertEqual(6, g(OrderedSet(x)))
+    self.assertEqual(2, g_called._calls)
+
+    class C(self._Called):
+      def __init__(self):
+        super(C, self).__init__(increment=1)
+
+      @memoized_method
+      def f(self, x):
+        return sum(x)
+
+      @memoized(key_factory=coerce_collections_per_instance)
+      def g(self, x):
+        self._called()
+        return sum(x)
+    c = C()
+    x = [3, 4]
+    with self.assertRaisesRegexp(TypeError, re.escape("unhashable type: 'list'")):
+      c.f(x)
+    self.assertEqual(7, c.f(tuple(x)))
+    self.assertEqual(7, c.g(x))
+    x[0] = 2
+    self.assertEqual(6, c.g(x))
+    self.assertEqual(2, c._calls)