enable symbolic backward optimization with einsum_path

Fan committed Aug 15, 2019
1 parent b8a70c2 commit 3255b3e
Showing 12 changed files with 250 additions and 80 deletions.
10 changes: 5 additions & 5 deletions benchmark/python/einsum/benchmark_einsum.py
@@ -41,11 +41,11 @@ def test_np_einsum():
     print("Basic einsum: {} ms".format(cost * 1000))

     # Sub-optimal einsum
-    cost = measure_cost(500, np.einsum, *args, optimize='optimal')
-    print("Optimal einsum: {} ms".format(cost * 1000))
+    # cost = measure_cost(500, np.einsum, *args, optimize='optimal')
+    # print("Optimal einsum: {} ms".format(cost * 1000))

     # Greedy einsum
-    cost = measure_cost(500, np.einsum, *args, optimize='greedy')
+    cost = measure_cost(500, np.einsum, *args, optimize=True)
     print("Greedy einsum: {} ms".format(cost * 1000))

     print('Inner Product:')
@@ -55,7 +55,7 @@ def test_np_einsum():
     cost = measure_cost(50, np.tensordot, *args, axes=([0],[0]))
     print('Tensordot: {} ms'.format(cost * 1000))
     args = ['i, i', a, b]
-    cost = measure_cost(50, np.einsum, *args, optimize='greedy')
+    cost = measure_cost(50, np.einsum, *args, optimize=True)
     print('Greedy einsum: {} ms'.format(cost * 1000))
     cost = measure_cost(50, np.einsum, *args)
     print('Basic einsum: {} ms'.format(cost * 1000))
@@ -67,7 +67,7 @@ def test_np_einsum():
     cost = measure_cost(50, np.tensordot, *args, axes=([1],[0]))
     print('Tensordot: {} ms'.format(cost * 1000))
     args = ['ij, jk', a, b]
-    cost = measure_cost(50, np.einsum, *args, optimize='greedy')
+    cost = measure_cost(50, np.einsum, *args, optimize=True)
     print('Greedy einsum: {} ms'.format(cost * 1000))
     cost = measure_cost(50, np.einsum, *args)
     print('Basic einsum: {} ms'.format(cost * 1000))
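Note: the hunks above call a measure_cost helper defined earlier in the benchmark file, outside this diff. A minimal sketch of what such a timing helper could look like, assuming it simply averages wall-clock time over repeated calls (for asynchronous MXNet ops the caller would additionally need a synchronization such as mx.nd.waitall()):

    import time

    def measure_cost(repeat, func, *args, **kwargs):
        """Average seconds per call of func(*args, **kwargs)."""
        func(*args, **kwargs)  # warm-up so one-time setup is not timed
        start = time.time()
        for _ in range(repeat):
            func(*args, **kwargs)
        return (time.time() - start) / repeat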
16 changes: 6 additions & 10 deletions python/mxnet/ndarray/numpy/_op.py
@@ -737,10 +737,9 @@ def einsum(*operands, **kwargs):
         These are the arrays for the operation.
     out : ndarray, optional
         If provided, the calculation is done into this array.
-    optimize : {False, True, 'greedy', 'optimal'}, optional
+    optimize : {False, True}, optional
         Controls if intermediate optimization should occur. No optimization
-        will occur if False and True will default to the 'greedy' algorithm.
-        Defaults to False.
+        will occur if False.

     Returns
     -------
@@ -815,8 +814,8 @@ def einsum(*operands, **kwargs):
     memory footprint during computation.

     Typically a 'greedy' algorithm is applied which empirical tests have shown
-    returns the optimal path in the majority of cases. In some cases 'optimal'
-    will return the superlative path through a more expensive, exhaustive search.
+    returns the optimal path in the majority of cases. 'optimal' is not supported
+    for now.

     Examples
     --------
@@ -926,11 +925,8 @@ def einsum(*operands, **kwargs):
     # Basic `einsum`: ~42.22ms (benchmarked on 3.4GHz Intel Xeon.)
     >>> for iteration in range(500):
     ...     np.einsum('ijk,ilm,njm,nlk,abc->',a,a,a,a,a)
-    # Optimal `einsum`: ~0.672ms
+    # Greedy `einsum` (faster optimal path approximation): ~0.117ms
     >>> for iteration in range(500):
-    ...     np.einsum('ijk,ilm,njm,nlk,abc->',a,a,a,a,a, optimize='optimal')
-    # Greedy `einsum` (faster optimal path approximation): ~0.306ms
-    >>> for iteration in range(500):
-    ...     np.einsum('ijk,ilm,njm,nlk,abc->',a,a,a,a,a, optimize='greedy')
+    ...     np.einsum('ijk,ilm,njm,nlk,abc->',a,a,a,a,a, optimize=True)
     """
     return _einsum_path_util._einsum('ndarray', *operands, **kwargs)
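With the revised docstring, the ndarray frontend treats optimize as a boolean toggle. A short usage sketch, assuming an MXNet build with the numpy interface enabled via npx.set_np() (shapes follow the docstring example above):

    from mxnet import np, npx
    npx.set_np()  # enable NumPy-compatible array semantics

    a = np.ones(64).reshape(2, 4, 8)
    # Same multi-operand contraction as the docstring benchmark above:
    # optimize=True computes a greedy contraction path first, replacing
    # one large joint loop with a sequence of cheap pairwise contractions.
    out = np.einsum('ijk,ilm,njm,nlk,abc->', a, a, a, a, a, optimize=True)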
16 changes: 6 additions & 10 deletions python/mxnet/numpy/multiarray.py
@@ -1908,10 +1908,9 @@ def einsum(*operands, **kwargs):
         These are the arrays for the operation.
     out : ndarray, optional
         If provided, the calculation is done into this array.
-    optimize : {False, True, 'greedy', 'optimal'}, optional
+    optimize : {False, True}, optional
         Controls if intermediate optimization should occur. No optimization
-        will occur if False and True will default to the 'greedy' algorithm.
-        Defaults to False.
+        will occur if False.

     Returns
     -------
@@ -1986,8 +1985,8 @@ def einsum(*operands, **kwargs):
     memory footprint during computation.

     Typically a 'greedy' algorithm is applied which empirical tests have shown
-    returns the optimal path in the majority of cases. In some cases 'optimal'
-    will return the superlative path through a more expensive, exhaustive search.
+    returns the optimal path in the majority of cases. 'optimal' is not supported
+    for now.

     Examples
     --------
@@ -2097,11 +2096,8 @@ def einsum(*operands, **kwargs):
     # Basic `einsum`: ~42.22ms (benchmarked on 3.4GHz Intel Xeon.)
     >>> for iteration in range(500):
     ...     np.einsum('ijk,ilm,njm,nlk,abc->',a,a,a,a,a)
-    # Optimal `einsum`: ~0.672ms
+    # Greedy `einsum` (faster optimal path approximation): ~0.117ms
     >>> for iteration in range(500):
-    ...     np.einsum('ijk,ilm,njm,nlk,abc->',a,a,a,a,a, optimize='optimal')
-    # Greedy `einsum` (faster optimal path approximation): ~0.306ms
-    >>> for iteration in range(500):
-    ...     np.einsum('ijk,ilm,njm,nlk,abc->',a,a,a,a,a, optimize='greedy')
+    ...     np.einsum('ijk,ilm,njm,nlk,abc->',a,a,a,a,a, optimize=True)
     """
     return _mx_nd_np.einsum(*operands, **kwargs)
9 changes: 4 additions & 5 deletions python/mxnet/symbol/numpy/_symbol.py
@@ -1365,10 +1365,9 @@ def einsum(*operands, **kwargs):
         These are the arrays for the operation.
     out : _Symbol, optional
         If provided, the calculation is done into this array.
-    optimize : {False, True, 'greedy', 'optimal'}, optional
+    optimize : {False, True}, optional
         Controls if intermediate optimization should occur. No optimization
-        will occur if False and True will default to the 'greedy' algorithm.
-        Defaults to False.
+        will occur if False.

     Returns
     -------
@@ -1443,8 +1442,8 @@ def einsum(*operands, **kwargs):
     memory footprint during computation.

     Typically a 'greedy' algorithm is applied which empirical tests have shown
-    returns the optimal path in the majority of cases. In some cases 'optimal'
-    will return the superlative path through a more expensive, exhaustive search.
+    returns the optimal path in the majority of cases. 'optimal' is not supported
+    for now.
     """
     return _einsum_path_util._einsum('symbol', *operands, **kwargs)

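The contraction path that this commit threads through both frontends is the same kind of object NumPy exposes via np.einsum_path. For reference only, a sketch using stock NumPy to inspect the greedy path for the contraction used in the docstrings above (the printed path values are illustrative):

    import numpy as onp  # stock NumPy, purely for illustration

    a = onp.ones(64).reshape(2, 4, 8)
    path, report = onp.einsum_path('ijk,ilm,njm,nlk,abc->',
                                   a, a, a, a, a, optimize='greedy')
    print(path)    # e.g. ['einsum_path', (0, 1), (0, 3), (0, 2), (0, 1)]
    print(report)  # per-step breakdown of scaling and FLOP savings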
2 changes: 1 addition & 1 deletion src/imperative/imperative_utils.h
@@ -274,7 +274,7 @@ inline void SetDependency(const nnvm::NodeAttrs& attrs,
     }
   }
   // relax the constraint for einsum (which needs 3) and tensordot (which needs 2)
-  CHECK_LE(ntmp, 3) << "Only support 3 temp space requests";
+  CHECK_LE(ntmp, 4) << "Only support 4 temp space requests";
 }

 // append extra resource requests for storage fallback
4 changes: 2 additions & 2 deletions src/operator/numpy/np_dot.cc
@@ -129,7 +129,7 @@ NNVM_REGISTER_OP(_np_dot)
 .set_attr<nnvm::FInferType>("FInferType", ElemwiseType<2, 1>)
 .set_attr<FResourceRequest>("FResourceRequest",
   [](const NodeAttrs& attrs) {
-    return std::vector<ResourceRequest>{ResourceRequest::kTempSpace};
+    return std::vector<ResourceRequest>(2, ResourceRequest::kTempSpace);
   })
 .set_attr<FCompute>("FCompute<cpu>", NumpyDotForward<cpu>)
 .set_attr<nnvm::FGradient>("FGradient", ElemwiseGradUseIn{"_backward_np_dot"})
@@ -142,7 +142,7 @@ NNVM_REGISTER_OP(_backward_np_dot)
 .set_attr<nnvm::TIsBackward>("TIsBackward", true)
 .set_attr<FResourceRequest>("FResourceRequest",
   [](const NodeAttrs& attrs) {
-    return std::vector<ResourceRequest>{ResourceRequest::kTempSpace};
+    return std::vector<ResourceRequest>(2, ResourceRequest::kTempSpace);
   })
 .set_attr<FCompute>("FCompute<cpu>", NumpyDotBackward<cpu>);

