tensor-compiler
diff --git a/‎sdh-docs/benchmarking/index.html‎
Lines changed: 354 additions & 0 deletions b/‎sdh-docs/benchmarking/index.html‎
Lines changed: 354 additions & 0 deletions
@@ -0,0 +1,354 @@
+<!DOCTYPE html>
+<!--[if IE 8]><html class="no-js lt-ie9" lang="en" > <![endif]-->
+<!--[if gt IE 8]><!--> <html class="no-js" lang="en" > <!--<![endif]-->
+<head>
+  <meta charset="utf-8">
+  <meta http-equiv="X-UA-Compatible" content="IE=edge">
+  <meta name="viewport" content="width=device-width, initial-scale=1.0">
+  
+  
+  <link rel="shortcut icon" href="../favicon.ico">
+  
+  <title>Guide to Benchmarking - Documentation - The Tensor Algebra Compiler (TACO)</title>
+  <link href='https://fonts.googleapis.com/css?family=Lato:400,700|Roboto+Slab:400,700|Inconsolata:400,700' rel='stylesheet' type='text/css'>
+
+  <link rel="stylesheet" href="../css/theme.css" type="text/css" />
+  <link rel="stylesheet" href="../css/theme_extra.css" type="text/css" />
+  <link rel="stylesheet" href="../css/highlight.css">
+  <link href="../extra.css" rel="stylesheet">
+  
+  <script>
+    // Current page data
+    var mkdocs_page_name = "Guide to Benchmarking";
+    var mkdocs_page_input_path = "benchmarking.md";
+    var mkdocs_page_url = "/benchmarking/index.html";
+  </script>
+  
+  <script src="../js/jquery-2.1.1.min.js"></script>
+  <script src="../js/modernizr-2.8.3.min.js"></script>
+  <script type="text/javascript" src="../js/highlight.pack.js"></script> 
+  
+</head>
+
+<body class="wy-body-for-nav" role="document">
+
+  <div class="wy-grid-for-nav">
+
+    
+    <nav data-toggle="wy-nav-shift" class="wy-nav-side stickynav">
+      <div class="wy-side-nav-search">
+        <a href="http://tensor-compiler.org" class="icon icon-home"> Tensor Algebra Compiler (TACO)</a>
+        <div role="search">
+  <form id ="rtd-search-form" class="wy-form" action="../search.html" method="get">
+    <input type="text" name="q" placeholder="Search docs" />
+  </form>
+</div>
+      </div>
+
+      <div class="wy-menu wy-menu-vertical" data-spy="affix" role="navigation" aria-label="main navigation">
+	<ul class="current">
+	  
+          
+            <li class="toctree-l1">
+		
+    <a class="" href="../index.html">Home</a>
+	    </li>
+          
+            <li class="toctree-l1">
+		
+    <span class="caption-text">Python Library</span>
+    <ul class="subnav">
+                <li class="">
+                    
+    <a class="" href="../pytensors/index.html">Defining Tensors</a>
+                </li>
+                <li class="">
+                    
+    <a class="" href="../pycomputations/index.html">Computing on Tensors</a>
+                </li>
+    </ul>
+	    </li>
+          
+            <li class="toctree-l1">
+		
+    <span class="caption-text">Example Applications</span>
+    <ul class="subnav">
+                <li class="">
+                    
+    <a class="" href="../scientific_computing/index.html">Scientific Computing: SpMV</a>
+                </li>
+                <li class="">
+                    
+    <a class="" href="../data_analytics/index.html">Data Analytics: MTTKRP</a>
+                </li>
+                <li class="">
+                    
+    <a class="" href="../machine_learning/index.html">Machine Learning: SDDMM</a>
+                </li>
+    </ul>
+	    </li>
+          
+            <li class="toctree-l1">
+		
+    <a class="" href="../optimization/index.html">Strategies for Optimization</a>
+	    </li>
+          
+            <li class="toctree-l1 current">
+		
+    <a class="current" href="index.html">Guide to Benchmarking</a>
+    <ul class="subnav">
+            
+    </ul>
+	    </li>
+          
+            <li class="toctree-l1">
+		
+    <span class="caption-text">C++ Library</span>
+    <ul class="subnav">
+                <li class="">
+                    
+    <a class="" href="../tensors/index.html">Defining Tensors</a>
+                </li>
+                <li class="">
+                    
+    <a class="" href="../computations/index.html">Computing on Tensors</a>
+                </li>
+    </ul>
+	    </li>
+          
+        </ul>
+      </div>
+      &nbsp;
+    </nav>
+
+    <section data-toggle="wy-nav-shift" class="wy-nav-content-wrap">
+
+      
+      <nav class="wy-nav-top" role="navigation" aria-label="top navigation">
+        <i data-toggle="wy-nav-top" class="fa fa-bars"></i>
+        <a href="http://tensor-compiler.org"> Tensor Algebra Compiler (taco)</a>
+      </nav>
+
+      
+      <div class="wy-nav-content">
+        <div class="rst-content">
+          <div role="navigation" aria-label="breadcrumbs navigation">
+  <ul class="wy-breadcrumbs">
+    <li><a href="../index.html">Docs</a> &raquo;</li>
+    
+      
+    
+    <li>Guide to Benchmarking</li>
+    <li class="wy-breadcrumbs-aside">
+      
+    </li>
+  </ul>
+  <hr/>
+</div>
+          <div role="main">
+            <div class="section">
+              
+                <p>The performance of Python applications that use TACO can be measured using
+Python's built-in <code>time.perf_counter</code> function with minimal changes to the
+applications.  As an example, we can benchmark the performance of the
+scientific computing application shown <a href="../scientific_computing/index.html">here</a> as
+follows:</p>
+<pre><code class="python">import pytaco as pt
+from pytaco import compressed, dense
+import numpy as np
+import time
+
+csr = pt.format([dense, compressed])
+dv  = pt.format([dense])
+
+A = pt.read(&quot;pwtk.mtx&quot;, csr)
+x = pt.from_array(np.random.uniform(size=A.shape[1]))
+z = pt.from_array(np.random.uniform(size=A.shape[0]))
+y = pt.tensor([A.shape[0]], dv)
+
+i, j = pt.get_index_vars(2)
+y[i] = A[i, j] * x[j] + z[i]
+
+# Tell TACO to generate code to perform the SpMV computation
+y.compile()
+
+# Benchmark the actual SpMV computation
+start = time.perf_counter()
+y.compute()
+end = time.perf_counter()
+
+print(&quot;Execution time: {0} seconds&quot;.format(end - start))
+</code></pre>
+
+<p>In order to accurately measure TACO's computational performance, <strong>only the
+time it takes to actually perform a computation should be measured.  The time
+it takes to generate code under the hood for performing that computation should
+not be measured</strong>, since this overhead can be quite variable but can often be
+amortized in practice.  By default though, TACO will only generate and compile
+code it needs for performing a computation immediately before it has to
+actually perform the computation.  As the example above demonstrates, by
+manually calling the result tensor's <code>compile</code> method, we can tell TACO to
+generate code needed for performing the computation before benchmarking starts,
+letting us measure only the performance of the computation itself.</p>
+<p><strong>The time it takes to construct the initial input tensors should also not be
+measured</strong>, since again this overhead can often be amortized in practice.  By
+default, <code>pytaco.read</code> and functions for converting NumPy arrays and SciPy
+matrices to TACO tensors return fully constructed tensors.  If you add nonzero
+elements to an input tensor by calling <code>insert</code> though, then <code>pack</code> must also
+be explicitly invoked before any benchmarking is done:</p>
+<pre><code class="python">import pytaco as pt
+from pytaco import compressed, dense
+import numpy as np
+import random
+import time
+
+csr = pt.format([dense, compressed])
+dv  = pt.format([dense])
+
+A = pt.read(&quot;pwtk.mtx&quot;, csr)
+x = pt.tensor([A.shape[1]], dv)
+z = pt.tensor([A.shape[0]], dv)
+y = pt.tensor([A.shape[0]], dv)
+
+# Insert random values into x and z and pack them into dense arrays
+for k in range(A.shape[1]):
+  x.insert([k], random.random())
+x.pack()
+for k in range(A.shape[0]):
+  z.insert([k], random.random())
+z.pack()
+
+i, j = pt.get_index_vars(2)
+y[i] = A[i, j] * x[j] + z[i]
+
+y.compile()
+
+start = time.perf_counter()
+y.compute()
+end = time.perf_counter()
+
+print(&quot;Execution time: {0} seconds&quot;.format(end - start))
+</code></pre>
+
+<p>TACO avoids regenerating code for performing the same computation though as
+long as the computation is redefined with the same index variables and with the
+same operand and result tensors.  Thus, if your application executes the same
+computation many times in a loop and if the computation is executed on
+sufficiently large data sets, TACO will naturally amortize the overhead
+associated with generating code for performing the computation.  In such 
+scenarios, it is acceptable to include the initial code generation overhead 
+in the performance measurement:</p>
+<pre><code class="python">import pytaco as pt
+from pytaco import compressed, dense
+import numpy as np
+import time
+
+csr = pt.format([dense, compressed])
+dv  = pt.format([dense])
+
+A = pt.read(&quot;pwtk.mtx&quot;, csr)
+x = pt.tensor([A.shape[1]], dv)
+z = pt.tensor([A.shape[0]], dv)
+y = pt.tensor([A.shape[0]], dv)
+
+for k in range(A.shape[1]):
+  x.insert([k], random.random())
+x.pack()
+for k in range(A.shape[0]):
+  z.insert([k], random.random())
+z.pack()
+
+i, j = pt.get_index_vars(2)
+
+# Benchmark the iterative SpMV computation, including overhead for 
+# generating code in the first iteration to perform the computation
+start = time.perf_counter()
+for k in range(1000):
+  y[i] = A[i, j] * x[j] + z[i]
+  y.evaluate()
+  x[i] = y[i]
+  x.evaluate()
+end = time.perf_counter()
+
+print(&quot;Execution time: {0} seconds&quot;.format(end - start))
+</code></pre>
+
+<div class="admonition warning">
+<p class="admonition-title">Warning</p>
+<p>In order to avoid regenerating code for performing a computation, the
+computation must be redefined with the exact same index variable <em>objects</em>
+and also with the exact same tensor objects for operands and result.  In
+the example above, every loop iteration redefines the computation of <code>y</code>
+and <code>x</code> using the same tensor and index variable objects costructed outside
+the loop, so TACO will only generate code to compute <code>y</code> and <code>x</code> in the
+first iteration.  If the index variables were constructed inside the loop
+though, TACO would regenerate code to compute <code>y</code> and <code>x</code> in every loop
+iteration, and the compilation overhead would not be amortized. </p>
+</div>
+<div class="admonition note">
+<p class="admonition-title">Note</p>
+<p>As a rough rule of thumb, if a computation takes on the order of seconds or
+more in total to perform across all invocations with identical operands and
+result (and is always redefined with identical index variables), then it is
+acceptable to include the overhead associated with generating code for
+performing the computation in performance measurements.</p>
+</div>
+              
+            </div>
+          </div>
+          <footer>
+  
+    <div class="rst-footer-buttons" role="navigation" aria-label="footer navigation">
+      
+        <a href="../tensors/index.html" class="btn btn-neutral float-right" title="Defining Tensors">Next <span class="icon icon-circle-arrow-right"></span></a>
+      
+      
+        <a href="../optimization/index.html" class="btn btn-neutral" title="Strategies for Optimization"><span class="icon icon-circle-arrow-left"></span> Previous</a>
+      
+    </div>
+  
+
+  <hr/>
+
+  <div role="contentinfo">
+    <!-- Copyright etc -->
+    
+  </div>
+  <script>
+    (function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+        (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+      m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+    })(window,document,'script','https://www.google-analytics.com/analytics.js','ga');
+    ga('create', 'UA-93058524-1', 'auto');
+    ga('send', 'pageview');
+  </script>
+
+  <small>Built with <a href="http://www.mkdocs.org">MkDocs</a> using a <a href="https://github.com/snide/sphinx_rtd_theme">theme</a> provided by <a href="https://readthedocs.org">Read the Docs</a>.</small>
+</footer>
+      
+        </div>
+      </div>
+
+    </section>
+
+  </div>
+
+  <div class="rst-versions" role="note" style="cursor: pointer">
+    <span class="rst-current-version" data-toggle="rst-current-version">
+      
+      
+        <span><a href="../optimization/index.html" style="color: #fcfcfc;">&laquo; Previous</a></span>
+      
+      
+        <span style="margin-left: 15px"><a href="../tensors/index.html" style="color: #fcfcfc">Next &raquo;</a></span>
+      
+    </span>
+</div>
+    <script>var base_url = '..';</script>
+    <script src="../js/theme.js"></script>
+      <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.0/MathJax.js?config=TeX-AMS-MML_HTMLorMML"></script>
+      <script src="../search/require.js"></script>
+      <script src="../search/search.js"></script>
+
+</body>
+</html>