Merged in r4146 from std-trunk (internal Numexpr module updated to la…

…test 1.3). git-svn-id: http://www.pytables.org/svn/pytables/PyTablesPro/trunk@4147 1b98710c-d8ec-0310-ae81-f5f2bcd8cb94
avalentino · Jun 9, 2009 · 563c6d7 · 563c6d7
1 parent 537acd7
commit 563c6d7
Show file tree

Hide file tree

Showing 22 changed files with 1,408 additions and 346 deletions.
diff --git a/LICENSES/NUMEXPR.txt b/LICENSES/NUMEXPR.txt
@@ -1,4 +1,5 @@
-Copyright (c) 2007 David M. Cooke <david.m.cooke@gmail.com>
+Copyright (c) 2007,2008  David M. Cooke <david.m.cooke@gmail.com>
+Copyright (c) 2009  Francesc Alted <faltet@pytables.org>
 
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal

diff --git a/VERSION b/VERSION
@@ -1 +1 @@
-2.2a1pro
+2.2a2pro
diff --git a/doc/xml/usersguide.xml b/doc/xml/usersguide.xml
@@ -1018,7 +1018,7 @@ python -c "import tables; tables.test()"</screen>
           <literal>grid_i</literal> and <literal>grid_j</literal>. Our
           instrumentation also can obtain the pressure and energy of the
           particle. The resolution of the pressure-gauge allows us to use a
-          simple-precision float to store <literal>pressure</literal>
+          single-precision float to store <literal>pressure</literal>
           readings, while the <literal>energy</literal> value will need a
           double-precision float. Finally, to track the particle we want to
           assign it a name to identify the kind of the particle it is and a
@@ -14498,33 +14498,47 @@ time, min/max temp, temp[n,0,0] = 9.0 0.0107500003651 9.99187469482 8.1883249282
       <emphasis>can not be overridden</emphasis>, but you can always define
       other new names for the objects you intend to use.</para>
 
-      <para>Values in a condition may have the following types: <itemizedlist>
-          <listitem>
-            <para>8-bit boolean (<literal>bool</literal>).</para>
-          </listitem>
-
-          <listitem>
-            <para>32-bit signed integer (<literal>int</literal>).</para>
-          </listitem>
+      <para>Values in a condition may have the following types:</para>
 
-          <listitem>
-            <para>64-bit signed integer (<literal>long</literal>).</para>
-          </listitem>
+      <itemizedlist>
+        <listitem>
+          <para>8-bit boolean (<literal>bool</literal>).</para>
+        </listitem>
+
+        <listitem>
+          <para>32-bit signed integer (<literal>int</literal>).</para>
+        </listitem>
+
+        <listitem>
+          <para>64-bit signed integer (<literal>long</literal>).</para>
+        </listitem>
+
+        <listitem>
+          <para>32-bit, single-precision floating point number
+            (<literal>float</literal> or <literal>float32</literal>).</para>
+        </listitem>
+
+        <listitem>
+          <para>64-bit, double-precision floating point number
+            (<literal>double</literal> or <literal>float64</literal>).</para>
+        </listitem>
+
+        <listitem>
+          <para>2x64-bit, double-precision complex number
+            (<literal>complex</literal>).</para>
+        </listitem>
 
-          <listitem>
-            <para>64-bit, double-precision floating point number
-            (<literal>float</literal>).</para>
-          </listitem>
+        <listitem>
+          <para>Raw string of bytes (<literal>str</literal>).</para>
+        </listitem>
+      </itemizedlist>
 
-          <listitem>
-            <para>2x64-bit, double-precision complex number
-            (<literal>complex</literal>).</para>
-          </listitem>
+      <para>Nevertheless, if the type passed is not among the above ones, it
+      will be silently upcasted, so you don't need to worry too much about
+      passing supported types: just pass whatever type you want and the
+      interpreter will take care of it.</para>
 
-          <listitem>
-            <para>Raw string of bytes (<literal>str</literal>).</para>
-          </listitem>
-        </itemizedlist> The types in PyTables conditions are somewhat stricter
+      <para>However, the types in PyTables conditions are somewhat stricter
       than those of Python. For instance, the <emphasis>only</emphasis> valid
       constants for booleans are <literal>True</literal> and
       <literal>False</literal>, and they are <emphasis>never</emphasis>

diff --git a/tables/_conditions_common.py b/tables/_conditions_common.py
@@ -9,7 +9,7 @@
 """
 
 import re
-from tables.numexpr.compiler import typecode_to_kind
+from tables.numexpr.necompiler import typecode_to_kind
 
 _no_matching_opcode = re.compile(r"[^a-z]([a-z]+)_([a-z]+)[^a-z]")
 # E.g. "gt" and "bfc" from "couldn't find matching opcode for 'gt_bfc'".

diff --git a/tables/_conditions_pro.py b/tables/_conditions_pro.py
@@ -10,7 +10,7 @@
 :Revision: $Id$
 """
 
-from tables.numexpr.compiler import expressionToAST, typeCompileAst
+from tables.numexpr.necompiler import expressionToAST, typeCompileAst
 from tables._conditions_common import _unsupported_operation_error
 
 

diff --git a/tables/conditions.py b/tables/conditions.py
@@ -20,7 +20,7 @@
     Evaluate a function over a record array.
 """
 
-from tables.numexpr.compiler import stringToExpression, numexpr
+from tables.numexpr.necompiler import stringToExpression, NumExpr
 from tables.utilsExtension import getNestedField
 from tables._conditions_common import _unsupported_operation_error
 from tables.utils import lazyattr
@@ -150,7 +150,7 @@ def compile_condition(condition, typemap, indexedcols, copycols):
         # See the comments in `tables.numexpr.evaluate()` for the
         # reasons of inserting copy operators for unaligned,
         # *unidimensional* arrays.
-        func = numexpr(expr, signature, copy_args=copycols)
+        func = NumExpr(expr, signature, copy_args=copycols)
     except NotImplementedError, nie:
         # Try to make this Numexpr error less cryptic.
         raise _unsupported_operation_error(nie)

diff --git a/tables/numexpr/README b/tables/numexpr/README
@@ -1,30 +1,230 @@
-Numexpr is a fast numerical expression evaluator for Numpy. With it,
+What it is Numexpr?
+===================
+
+Numexpr is a fast numerical expression evaluator for NumPy.  With it,
 expressions that operate on arrays (like "3*a+4*b") are accelerated
 and use less memory than doing the same calculation in Python.
 
-Numexpr is written by David Cooke <david.m.cooke@gmail.com> and
-Tim Hochberg <tim.hochberg@ieee.org>. Francesc Alted <faltet@pytables.com>
-contributed support for booleans and for efficient strided and unaligned array
-operations. Ivan Vilata <ivan@selidor.net> contributed support for strings.
-It is distributed under the MIT license:
 
-Copyright (c) 2007 David M. Cooke <david.m.cooke@gmail.com>
+Examples of use
+===============
+
+>>> import numpy as np
+>>> import numexpr as ne
+
+>>> a = np.arange(1e6)   # Choose large arrays
+>>> b = np.arange(1e6)
+
+>>> ne.evaluate("a + 1")   # a simple expression
+array([  1.00000000e+00,   2.00000000e+00,   3.00000000e+00, ...,
+         9.99998000e+05,   9.99999000e+05,   1.00000000e+06])
+
+>>> ne.evaluate('a*b-4.1*a > 2.5*b')   # a more complex one
+array([False, False, False, ...,  True,  True,  True], dtype=bool)
+
+>>> ne.evaluate("sin(a) + arcsinh(a/b)")   # you can also use functions
+array([        NaN,  1.72284457,  1.79067101, ...,  1.09567006,
+        0.17523598, -0.09597844])
+
+>>> s = np.array(['abba', 'abbb', 'abbcdef'])
+>>> ne.evaluate("'abba' == s")   # string arrays are supported too
+array([ True, False, False], dtype=bool)
+
+
+Datatypes supported internally
+==============================
+
+Numexpr operates internally only with the following types:
+
+    * 8-bit boolean (bool)
+    * 32-bit signed integer (int or int32)
+    * 64-bit signed integer (long or int64)
+    * 32-bit single-precision floating point number (float or float32)
+    * 64-bit, double-precision floating point number (double or float64)
+    * 2x64-bit, double-precision complex number (complex or complex128)
+    * Raw string of bytes (str)
+
+If the arrays in the expression does not match any of these types,
+they will be upcasted to one of the above types (following the usual
+type inference rules, see below).  Have this in mind when doing
+estimations about the memory consumption during the computation of
+your expressions.
+
+Also, the types in Numexpr conditions are somewhat stricter than those
+of Python.  For instance, the only valid constants for booleans are
+`True` and `False`, and they are never automatically cast to integers.
+
+
+Casting rules
+=============
+
+Casting rules in Numexpr follow closely those of NumPy.  However, for
+implementation reasons, there are some known exceptions to this rule,
+namely:
+
+    * A floating point function (e.g. `sin`) acting on `int8` or
+      `int16` types returns a `float64` type, instead of the `float32`
+      that is returned by NumPy functions.  This is mainly due to the
+      absence of native `int8` or `int16` types in Numexpr.
+
+    * In operations implying a scalar and an array, the normal rules
+      of casting are used in Numexpr, in contrast with NumPy, where
+      array types takes priority.  For example, if 'a' is an array of
+      type `float32` and 'b' is an scalar of type `float64` (or Python
+      `float` type, which is equivalent), then 'a*b' returns a
+      `float64` in Numexpr, but a `float32` in NumPy (i.e. array
+      operands take priority in determining the result type).  If you
+      need to keep the result a `float32`, be sure you use a `float32`
+      scalar too.
+
+
+Supported operators
+===================
+
+Numexpr supports the set of operators listed below:
+
+    * Logical operators: &, |, ~
+    * Comparison operators: <, <=, ==, !=, >=, >
+    * Unary arithmetic operators: -
+    * Binary arithmetic operators: +, -, *, /, **, %
+
+
+Supported functions
+===================
+
+The next are the current supported set:
+
+    * where(bool, number1, number2): number
+        Number1 if the bool condition is true, number2 otherwise.
+    * {sin,cos,tan}(float|complex): float|complex
+        Trigonometric sine, cosine or tangent.
+    * {arcsin,arccos,arctan}(float|complex): float|complex
+        Trigonometric inverse sine, cosine or tangent.
+    * arctan2(float1, float2): float
+        Trigonometric inverse tangent of float1/float2.
+    * {sinh,cosh,tanh}(float|complex): float|complex
+        Hyperbolic sine, cosine or tangent.
+    * {arcsinh,arccosh,arctanh}(float|complex): float|complex
+        Hyperbolic inverse sine, cosine or tangent.
+    * {log,log10,log1p}(float|complex): float|complex
+        Natural, base-10 and log(1+x) logarithms.
+    * {exp,expm1}(float|complex): float|complex
+        Exponential and exponential minus one.
+    * sqrt(float|complex): float|complex
+        Square root.
+    * {real,imag}(complex): float
+        Real or imaginary part of complex.
+    * complex(float, float): complex
+        Complex from real and imaginary parts.
+
+More functions can be added if you need them.
+
+
+General routines
+================
+
+  * evaluate(expression, local_dict=None, global_dict=None, **kwargs):
+  Evaluate a simple array expression element-wise.  See examples above.
+
+  * test():  Run all the tests in the test suite.
+
+  * print_versions():  Print the versions of software that numexpr relies on.
+
+
+Intel's VML specific support routines
+=====================================
+
+When compiled with Intel's VML (Vector Math Library), you will be able
+to use some additional functions for controlling its use. These are:
+
+  * set_vml_accuracy_mode(mode):  Set the accuracy for VML operations.
+
+  The `mode` parameter can take the values:
+    - 'low': Equivalent to VML_LA - low accuracy VML functions are called
+    - 'high': Equivalent to VML_HA - high accuracy VML functions are called
+    - 'fast': Equivalent to VML_EP - enhanced performance VML functions are called
+
+  This call is equivalent to the `vmlSetMode()` in the VML library.
+  See:
+
+  http://www.intel.com/software/products/mkl/docs/webhelp/vml/vml_DataTypesAccuracyModes.html
+
+  for more info on the accuracy modes.
+
+  * set_vml_num_threads(nthreads): Suggests a maximum number of
+    threads to be used in VML operations.
+
+  This function is equivalent to the call
+  `mkl_domain_set_num_threads(nthreads, MKL_VML)` in the MKL library.
+  See:
+
+  http://www.intel.com/software/products/mkl/docs/webhelp/support/functn_mkl_domain_set_num_threads.html
+
+  for more info about it.
+
+  * get_vml_version():  Get the VML/MKL library version.
+
+
+How Numexpr can achieve such a high performance?
+================================================
+
+The main reason why Numexpr achieves better performance than NumPy (or
+even than plain C code) is that it avoids the creation of whole
+temporaries for keeping intermediate results, so saving memory
+bandwidth (the main bottleneck in many computations in nowadays
+computers). Due to this, it works best with arrays that are large
+enough (typically larger than processor caches).
+
+Briefly, it works as follows. Numexpr parses the expression into its
+own op-codes, that will be used by the integrated computing virtual
+machine. Then, the array operands are split in small chunks (that
+easily fit in the cache of the CPU) and passed to the virtual
+machine. Then, the computational phase starts, and the virtual machine
+applies the op-code operations for each chunk, saving the outcome in
+the resulting array. It is worth noting that all the temporaries and
+constants in the expression are kept in the same small chunk sizes
+than the operand ones, avoiding additional memory (and most specially,
+memory bandwidth) waste.
+
+The result is that Numexpr can get the most of your machine computing
+capabilities for array-wise computations.  Just to give you an idea of
+its performance, common speed-ups with regard to NumPy are usually
+between 0.95x (for very simple expressions, like ’a + 1’) and 4x (for
+relatively complex ones, like 'a*b-4.1*a > 2.5*b'), although much
+higher speed-ups can be achieved (up to 15x can be seen in not too
+esoteric expressions) because this depends on the kind of the
+operations and how many operands participates in the expression.  Of
+course, Numexpr will perform better (in comparison with NumPy) with
+larger matrices, i.e. typically those that does not fit in the cache
+of your CPU.  In order to get a better idea on the different speed-ups
+that can be achieved for your own platform, you may want to run the
+benchmarks in the directory bench/.
+
+See more info about how Numexpr works in:
+
+http://code.google.com/p/numexpr/wiki/Overview
+
+
+Authors
+=======
+
+Numexpr was initially written by David Cooke, and extended to more
+types by Tim Hochberg.  Francesc Alted contributed support for
+booleans and simple-precision floating point types and for efficient
+strided and unaligned array operations.  Ivan Vilata contributed
+support for strings.  Gregor Thalhammer implemented the support for
+Intel VML (Vector Math Library).
+
+
+License
+=======
 
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
+Numexpr is distributed under the MIT license (see LICENSE.txt file).
 
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
 
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
 
+.. Local Variables:
+.. mode: text
+.. coding: utf-8
+.. fill-column: 70
+.. End: