nedbat · arthurp · Jul 31, 2014 · Jul 31, 2014 · Jul 31, 2014 · Aug 2, 2014
diff --git a/LICENSE b/LICENSE
@@ -17,3 +17,53 @@ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 SOFTWARE.
+
+
+PYTHON SOFTWARE FOUNDATION LICENSE VERSION 2
+--------------------------------------------
+
+1. This LICENSE AGREEMENT is between the Python Software Foundation
+("PSF"), and the Individual or Organization ("Licensee") accessing and
+otherwise using this software ("Python") in source or binary form and
+its associated documentation.
+
+2. Subject to the terms and conditions of this License Agreement, PSF
+hereby grants Licensee a nonexclusive, royalty-free, world-wide
+license to reproduce, analyze, test, perform and/or display publicly,
+prepare derivative works, distribute, and otherwise use Python
+alone or in any derivative version, provided, however, that PSF's
+License Agreement and PSF's notice of copyright, i.e., "Copyright (c)
+2001, 2002, 2003, 2004, 2005, 2006 Python Software Foundation; All Rights
+Reserved" are retained in Python alone or in any derivative version
+prepared by Licensee.
+
+3. In the event Licensee prepares a derivative work that is based on
+or incorporates Python or any part thereof, and wants to make
+the derivative work available to others as provided herein, then
+Licensee hereby agrees to include in any such work a brief summary of
+the changes made to Python.
+
+4. PSF is making Python available to Licensee on an "AS IS"
+basis.  PSF MAKES NO REPRESENTATIONS OR WARRANTIES, EXPRESS OR
+IMPLIED.  BY WAY OF EXAMPLE, BUT NOT LIMITATION, PSF MAKES NO AND
+DISCLAIMS ANY REPRESENTATION OR WARRANTY OF MERCHANTABILITY OR FITNESS
+FOR ANY PARTICULAR PURPOSE OR THAT THE USE OF PYTHON WILL NOT
+INFRINGE ANY THIRD PARTY RIGHTS.
+
+5. PSF SHALL NOT BE LIABLE TO LICENSEE OR ANY OTHER USERS OF PYTHON
+FOR ANY INCIDENTAL, SPECIAL, OR CONSEQUENTIAL DAMAGES OR LOSS AS
+A RESULT OF MODIFYING, DISTRIBUTING, OR OTHERWISE USING PYTHON,
+OR ANY DERIVATIVE THEREOF, EVEN IF ADVISED OF THE POSSIBILITY THEREOF.
+
+6. This License Agreement will automatically terminate upon a material
+breach of its terms and conditions.
+
+7. Nothing in this License Agreement shall be deemed to create any
+relationship of agency, partnership, or joint venture between PSF and
+Licensee.  This License Agreement does not grant permission to use PSF
+trademarks or trade name in a trademark sense to endorse or promote
+products or services of Licensee, or any third party.
+
+8. By copying, installing or otherwise using Python, Licensee
+agrees to be bound by the terms and conditions of this License
+Agreement.
diff --git a/byterun/abstractvm.py b/byterun/abstractvm.py
@@ -0,0 +1,226 @@
+"""Classes to ease the abstraction of pyvm2.VirtualMachine.
+
+This module provides two classes that offer different kinds of
+abstraction. AbstractVirtualMachine abstracts operators and other magic method
+uses. AncestorTraversalVirtualMachine changes the execution order of basic
+blocks so that each executes only once.
+"""
+
+import logging
+
+
+from byterun import pycfg
+from byterun import pyvm2
+import six
+
+log = logging.getLogger(__name__)
+
+
+class AbstractVirtualMachine(pyvm2.VirtualMachine):
+    """A base class for abstract interpreters based on VirtualMachine.
+
+    AbstractVirtualMachine replaces the default metacyclic implementation of
+    operators and other operations that actually forward to a python magic
+    method with a virtual machine level attribute get and a call to the
+    returned method.
+    """
+
+    # Iterator-advance method name: "next" on Python 2, "__next__" on Python 3.
+    _next_method_name = "__next__" if six.PY3 else "next"
+
+    def __init__(self):
+        """Install VM-level wrappers for the supported binary operators."""
+        super(AbstractVirtualMachine, self).__init__()
+        # Maps each instruction suffix to the magic method implementing it.
+        binary_operator_name_mapping = dict(
+            ADD="__add__",
+            AND="__and__",
+            DIVIDE="__div__",
+            FLOOR_DIVIDE="__floordiv__",
+            LSHIFT="__lshift__",
+            MODULO="__mod__",
+            MULTIPLY="__mul__",
+            OR="__or__",
+            POWER="__pow__",
+            RSHIFT="__rshift__",
+            SUBSCR="__getitem__",
+            SUBTRACT="__sub__",
+            TRUE_DIVIDE="__truediv__",
+            XOR="__xor__",
+            )
+        # Use the above data to generate wrappers for each magic operator. This
+        # replaces the original dict since any operator that is not listed here
+        # will not work, so it is better to have it cause a KeyError.
+        self.binary_operators = dict(
+            (op, self.magic_operator(magic))
+            for op, magic in six.iteritems(binary_operator_name_mapping))
+        # TODO(ampere): Add support for unary and comparison operators
+
+    def magic_operator(self, name):
+        """Return a function(x, y) that calls x's `name` method with y."""
+        # TODO(ampere): Implement support for r-operators
+        def magic_operator_wrapper(x, y):
+            return self.call_function(self.load_attr(x, name), [y], {})
+        return magic_operator_wrapper
+
+    reversable_operators = set([
+        "__add__", "__sub__", "__mul__", "__div__", "__truediv__",
+        "__floordiv__", "__mod__", "__divmod__", "__pow__", "__lshift__",
+        "__rshift__", "__and__", "__or__", "__xor__"])
+
+    @staticmethod
+    def reverse_operator_name(name):
+        """Map e.g. "__add__" to "__radd__"; return None if not reversible."""
+        reversible = name in AbstractVirtualMachine.reversable_operators
+        return "__r" + name[2:] if reversible else None
+
+    def build_slice(self, start, stop, step):
+        """Return slice(start, stop, step); used by sliceOperator."""
+        return slice(start, stop, step)
+
+    def byte_GET_ITER(self):
+        """Pop an object and call its __iter__ method through the VM."""
+        self.push(self.load_attr(self.pop(), "__iter__"))
+        self.call_function_from_stack(0, [], {})
+
+    def byte_FOR_ITER(self, jump):
+        """Step the top iterator; on StopIteration pop it and go to `jump`."""
+        try:
+            self.push(self.load_attr(self.top(), self._next_method_name))
+            self.call_function_from_stack(0, [], {})
+            self.jump(self.frame.f_lasti)
+        except StopIteration:
+            self.pop()
+            self.jump(jump)
+
+    def byte_STORE_MAP(self):
+        """Pop map, value and key; store the pair in the map and re-push it."""
+        # pylint: disable=unbalanced-tuple-unpacking
+        the_map, val, key = self.popn(3)
+        self.store_subscr(the_map, key, val)
+        self.push(the_map)
+
+    def del_subscr(self, obj, key):
+        """Delete obj[key] by calling obj.__delitem__ through the VM."""
+        self.call_function(self.load_attr(obj, "__delitem__"), [key], {})
+
+    def store_subscr(self, obj, key, val):
+        """Set obj[key] = val by calling obj.__setitem__ through the VM."""
+        self.call_function(self.load_attr(obj, "__setitem__"), [key, val], {})
+
+    def sliceOperator(self, op):  # pylint: disable=invalid-name
+        """Execute a slice get/store/delete opcode ("...SLICE+<count>")."""
+        start, end = 0, None  # end=None is resolved to the length below
+        op, count = op[:-2], int(op[-1])
+        if count in (2, 3):
+            end = self.pop()
+        if count in (1, 3):
+            start = self.pop()
+        seq = self.pop()
+        if end is None:
+            end = self.call_function(self.load_attr(seq, "__len__"), [], {})
+        if op.startswith('STORE_'):
+            setitem = self.load_attr(seq, "__setitem__")
+            self.call_function(
+                setitem, [self.build_slice(start, end, 1), self.pop()], {})
+        elif op.startswith('DELETE_'):
+            self.call_function(self.load_attr(seq, "__delitem__"),
+                               [self.build_slice(start, end, 1)], {})
+        else:
+            self.push(self.call_function(self.load_attr(seq, "__getitem__"),
+                                         [self.build_slice(start, end, 1)], {}))
+
+    def byte_UNPACK_SEQUENCE(self, count):
+        """Pop a sequence, take `count` items from it and push them reversed."""
+        seq = self.pop()
+        itr = self.call_function(self.load_attr(seq, "__iter__"), [], {})
+        values = []
+        for _ in range(count):
+            values.append(self.call_function(
+                self.load_attr(itr, self._next_method_name), [], {}))
+        for value in reversed(values):
+            self.push(value)
+
+
+class AncestorTraversalVirtualMachine(AbstractVirtualMachine):
+    """An abstract interpreter that visits basic blocks ancestors first.
+
+    run_frame is replaced by a traversal that executes all basic blocks in
+    ancestor first order, starting with the entry block. The order is produced
+    by pycfg.BlockTable.get_ancestors_first_traversal(); see its documentation
+    for more information about it.
+
+    No attempt is made to roll back state during the traversal, so parallel
+    paths in the CFG (even those that cannot be run in the same execution) will
+    often see each other's side-effects. Effectively, the execution of each
+    basic block needs to commute with the execution of every other block it is
+    not ordered with.
+    """
+
+    def __init__(self):
+        super(AncestorTraversalVirtualMachine, self).__init__()
+        self.cfg = pycfg.CFG()
+
+    def frame_traversal_setup(self, frame):
+        """Attach a block table and an ancestors first order to a frame.
+
+        Args:
+          frame: The execution frame to update; its f_lasti must still be 0.
+        """
+        frame.block_table = self.cfg.get_block_table(frame.f_code)
+        frame.order = frame.block_table.get_ancestors_first_traversal()
+        assert frame.f_lasti == 0
+
+    def frame_traversal_next(self, frame):
+        """Advance the frame's instruction pointer along the traversal order.
+
+        As long as f_lasti lies within the block at the head of frame.order the
+        frame is left alone. Otherwise that block is dropped and f_lasti is set
+        to the beginning of the next block in the order.
+
+        Args:
+          frame: The execution frame to update.
+
+        Returns:
+          False if the traversal is done (no blocks remain in frame.order),
+          True otherwise.
+        """
+        current = frame.order[0]
+        if current.begin <= frame.f_lasti <= current.end:
+            return True
+        frame.order.pop(0)
+        if not frame.order:
+            return False
+        upcoming = frame.order[0]
+        if frame.f_lasti != upcoming.begin:
+            log.debug("natural next %d, order next %d",
+                      frame.f_lasti, upcoming.begin)
+        frame.f_lasti = upcoming.begin
+        return True
+
+    def run_frame(self, frame):
+        """Execute the basic blocks of a frame in ancestors first order.
+
+        The order is the one set up by frame_traversal_setup(); see
+        pycfg.BlockTable.get_ancestors_first_traversal(). If the last executed
+        instruction reports "exception", the stored exception is re-raised.
+
+        Args:
+          frame: The execution frame.
+
+        Returns:
+          The return value of the frame after execution.
+        """
+        self.push_frame(frame)
+        self.frame_traversal_setup(frame)
+        # TODO(ampere): Store various breaking "why"s so they can be handled
+        why = self.run_instruction()
+        while self.frame_traversal_next(frame):
+            why = self.run_instruction()
+        self.pop_frame()
+
+        # TODO(ampere): We don't really support exceptions.
+        if why == "exception":
+            six.reraise(*self.last_exception)
+
+        return self.return_value
diff --git a/byterun/execfile.py b/byterun/execfile.py
@@ -105,6 +105,7 @@ def run_python_file(filename, args, package=None):
     main_mod.__file__ = filename
     if package:
         main_mod.__package__ = package
+    # TODO(ampere): This may be incorrect if we are overriding builtins
     main_mod.__builtins__ = BUILTINS
 
     # Set sys.argv and the first path element properly.