A bit of refactoring and some bugfixes.

josiahcarlson · Sep 7, 2010 · 2231300 · 2231300
1 parent 85e4a6c
commit 2231300
Show file tree

Hide file tree

Showing 3 changed files with 421 additions and 144 deletions.
diff --git a/lib/sq_om.py b/lib/sq_om.py
@@ -26,7 +26,7 @@ def call(self, data_seq, *args, **kwargs):
         return method(self, data_seq, *args, **kwargs)
     return call
 
-def _where_clause(table_name, cols, where, kwhere, select=True):
+def _where_clause(where, kwhere):
     assert bool(where) ^ bool(kwhere) < 2, "use a list OR keywords, not both: %r %r"%(where, kwhere)
     if not where:
         where = kwhere
@@ -35,20 +35,21 @@ def _where_clause(table_name, cols, where, kwhere, select=True):
     where_clause = ''
     vals = ()
     if where:
-        colnames, vals = zip(*where)
-        compare = dict((col, '=' if isinstance(val, (list, tuple)) else '=') for col, val in where)
-        # This str(tuple(val)) shenanigans is because Python's sqlite3
-        # library doesn't know how to properly pass a tuple down through the
-        # layers for a proper 'IN' query.  :(
-        vals = tuple(str(tuple(val)) if isinstance(val, (list, tuple)) else val for val in vals)
-        where_clause = ' WHERE ' + ' AND '.join('%s %s ?'%(col, compare[col]) for col in colnames)
-    if select:
-        query = '''SELECT %s FROM %s %s;'''%(
-            ', '.join(cols), table_name, where_clause)
-    else:
-        query = '''DELETE FROM %s %s;'''%(
-            table_name, where_clause)
-    return vals, query
+        clause = []
+        vals = []
+        for col, val in where:
+            if isinstance(val, (list, tuple)):
+                # These shenanigans are because Python's sqlite3 library
+                # doesn't know how to properly pass a tuple down through the
+                # layers for a proper 'IN' query.  :(
+                val = '(%s)'%(','.join(map(repr, val)))
+                clause.append('%s IN %s'%(col, val))
+            else:
+                clause.append('%s = ?'%(col,))
+                vals.append(val)
+        vals = tuple(vals)
+        where_clause = ' WHERE ' + ' AND '.join(clause)
+    return vals, where_clause
 
 class SQLTable(object):
     indexes = ()
@@ -84,49 +85,65 @@ def insert_many(self, data, conn=None):
             '''%(self.table_name, ', '.join(self._cols), ', '.join(len(self._cols)*['?'])),
             data)
 
-    @_check_data
-    def update(self, data, uuid, conn=None):
-        conn = conn or self.db
-        return conn.execute('''
-            UPDATE OR ROLLBACK
-                %s SET %s
-            WHERE _id = ?;
-            '''%(self.table_name, ', '.join('%s = ?'%col for col in self._cols)),
-            tuple(data) + (uuid,))
-
     def select_one(self, cols, where=None, conn=None, **kwhere):
         conn = conn or self.db
-        vals, query = _where_clause(self.table_name, cols, where, kwhere)
-        for result in conn.execute(query, vals):
+        vals, query = _where_clause(where, kwhere)
+        for result in conn.execute('''SELECT %s FROM %s %s'''%(','.join(cols), self.table_name, query), vals):
             return result
         return None
 
     def select(self, cols, where=None, conn=None, **kwhere):
         conn = conn or self.db
-        vals, query = _where_clause(self.table_name, cols, where, kwhere)
+        vals, query = _where_clause(where, kwhere)
+        query = '''SELECT %s FROM %s %s'''%(','.join(cols), self.table_name, query)
         return list(conn.execute(query, vals))
 
     def delete(self, where=None, conn=None, **kwhere):
         conn = conn or self.db
-        vals, query = _where_clause(self.table_name, None, where, kwhere, select=False)
+        vals, query = _where_clause(where, kwhere)
+        query = '''DELETE FROM %s %s'''%(self.table_name, query)
+        return conn.execute(query, vals)
+
+    def update(self, to_update, where=None, conn=None, **kwhere):
+        conn = conn or self.db
+        vals, query = _where_clause(where, kwhere)
+        set = ','.join('%s=?'%(k,) for k,v in to_update)
+        query = '''UPDATE %s SET %s %s'''%(self.table_name, set, query)
+        vals = tuple(v for k,v in to_update) + vals
         return conn.execute(query, vals)
 
 class IndexInfo(SQLTable):
-    columns = 'index_id INTEGER PRIMARY KEY', 'columns TEXT UNIQUE', 'flags INTEGER', 'last_indexed FLOAT'
+    columns = 'index_id INTEGER PRIMARY KEY', 'columns TEXT UNIQUE', 'flags INTEGER', 'last_indexed INTEGER'
     table_name = '_indexes'
 
 class IndexTable(SQLTable):
     columns = 'rowid INTEGER PRIMARY KEY', 'idata BLOB', 'rowref TEXT'
     table_name = '_index'
     indexes = [
-        ['_index_idata', ('idata',), False],
-        ['_index_irowref', ('rowref',), False],
+        ('_index_idata', ('idata',), False),
+        ('_index_irowref', ('rowref',), False),
     ]
     def __init__(self, db):
         SQLTable.__init__(self, db)
         # We don't want to be inserting based on rowid, so we'll pretend it
         # doesn't exist from this side of things.
         self._cols = self._cols[1:]
+    def delete_some(self, start, end, limit=1000):
+        tc = self.db.total_changes
+        with self.db as conn:
+            # Python's sqlite may not be compiled with support for limit on
+            # delete, so we need to hack it with an initial select.
+            last = list(conn.execute('''
+                SELECT idata
+                    FROM _index
+                    WHERE idata >= ? AND idata < ?
+                    LIMIT 1 OFFSET %s'''%(limit,), (buffer(start), buffer(end))))
+            if last:
+                end = buffer(str(last[0][0]))
+            conn.execute('''
+                DELETE FROM _index
+                    WHERE idata >= ? AND idata < ?''', (buffer(start), buffer(end)))
+        return self.db.total_changes - tc
 
 @apply
 def CAN_USE_CLOCK():
@@ -136,7 +153,7 @@ def CAN_USE_CLOCK():
     the properties we require.
     '''
     clocks = [time.clock() for i in xrange(10000)]
-    return len(clocks) != len(set(clocks))
+    return len(clocks) == len(set(clocks))
 
 def _time_seq(_lt=[time.time(), 0], CAN_USE_CLOCK=CAN_USE_CLOCK):
     '''
@@ -151,38 +168,43 @@ def _time_seq(_lt=[time.time(), 0], CAN_USE_CLOCK=CAN_USE_CLOCK):
     We use this sequence as a method of defining insertion/update order for
     the rows in our data table, so that indexing operations can merely walk an
     index over the time column to discover those rows that need to be indexed.
+
+    We'll be returning these values as integers to bypass float precision
+    issues during packing/unpacking.
     '''
+    shift = float(2**22)
     if CAN_USE_CLOCK:
         # This will get us the best possible real time resolution.  Roughly
         # 1.2 microseconds resolution on a 2.4 ghz core 2 duo.
         now = time.time()
         clk = time.clock()
         while 1:
-            yield now + time.clock() - clk
+            yield int(shift * (now + time.clock() - clk))
     else:
         # This will give us up to 4096 insertions per millisecond, which
         # should be sufficient for platforms with a shoddy time.clock().
         # This also ends up being the resolution of IEEE 754 FP doubles with
         # the current magnitude of unix time.
         lt = _lt[0]
         i = _lt[1]
-        shift = float(2**22)
         while 1:
             t = time.time()
             if t != lt:
                 i = 0
                 lt = _lt[0] = t
-            yield t + i / shift
+            yield int(shift * t + i)
             i += 1
             _lt[1] = i
 
 class DataTable(IndexTable):
-    columns = 'rowid INTEGER PRIMARY KEY', '_id TEXT UNIQUE', 'data JSON', 'last_updated FLOAT KEY'
-    indexes = ()
+    columns = 'rowid INTEGER PRIMARY KEY', '_id TEXT UNIQUE', 'data JSON', 'last_updated INTEGER UNIQUE'
     table_name = '_data'
+    indexes = ()
     def insert(self, data, conn=None):
-        return SQLTable.insert(self, (data.pop('_id'), data, time.time()), conn=conn)
+        for t in _time_seq():
+            return SQLTable.insert(self, (data.pop('_id'), data, t), conn=conn)
     def insert_many(self, data, conn=None):
         return SQLTable.insert_many(self, zip((d.pop('_id') for d in data), data, _time_seq()), conn=conn)
     def update(self, data, uuid, conn=None):
-        return SQLTable.update(self, (uuid, data, time.time()), uuid, conn=conn)
+        for t in _time_seq():
+            return SQLTable.update(self, [('data', data), ('last_updated', t)], _id=uuid, conn=conn)