diff --git a/SublimeREPL.sublime-settings b/SublimeREPL.sublime-settings
index b1a5b9ca..133d508e 100644
--- a/SublimeREPL.sublime-settings
+++ b/SublimeREPL.sublime-settings
@@ -1,4 +1,5 @@
 {
     "win_cmd_encoding": "cp1250",
-    "default_extend_env": {}
+    "default_extend_env": {},
+    "persistent_history_enabled": true
 }
\ No newline at end of file
diff --git a/buzhug/LICENSE b/buzhug/LICENSE
new file mode 100644
index 00000000..ea429199
--- /dev/null
+++ b/buzhug/LICENSE
@@ -0,0 +1,24 @@
+Copyright (c) 2010, Pierre Quentel
+All rights reserved.
+
+Redistribution and use in source and binary forms, with or without
+modification, are permitted provided that the following conditions are met:
+    * Redistributions of source code must retain the above copyright
+      notice, this list of conditions and the following disclaimer.
+    * Redistributions in binary form must reproduce the above copyright
+      notice, this list of conditions and the following disclaimer in the
+      documentation and/or other materials provided with the distribution.
+    * Neither the name of the <organization> nor the
+      names of its contributors may be used to endorse or promote products
+      derived from this software without specific prior written permission.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
+ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
+WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+DISCLAIMED. IN NO EVENT SHALL <COPYRIGHT HOLDER> BE LIABLE FOR ANY
+DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
+(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
+LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
+ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
+SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
\ No newline at end of file
diff --git a/buzhug/__init__.py b/buzhug/__init__.py
new file mode 100644
index 00000000..d0f03242
--- /dev/null
+++ b/buzhug/__init__.py
@@ -0,0 +1 @@
+from buzhug import *
diff --git a/buzhug/buzhug.py b/buzhug/buzhug.py
new file mode 100644
index 00000000..d9585af7
--- /dev/null
+++ b/buzhug/buzhug.py
@@ -0,0 +1,1170 @@
+"""Pure-Python database engine
+
+Licence : BSD
+Author : Pierre Quentel (pierre.quentel@gmail.com)
+
+Access by list comprehension or generator expression or select
+
+Syntax overview :
+    from buzhug import Base
+    db = Base('dummy')
+    db.create(('name',str),('age',int),('birthday',date))
+    db.open()
+
+    db.insert(name='homer',age=23,birthday=date(1994,10,7))
+    # select names for age > 20
+    # list comprehension
+    res = [ r.name for r in db if r.age > 20 ]
+    # select method (faster)
+    res = db.select(['name'],'age > v',v=20)
+    # select for update, then update
+    recs = db.select_for_update(['name'],'age > v',v=20)
+    for record in recs:
+        db.update(record,name=record.name.upper())
+    # direct access by __id__
+    record = db[_id]
+
+    # delete a list of records
+    db.delete(selected_records)
+    # delete one record identified by id
+    del db[_id]
+
+Concurrency control : at update time the version number of the
+record is checked ; if it has changed since selecting, an exception is raised
+
+Implementation overview
+- all files are in a directory called like the base
+- in this directory there are files with general information, and one file
+  per field ("field file") ; storage format and methods for storing and
+  retrieving depend on the field type. Uses the classes in buzhug_files
+- all selections are made by "brutal" browsing of the files (no indexing) ;
+  for string fields, the very fast "for line in file" loop is used
+
+Version 0.4
+- fixed bug in delete : following inserts would make __getitem__ return
+previously deleted items
+Version 0.5 :
+- client / server mode added
+- option "mode" for the create() method
+Version 0.7 :
+- minor changes for compatibility with Python 2.3
+- method "update" on records
+Version 0.9 :
+- prevent adding a field with the same name as an existing one
+- add a close() method to close all files
+Version 1.0
+- make sort_by compatible with Python 2.3
+- support for the datetime.time types (by Nicolas Pinault)
+Version 1.1
+- implementation change for floats : this change makes existing bases with
+float fields incompatible. Use script conversion_float to upgrade
+Version 1.2
+- method close() forgot to close _id_pos and _del_rows
+- fix a bug for links to other dbs when their path has spaces
+Version 1.3
+- fix a bug in buzhug_algos when selecting by range
+Version 1.4
+- add boolean type
+- default value for fields can be specified in create() and modified by
+  set_default(field_name,default)
+- change conversion of float 0.0 (didn't preserve order for small positive
+floats)
+- move methods to manage db information to new module buzhug_info.py
+- add negative indexing. db[-1] returns the last inserted record
+Version 1.5
+- add thread-safe version class TS_Base
+- introduce syntax db(key1=value1[,key2=value2...])
+- allow an iterable of records for update
+- fix bug in Base.has_key(), UnicodeFile.from_block()
+Version 1.6
+- minor bug fix in conversion_float.py
+- add licence text
+Version 1.7
+- fix bug in thread-safe version
+Version 1.8
+- bug in select_for_update if used with a list of fields instead of None
+- bug in __init__.py
+"""
+
+import os
+import threading
+import cStringIO
+import itertools
+import token
+import tokenize
+import re
+import tempfile
+import shutil
+import urllib
+
+import time
+from datetime import date,datetime, time as dtime
+
+# compatibility with Python 2.3
+try:
+    set([1])
+except NameError:
+    from sets import Set as set
+
+from buzhug_files import *
+import buzhug_algos
+import buzhug_info
+
+version = "1.8"
+
+# ------------------------
+# The following classes are used to model the objects in the
+# database
+#
+# Each record is an instance of the class Record, which is a list
+# supporting lookup by attributes. The list of attributes is defined in the
+# class attribute 'fields', the list of the types of the attributes
+# is defined in the list 'types'. Lookup by index returns the
+# raw blocks read from the files ; lookup by attribute returns original
+# values with their type. For instance, if fields = ['age'] and
+# types = [ int ], record[0] will return a string representation
+# of the age, record.age will return the original age (an integer)
+# ------------------------
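+
+# A short hedged sketch of the two access styles described above (the
+# record id 42 is hypothetical) :
+#
+#     rec = db[42]
+#     rec[0]       # raw block for the first field, a bytestring
+#     rec.age      # decoded value with its original type, e.g. 23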
+
+class Record(list):
+    """Generic class for records"""
+
+    def __getattr__(self,k):
+        try:
+            ix = self.fields.index(k)
+        except ValueError:
+            raise AttributeError,'No attribute named %s' %k
+        try:
+            return self.db.f_decode[self.types[ix]](list.__getitem__(self,ix))
+        except:
+            print 'error for key %s type %s value %s' %(k,self.types[ix],
+                list.__getitem__(self,ix))
+            raise
+
+    def __setattr__(self,k,v):
+        try:
+            ix = self.fields.index(k)
+            self[ix] = self.db.f_encode[self.types[ix]](v)
+        except ValueError:
+            list.__setattr__(self,k,v)
+
+    def __repr__(self):
+        elts = []
+        for k in self.fields:
+            if not isinstance(getattr(self,k),unicode):
+                elts.append('%s:%s' %(k,getattr(self,k)))
+            else:
+                elts.append(('%s:%s' %(k,getattr(self,k))).encode('utf-8'))
+        return '<' + ' '.join(elts) +'>'
+
+    def update(self,**kw):
+        self.db.update(self,**kw)
+
+def makeRecordClass(db,record_class,field_names):
+    """Generate a subclass of record_class, specifying a Base instance
+    and a list of field names and types"""
+
+    class _Record(record_class):
+        pass
+
+    setattr(_Record,'db',db)
+    setattr(_Record,'fields',list(field_names))
+    setattr(_Record,'types',[ db.fields[f] for f in field_names ])
+    return _Record
+
+# -----------------------------------
+# The result of selections is an instance of ResultSet, which is a list
+# with an attribute "names" (the names of the fields specified in the
+# selection). The items in the list are instances of the class Record
+#
+# Instances of ResultSet support a method sort_by(order), which returns
+# the list sorted as specified in the string 'order'
+# -----------------------------------
+class ResultSet(list):
+
+    def __init__(self,names,_list):
+        list.__init__(self,_list)
+        self.names = names
+
+    def pp(self,width=70):
+        """pretty print"""
+        col_width = width/len(self.names)
+        fmt = '%%-%ss' %col_width
+        print '|'.join([fmt %name for name in self.names])
+        print '|'.join([fmt %('-'*col_width) for name in self.names])
+        for rec in self:
+            line = []
+            for name in self.names:
+                v = fmt %getattr(rec,name)
+                if not isinstance(getattr(rec,name),unicode):
+                    line.append(v)
+                else:
+                    line.append(v.encode('latin-1'))
+            print '|'.join(line)
+
+    def sort_by(self,order):
+        """order is a string with field names separated by + or -
+        For instance, sort_by('name + surname - age') sorts by ascending
+        name, ascending surname and descending age"""
+
+        # parse the order string
+        e = cStringIO.StringIO(order).readline
+        cond = []
+        order = '+'
+        for t in tokenize.generate_tokens(e):
+            tt = token.tok_name[t[0]]
+            ts = t[1]
+            if tt == 'OP':
+                if not ts in ['+','-']:
+                    raise SyntaxError,"Bad operator in sort condition: %s" %ts
+                order = ts
+            elif tt == 'NAME':
+                if not ts in self.names:
+                    raise ValueError,"Unknown sort field :%s" %ts
+                cond.append((self.names.index(ts),order))
+        # build the function order_func used to sort records
+        o_f = "def order_func(rec):\n"
+        o_f += "    return ["
+        elts = []
+        for (ix,order) in cond:
+            if order == '+':
+                elts.append("rec[%s]" %ix)
+            else:
+                elts.append("buzhug_algos.rev(rec[%s])" %ix)
+        o_f += ",".join(elts) +"]"
+        exec o_f in globals() # this creates the global function order_func
+
+        # apply the key
+        try:
+            self.sort(key=order_func)
+        except TypeError: # for Python 2.3
+            self.sort(lambda x,y: cmp(order_func(x),order_func(y)))
+        return self
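+
+# A hedged usage sketch of ResultSet.sort_by (the base and field names are
+# illustrative only, following the syntax documented above) :
+#
+#     recs = db.select(['name','age'],'age > c',c=20)
+#     for r in recs.sort_by('+name-age'):   # ascending name, descending age
+#         print r.name,r.age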
+
+REGEXPTYPE = type(re.compile('a'))
+
+class Pattern:
+
+    def __init__(self,pattern):
+        self.pattern = pattern
+
+    def match(self,s):
+        return self.pattern.match(s[1:-1])
+
+    def search(self,s):
+        return self.pattern.search(s[1:-1])
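+
+# Hedged sketch : a compiled regular expression passed as a select keyword
+# is wrapped in Pattern, so that match/search skip the leading flag
+# character and the trailing newline of each stored block (base and field
+# names are illustrative) :
+#
+#     import re
+#     recs = db.select(['name'],'rx.search(name)',rx=re.compile('^bu'))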
+
+# -----------------------
+# The class Base is an abstraction of the database. It supports all the
+# usual functions : create a new base, open an existing base, insert
+# a record, delete a record, select a set of records matching a condition,
+# update the values of an existing record, destroy a base
+# Each record has an integer attribute called '__id__', a unique and
+# unchangeable identifier
+# Deleted records are physically marked for deletion, but not immediately
+# removed. When many records have been deleted, they take useless place in
+# the files and slow down the queries ; the cleanup() method gets rid of them
+#
+# Record selection
+# -----------------------
+# 1. List comprehensions or generator expressions
+# A base supports iteration, allowing for queries using the Python list
+# comprehension syntax : [ r.name for r in db if r.age > 20 ]. This is the
+# most natural way to express a query and should be used when the response
+# time is not crucial. But since it requires a conversion into the original
+# values for each line in each file, it is slower than using select
+#
+# 2. The select method
+# The first argument to the select method is always the list of the fields
+# to return in the result set. If the empty list is passed, all fields are
+# returned
+# For simple requests that test equality of a set of fields to a set of
+# values, the syntax is like this :
+#     select(['name','age'],firstname = 'pierre')
+# returns the records with attributes name and age for which the first name
+# is 'pierre'
+# If the value is a 2-item list, select will return the records for which
+# the field is between these values :
+#     select(['name'],age=[30,35])
+# For more complex requests, pass the select function a string with a
+# valid Python test on the field names. For internal reasons, no literal
+# value should be included in the string ; use variable names and append
+# keyword arguments to specify their values
+# For instance :
+#     select(['name','age'],
+#         'firstname in c1 and (country == c2 or age > c3)',
+#         c1 = ('pierre','paul'),c2='France',c3=30)
+# returns the records representing the persons called 'pierre' or 'paul',
+# either from France or older than 30 years
+#
+# 3. Selection by record id
+# Returned by db[id]. The implementation makes lookup by id almost
+# immediate, regardless of the size of the file
+# -----------------------
+
+class ConflictError(Exception):
+    """Raised if trying to update a record that has changed since selection"""
+    pass
+
+class UpdateError(Exception):
+    """Raised if update is called on a record not selected for update"""
+    pass
+
+class TimeFormatError(Exception):
+    """Raised if an invalid time format is provided to set_string_format"""
+    pass
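+
+# A hedged sketch of the optimistic concurrency check (field names are
+# illustrative) : two result sets select the same record ; the first
+# update bumps __version__ on disk, so the second, stale one conflicts :
+#
+#     r1 = db.select_for_update(None,'age > c',c=20)[0]
+#     r2 = db.select_for_update(None,'age > c',c=20)[0]
+#     db.update(r1,age=r1.age+1)   # succeeds, increments __version__
+#     db.update(r2,age=0)          # raises ConflictError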
+
+
+class Base:
+
+    BLOCKSIZE = 131072
+
+    types_map = [ (int,IntegerFile),(float,FloatFile),
+        (str,StringFile),(unicode,UnicodeFile),
+        (date,DateFile),(datetime,DateTimeFile),(dtime,TimeFile),
+        (bool,BooleanFile)]
+
+    def __init__(self,basename,thread_safe=False):
+        self.name = self.__name__ = basename
+        self.types = {} # key = data class name, value = data class
+        self.file_types = {} # key = data class, value = file class
+        self.f_encode = {} # key = data class, value = function to_block
+        self.f_decode = {} # key = data class, value = function from_block
+        self.info_name = os.path.join(basename,'__info__')
+        self.pos_name = os.path.join(basename,'__pos__')
+        for (c_obj,c_file) in self.types_map:
+            self._register_class(c_obj,c_file)
+        # from_string[_class] is the function used to convert a string
+        # into an instance of _class
+        self.from_string = { str:lambda x:x, int:int,
+            float:float}
+        # class used for the records. Default is Record, but it can
+        # be changed by set_record_class()
+        self.record_class = Record
+
+    def set_record_class(self,record_class):
+        """Set the base class for records"""
+        self.record_class = record_class
+        self._full_rec = makeRecordClass(self,self.record_class,
+            self.field_names)
+
+    def _register_class(self,class_obj,class_file):
+        """Register a data type
+        class_obj is the data class (eg int)
+        class_file is the class used to manage the file that holds
+        the data of this class (eg IntegerFile in buzhug_files)
+        """
+        self.types.update({class_obj.__name__:class_obj})
+        self.file_types.update({ class_obj:class_file })
+        self.f_encode.update({class_obj:class_file().to_block})
+        self.f_decode.update({class_obj:class_file().from_block})
+
+    def _register_base(self,base):
+        """Register another base for external references"""
+        class ExtFile(ExternalFile):
+            pass
+        setattr(ExtFile,'db',base)
+        self._register_class(base,ExtFile)
+
+    def create(self,*fields,**kw):
+        """Creates a database instance and returns a reference to it
+        fields are tuples (field_name,field_type[,default_value])
+        field_name must not begin by _
+        field_type can be one of the values in the dictionary self.types
+        A keyword 'mode' can be specified:
+            'override' : if the base already exists, remove it and create
+                a new one
+            'open' : if the base already exists, open it
+        If mode is not set and the base exists, raise IOError
+        In any case, if a directory of the same name exists but holds no
+        base info file, raise IOError
+        """
+        mode = kw.get('mode',None)
+        if os.path.exists(self.name):
+            if os.path.exists(self.info_name):
+                if mode == 'override':
+                    pass
+                elif mode == 'open':
+                    return self.open()
+                else:
+                    raise IOError,"Base %s already exists" %self.name
+            else:
+                if mode != 'open':
+                    raise IOError,"Directory %s already exists" %self.name
+                else:
+                    raise IOError,"Mode 'open' : " \
+                        "Directory %s already exists but no info file found" \
+                        %self.name
+
+        self.field_names = [ f[0] for f in fields ]
+        self.fields = dict([(f[0],f[1]) for f in fields])
+        # set general info about field definition
+        buzhug_info.set_info(self,fields)
+
+        self.field_names = ['__id__','__version__'] + self.field_names
+        self.fields['__id__'] = int
+        self.fields['__version__'] = int
+        # create the directory used for the base
+        if not os.path.exists(self.name):
+            os.mkdir(self.name)
+        # create index file
+        self._id_pos = IntegerFile(self.name,'_id_pos').create()
+        # create positions file
+        open(self.pos_name,'wb').close()
+        self._pos = PositionFile(self).create()
+        # create the file holding a list of the deleted rows (the line number
+        # of deleted records in field files)
+        self._del_rows = DeletedRowsFile(self.name,"__del_rows__").create()
+        # create field files abstractions
+        self._file = {}
+        for f in self.field_names:
+            self._file[f] = self.file_types[self.fields[f]](self.name,f)
+            self._file[f].create()
+        # save information in files __info__ and __defaults__
+        buzhug_info.save_info(self)
+        # create class for records with all values set
+        self._full_rec = makeRecordClass(self,self.record_class,
+            self.field_names)
+        return self
+
+    def open(self):
+        """Open an existing database and return a reference to it
+        Raise IOError if no base is found for the path entered in __init__
+        """
+        if not os.path.exists(self.name) or not os.path.isdir(self.name):
+            raise IOError,"Base %s doesn't exist" %self.name
+        try:
+            _info = open(self.info_name,'rb')
+        except IOError:
+            raise IOError,"No buzhug base in directory %s" %self.name
+        return self._open(_info)
+
+    def _open(self,info):
+        fields = [ f.split(':',1) for f in info.read().split() ]
+        info.close()
+        self.fields = {}
+        for (k,v) in fields:
+            if v.startswith('<base>'):
+                # reference to an external base
+                base_path = urllib.unquote(v[6:])
+                ext_db = Base(base_path).open()
+                self._register_base(ext_db)
+                self.fields[k] = ext_db
+            else:
+                self.fields[k] = self.types[v]
+        self.field_names = [ k for (k,v) in fields ]
+        self.encode = dict([(k,self.f_encode[self.fields[k]])
+            for k in self.field_names])
+        self.decode = dict([(k,self.f_decode[self.fields[k]])
+            for k in self.field_names])
+        self._open_files()
+        # read default values
+        self.defaults = buzhug_info.read_defaults(self)
+        return self
+
+    def _open_files(self):
+        self._file = {}
+        for f in self.field_names:
+            self._file[f] = self.file_types[self.fields[f]](self.name,f)
+            self._file[f].open()
+        self._id_pos = IntegerFile(self.name,'_id_pos').open()
+        self._pos = PositionFile(self).open()
+        self._del_rows = DeletedRowsFile(self.name,"__del_rows__").open()
+        self._full_rec = makeRecordClass(self,self.record_class,
+            self.field_names)
+
+    def close(self):
+        """Close all files"""
+        for f in self._file.values():
+            f.close()
+        self._pos.close()
+        self._id_pos.close()
+        self._del_rows.close()
+
+    def destroy(self):
+        """Destroy an existing base"""
+        for dirpath,dirnames,filenames in os.walk(self.name):
+            for filename in filenames:
+                os.remove(os.path.join(dirpath,filename))
+        os.rmdir(self.name)
+
+    def set_default(self,field_name,default):
+        """Set a default value for a field"""
+        fields = []
+        for f in self.field_names[2:]:
+            if f==field_name:
+                fields.append((f,self.fields[f],default))
+            elif self.defaults[f] is None:
+                fields.append((f,self.fields[f]))
+            else:
+                fields.append((f,self.fields[f],self.defaults[f]))
+        buzhug_info.set_info(self,fields)
+
+    def insert(self,*args,**kw):
+        """Public method to insert a record
+        Data can be entered as a list of values ordered like in create(),
+        or as keyword arguments
+        Explicit setting of the id and version is forbidden
+        If some of the fields are missing the value is set to None
+        Return the identifier of the newly inserted record
""" + if args and kw: + raise SyntaxError,"Can't use both positional and keyword arguments" + if args: + # insert a list of values ordered like in the base definition + if not len(args) == len(self.field_names)-2: + raise TypeError,"Expected %s arguments, found %s" \ + %(len(self.field_names)-2,len(args)) + return self.insert(**dict(zip(self.field_names[2:],args))) + if '__id__' in kw.keys(): + raise NameError,"Specifying the __id__ is not allowed" + if '__version__' in kw.keys(): + raise NameError,"Specifying the __version__ is not allowed" + rec = dict([(f,self.defaults[f]) for f in self.field_names[2:]]) + for (k,v) in kw.iteritems(): + self._validate(k,v) + rec[k] = v + # initial version = 0 + rec['__version__'] = 0 + # get position in field files + pos = [ self._file[f].get_end_pos() for f in self.field_names ] + # insert values in field files for field names except __id__ + for f in self.field_names[1:]: + self._file[f].insert(rec[f]) + # insert positions in the position file + _id,line_num = [ int(v) for v in self._pos.insert(pos) ] + # insert id value in file __id__ + self._file['__id__'].insert(_id) + # line_num is the line number in the position file + self._id_pos.insert(line_num) + return _id + + def set_string_format(self,class_,format): + """Specify the format used to convert a string into an instance + of the class. class_ can be: + - unicode : the format is the encoding + - date, datetime : format = the format string as defined in strftime + """ + if class_ is unicode: + # test encoding ; will raise LookupError if invalid + unicode('a').encode(format) + # create the conversion function bytestring -> unicode string + def _from_string(us): + return unicode(us,format) + self.from_string[unicode] = _from_string + elif class_ is date: + # test date format + d = date(1994,10,7) + t = time.strptime(d.strftime(format),format) + if not t[:3] == d.timetuple()[:3]: + raise TimeFormatError,'%s is not a valid date format' %format + else: + # create the conversion function string -> date + def _from_string(ds): + return date(*time.strptime(ds,format)[:3]) + self.from_string[date] = _from_string + elif class_ is datetime: + # test datetime format + dt = datetime(1994,10,7,8,30,15) + t = time.strptime(dt.strftime(format),format) + if not t[:6] == dt.timetuple()[:6]: + raise TimeFormatError,'%s is not a valid datetime format' \ + %format + else: + # create the conversion function string -> date + def _from_string(dts): + return datetime(*time.strptime(dts,format)[:6]) + self.from_string[datetime] = _from_string + elif class_ is dtime: + # test datetime format + dt = dtime(8,30,15) + t = time.strptime(dt.strftime(format),format) + if not t[3:6] == (dt.hour, dt.minute, dt.second): + raise TimeFormatError,'%s is not a valid datetime.time format' \ + %format + else: + # create the conversion function string -> dtime + def _from_string(dts): + return dtime(*time.strptime(dts,format)[3:6]) + self.from_string[dtime] = _from_string + else: + raise ValueError,"Can't specify a format for class %s" %class_ + + def insert_as_strings(self,*args,**kw): + """Insert a record with values provided as strings. 
They must be + converted into their original types according to the conversion + functions defined in the dictionary from_string + """ + if args and kw: + raise SyntaxError,"Can't use both positional and keyword arguments" + if args: + # insert a list of strings ordered like in the base definition + if not len(args) == len(self.field_names)-2: + raise TypeError,"Expected %s arguments, found %s" \ + %(len(self.field_names)-2,len(args)) + return self.insert_as_strings(**dict(zip(self.field_names[2:], + args))) + return self.insert(**self.apply_types(**kw)) + + def apply_types(self,**kw): + """Transform the strings in kw values to their type + Return a dictionary with the same keys and converted values""" + or_kw = {} + for k in kw.keys(): + try: + t = self.fields[k] + except KeyError: + raise NameError,"No field named %s" %k + if not self.from_string.has_key(t): + raise Exception,'No string format defined for %s' %t + else: + try: + or_kw[k] = self.from_string[t](kw[k]) + except: + raise TypeError,"Can't convert %s into %s" %(kw[k],t) + return or_kw + + def commit(self): + """Save all changes on disk""" + self.close() + self._open_files() + + def delete(self,records): + """Remove the items in the iterable records""" + if issubclass(records.__class__,Record): + # individual record + records = [records] + _ids = [ r.__id__ for r in records ] + _ids.sort() + + # mark blocks in field files as deleted + for _id in _ids: + # get the line number in the position file + _line_in_pos = self._id_pos.get_value_at_pos(_id*5) + # get the positions in field files + delete_pos = self._pos.from_block( + self._pos.get_block_at(_line_in_pos)) + # mark the items in field files as deleted + for dp,f in zip(delete_pos,self.field_names): + self._file[f].mark_as_deleted(dp) + # the line number in field files is saved in _del_rows + self._del_rows.insert(delete_pos[0]/5) + # mark line in position file as deleted + self._pos.remove(_line_in_pos) + # mark line in _id_pos as deleted + self._id_pos.mark_as_deleted(_id*5) + self._pos.deleted_lines.sort() + + def cleanup(self): + """Physically remove the deleted items in field files + This is required after many records have been deleted and + occupy useless space on disk + """ + temp_files = [tempfile.TemporaryFile() for f in self.field_names] + # count number of lines in position file + lnum = 0 + for l in self._pos: + lnum += 1 + for _id in range(lnum): + pos_block = self._pos.get_block_at(_id) + if not pos_block[0] == '#': + positions = self._pos.from_block(pos_block) + new_pos = [] + for i,f in enumerate(self.field_names): + new_pos.append(temp_files[i].tell()) + block = self._file[f].get_block_at_pos(positions[i]) + temp_files[i].write(block) + self._pos.update_positions(_id,new_pos) + + # delete old files, replace them by temp files + for i,f in enumerate(self.field_names): + self._file[f].close() + self._file[f].create() + temp_files[i].seek(0) + shutil.copyfileobj(temp_files[i],self._file[f]) + # explicitely close the temporary file + temp_files[i].close() + self.commit() + # reset deleted rows file + self._del_rows = DeletedRowsFile(self.name,"__del_rows__").create() + + def select(self,names=None,request=None,**args): + """Select the records in the base that verify a predicate and return + the specified names. 
If names is [] or None then all the fields are
+        returned
+
+        The predicate can be expressed :
+        - by a request string and keyword arguments for the values
+        - by field_name = value keywords to test equality of fields to values
+
+        Return an instance of ResultSet
+
+        Examples :
+            db.select() # return all the records in the base
+            db.select(['name']) # return the value of field name
+                                # for all the records in the base
+            db.select(None,age=30) # return the records with age = 30
+                                   # with all fields set
+            db.select(['name'],age=30) # return the same list with only the
+                                       # field 'name' set (faster)
+            db.select(['name'],'age > c',c=30) # records with age > 30 and
+                                               # only field 'name' set
+        """
+        res,names = self._select(names,request,**args)
+        return ResultSet(names,res.values())
+
+    def select_for_update(self,names=None,request=None,**args):
+        """Same syntax as select, but ensures that the field __version__
+        is returned. This field is used for concurrency control ; if
+        a user selects a record, then updates it, the program checks if the
+        version on disk is the same as the user's version ; if another
+        user has updated it in the meantime it will have changed
+
+        select_for_update takes a little more time than select, this is
+        why there are two different methods"""
+        if not names:
+            names = self.field_names
+        else:
+            names += [ f for f in ['__id__','__version__'] if not f in names ]
+        res,names = self._select(names,request,**args)
+        return ResultSet(names,res.values())
+
+    def __call__(self,**kw):
+        return self.select_for_update(**kw)
+
+    def _select(self,_names,_request,**args):
+        """Private method that performs actual selection
+        The field files are browsed line by line. A test function is built
+        to compare the raw data found in these files to the arguments
+        The arguments are first converted to a string that can be compared
+        to the raw data found in the files
+        This is much faster than converting the raw data into their
+        original type and comparing the result to the arguments
+        """
+
+        if not _names: # names unspecified or None
+            _names = self.field_names
+
+        _namespace = {}
+        if args.has_key('_namespace'):
+            _namespace = args['_namespace']
+            del args['_namespace']
+
+        # If there are regular expression objects in the keywords,
+        # transform them into instances of the class Pattern
+        # The methods match and search of these instances will return
+        # the return value of match and search applied to the string
+        # stripped from its first and last character
+        regexps = []
+        for k,v in args.iteritems():
+            if type(v) is REGEXPTYPE:
+                _namespace[k] = Pattern(v)
+                regexps.append(k)
+
+        # remove these keywords from args, they are in _namespace
+        for k in regexps:
+            del args[k]
+
+        if _request is None:
+            f_args = [ k for k in args.keys()
+                if hasattr(self._file[k],'block_len') ]
+            # if there is at least one fixed length field to search, use the
+            # fast_select algorithm
+            if f_args:
+                res,names = buzhug_algos.fast_select(self,_names,**args)
+                _Record = makeRecordClass(self,self.record_class,names)
+                for k in res.keys():
+                    res[k] = _Record(res[k])
+                return res,names
+            conds = []
+            for i,k in enumerate(args.keys()):
+                conds.append('%s == _c[%s]' %(k,i))
+            _request = ' and '.join(conds)
+            _c = []
+            for (k,v) in args.iteritems():
+                t = self.fields[k] # field type
+                if isinstance(v,(tuple,list)):
+                    _c.append([self.f_encode[t](x) for x in v])
+                else:
+                    _c.append(self.f_encode[t](v))
+            for n in args.keys():
+                if not n in _names:
+                    _names.append(n)
+        else:
+            for (k,v) in args.iteritems():
+                if isinstance(v,Record):
+                    # comparison with a record of another base
+                    ft = self.file_types[self.types[v.db.name]]
+                    args[k] = ft().to_block(v)
+                elif isinstance(v,(tuple,list)):
+                    args[k] = [ self.f_encode[x.__class__](x) for x in v ]
+                else:
+                    args[k] = self.file_types[v.__class__]().to_block(v)
+
+        w1 = [ re.compile(r'\b(?P<name>%s)\b' %f) for f in self.field_names ]
+        # get field names in _request and not in names
+        for n in w1:
+            mo = n.search(_request)
+            if mo:
+                name = mo.group('name')
+                if not name in _names:
+                    _names.append(name)
+
+        # replace field names by their rank in record
+        def repl(mo):
+            return '_rec[%s]' %_names.index(mo.group('name'))
+
+        w = [ re.compile(r'\b(?P<name>%s)\b' %f) for f in _names ]
+        for n in w:
+            _request = n.sub(repl,_request)
+
+        # generate the loop to browse the files and test each set of results
+        _res = {}
+        loop = "for num,_rec in enumerate(self._iterate(*_names)):\n"
+        if _request:
+            loop += "    if %s:\n" %_request
+        else:
+            # _request is empty : select all items
+            # except those marked as deleted
+            loop += "    if _rec[0][0] != '#':\n"
+        loop += "        _res[num] = _rec"
+
+        # prepare namespace
+        args.update(_namespace)
+
+        # execute the loop
+        exec loop in locals(),args
+
+        # exclude deleted rows from the results
+        if self._del_rows.deleted_rows:
+            _to_delete = set(_res.keys()) & set(self._del_rows.deleted_rows)
+            for k in _to_delete:
+                del _res[k]
+
+        # return the list of selected items, with return fields set
+        return _res,_names
+
+    def update(self,record,**kw):
+        """Update the record with the values in kw
+        If only fixed length fields have changed, simply put the new values
+        at the same position in field files
+        Otherwise, remove the existing record then insert the new version"""
+        if not isinstance(record,Record) \
+            and isinstance(record,(list,tuple)):
+            for rec in record:
+                self.update(rec,**kw)
+            return
+        only_fixed_length = True
+        if '__id__' in kw.keys():
+            raise NameError,"Can't update __id__"
+        if '__version__' in kw.keys():
+            raise NameError,"Can't update __version__"
+        for (k,v) in kw.iteritems():
+            self._validate(k,v)
+            setattr(record,k,v)
+            if not hasattr(self.file_types[self.fields[k]],
+                'block_len'):
+                only_fixed_length = False
+
+        if not hasattr(record,'__id__') or not hasattr(record,'__version__'):
+            # refuse to update a record that was not selected for update
+            raise UpdateError,'The record was not selected for update'
+
+        _id = record.__id__
+        # line number of the record in position file
+        _line_in_pos = self._id_pos.get_value_at_pos(5*_id)
+
+        # if the record was selected for update it has a __version__
+        # attribute.
If the version for the same id in the position + # file is not the same, refuse to update + current_version = self[_id].__version__ + if not record.__version__ == current_version: + raise ConflictError,'The record has changed since selection' + + # increment version + record.__version__ += 1 + # position of blocks in field files + field_pos = self._pos.from_block(self._pos.get_block_at(_line_in_pos)) + + if only_fixed_length: + # only fixed length fields modified : just change the values + kw['__version__'] = record.__version__ + for k,v in kw.iteritems(): + ix = self.field_names.index(k) + self._file[k].write_value_at_pos(field_pos[ix],v) + else: + # the record to update may not have all the database fields + # for missing fields, just write a copy at the end of field file + new_pos = {} + missing_fields = [ (i,f) for (i,f) in enumerate(self.field_names) + if not hasattr(record,f) ] + for i,f in missing_fields: + pos = field_pos[i] + block = self._file[f].get_block_at_pos(pos) + new_pos[f] = self._file[f].get_end_pos() + self._file[f].write(block) + self._file[f].seek(0,2) + + # record fields + set_fields = [ f for f in self.field_names if hasattr(record,f) ] + # write new values in field files + for f in set_fields: + new_pos[f] = self._file[f].get_end_pos() + self._file[f].insert(getattr(record,f)) + + # update positions in the position file + pos = [ new_pos[f] for f in self.field_names ] + self._pos.update(_line_in_pos,pos) + + # for previous version of the record, + # mark row in field files as deleted + for dp,f in zip(field_pos,self.field_names): + self._file[f].mark_as_deleted(dp) + # add a deleted row + self._del_rows.insert(field_pos[0]/5) + + def add_field(self,field_name,field_type,after=None,default=None): + """Add a new field after the specified field, or in the beginning if + no field is specified""" + if field_name in self.field_names: + raise NameError,"Field %s already exists" %field_name + field_def = [field_name,field_type] + if default is not None: + field_def.append(default) + + # validate field and update dictionary defaults + buzhug_info.validate_field(self,field_def) + + if after is None: + indx = 2 # insert after __version__ + elif not after in self.field_names: + raise NameError,"No field named %s" %after + else: + indx = 1+self.field_names.index(after) + self.field_names.insert(indx,field_name) + self.fields[field_name] = field_type + # create field file + self._file[field_name] = \ + self.file_types[self.fields[field_name]](self.name,field_name) + self._file[field_name].create() + # populate field file with default value and update position file + self._pos.add_field(field_name,indx,default) + buzhug_info.save_info(self) + self._full_rec = makeRecordClass(self,self.record_class, + self.field_names) + + def drop_field(self,field_name): + """Remove the specified field name""" + if not field_name in self.field_names: + raise NameError,"No field named %s" %field_name + if field_name == '__id__': + raise ValueError,"Field __id__ can't be removed" + if field_name == '__version__': + raise ValueError,"Field __version__ can't be removed" + indx = self.field_names.index(field_name) + self.field_names.remove(field_name) + del self.defaults[field_name] + buzhug_info.save_info(self) + del self.fields[field_name] + del self._file[field_name] + self._pos.drop_field(field_name,indx) + self._full_rec = makeRecordClass(self,self.record_class, + self.field_names) + + def _validate(self,k,v): + """Validate the couple key,value""" + if not k in self.fields.keys(): + raise 
NameError,"No field named %s" %k + if v is None: + return + # if self.fields[k] is an instance of Base, the value must be an + # instance of a subclass of Record with its class attribute + # db == self.fields[k] + if isinstance(self.fields[k],Base): + if not issubclass(v.__class__,Record): + raise TypeError,"Bad type for %s : expected %s, got %s %s" \ + %(k,self.fields[k],v,v.__class__) + if v.__class__.db.name != self.fields[k].name: + raise TypeError,"Bad base for %s : expected %s, got %s" \ + %(k,self.fields[k].name,v.__class__.db.name) + else: + if not isinstance(v,self.fields[k]): + raise TypeError,"Bad type for %s : expected %s, got %s %s" \ + %(k,self.fields[k],v,v.__class__) + + def _iterate(self,*names): + """_iterate on the specified names only""" + Record = makeRecordClass(self,self.record_class,names) + files = [ self._file[f] for f in names ] + for record in itertools.izip(*files): + yield Record(record) + + def __getitem__(self,num): + """Direct access by record id""" + if num<0: + num = len(self)+num + # first find the line in position file + block_pos = self._id_pos.get_block_at_pos(5*num) + if block_pos[0] == '#': + raise IndexError,'No item at position %s' %num + else: + _id_pos = self._id_pos.from_block(block_pos) + # block in position file + p_block = self._pos.get_block_at(_id_pos) + pos = self._pos.from_block(p_block) + record = [ self._file[f].get_block_at_pos(p) + for (f,p) in zip(self.field_names,pos) ] + rec = self._full_rec(record) + return rec + + def __delitem__(self,num): + """Delete the item at id num""" + self.delete([self[num]]) + + def __len__(self): + return self._pos._count + + def has_key(self,num): + # first find the line in position file + block_pos = self._id_pos.get_block_at_pos(5*num) + if not block_pos or block_pos[0] == '#': + return False + return True + + def __contains__(self,num): + return self.has_key(num) + + def keys(self): + return [ r.__id__ for r in self.select(['__id__']) ] + + def __iter__(self): + """Iterate on all records + XXX TO DO : optimize : if no deleted record, + remove the test record[0][0] != "#" + """ + files = [ self._file[f] for f in self.field_names ] + for record in itertools.izip(*files): + if record[0][0] != "#": + r = self._full_rec(record) + yield r + +# thread-safe base ; copied from the logging module +_lock = None + +def _acquireLock(): + """ + Acquire the module-level lock for serializing access to shared data. + + This should be released with _releaseLock(). + """ + global _lock + if (not _lock): + _lock = threading.RLock() + if _lock: + _lock.acquire() + +def _releaseLock(): + """ + Release the module-level lock acquired by calling _acquireLock(). 
+ """ + if _lock: + _lock.release() + +class TS_Base(Base): + + def create(self,*args,**kw): + _acquireLock() + try: + res = Base.create(self,*args,**kw) + finally: + _releaseLock() + return res + + def open(self,*args,**kw): + _acquireLock() + try: + res = Base.open(self,*args,**kw) + finally: + _releaseLock() + return res + + def close(self,*args,**kw): + _acquireLock() + try: + res = Base.close(self,*args,**kw) + finally: + _releaseLock() + return res + + def destroy(self,*args,**kw): + _acquireLock() + try: + res = Base.destroy(self,*args,**kw) + finally: + _releaseLock() + return res + + def set_default(self,*args,**kw): + _acquireLock() + try: + res = Base.set_default(self,*args,**kw) + finally: + _releaseLock() + return res + + def insert(self,*args,**kw): + _acquireLock() + try: + res = Base.insert(self,*args,**kw) + finally: + _releaseLock() + return res + + def update(self,*args,**kw): + _acquireLock() + try: + res = Base.update(self,*args,**kw) + finally: + _releaseLock() + return res + + def delete(self,*args,**kw): + _acquireLock() + try: + res = Base.delete(self,*args,**kw) + finally: + _releaseLock() + return res + + def cleanup(self,*args,**kw): + _acquireLock() + try: + res = Base.cleanup(self,*args,**kw) + finally: + _releaseLock() + return res + + def commit(self,*args,**kw): + _acquireLock() + try: + res = Base.commit(self,*args,**kw) + finally: + _releaseLock() + return res + + def add_field(self,*args,**kw): + _acquireLock() + try: + res = Base.add_field(self,*args,**kw) + finally: + _releaseLock() + return res + + def drop_field(self,*args,**kw): + _acquireLock() + try: + res = Base.drop_field(self,*args,**kw) + finally: + _releaseLock() + return res + + \ No newline at end of file diff --git a/buzhug/buzhug_algos.py b/buzhug/buzhug_algos.py new file mode 100644 index 00000000..5c142120 --- /dev/null +++ b/buzhug/buzhug_algos.py @@ -0,0 +1,175 @@ +"""Implementation of fast search algorithms +Used in select when one of the search fields has a fixed-length size + +Instead of taking all the blocks in field files one after the other, a big +number of blocks are read and the search is made on the buffer +""" + +from datetime import date, datetime +import itertools + +# compatibility with Python 2.3 +try: + set([1]) +except NameError: + from sets import Set as set + +def rev(s): + """ function used to compare strings in decreasing order""" + return ''.join([chr(255-ord(c)) for c in s]) + +def make_search_func(db,field,value): + """Return the search function on a field + If value is a pair of values (v1,v2), all blocks between v1 and v2 + will be returned ; if value is a single value then all blocks with + this value will be returned + """ + bl = db._file[field].block_len # block length + if isinstance(value,(list,tuple)): + value = list(value) + if not len(value)==2: + raise ValueError,"If argument is a list, only 2 values \ + should be passed (found %s)" %len(value) + if not db.fields[field] in [int,float,date,datetime]: + raise TypeError,"Search between values is only allowed for " \ + "int, float, date and datetime (found %s)" %db.fields[field] + db._validate(field,value[0]) + db._validate(field,value[1]) + value.sort() + # convert values in blocks (strings representation in field files) + s1,s2 = [ db.f_encode[db.fields[field]](v) for v in value ] + # search the common leading characters in s1 and s2 + common = '' + for i in range(len(s1)): + if s1[i] == s2[i]: + common += s1[i] + else: + break + lc = len(common) + Min = s1[lc:] # part of s1 not common with s2 + Max = 
s2[lc:] # part of s2 not common with s1 + + def _search(buf): + """Function searching blocks in the buffer such that + s1 <= block <= s2 + Return a dictionary mapping rank of the block to the block + + The algorithm searches occurences of 'common', then checks + that the rest of the block is between Min and Max + """ + ranks = {} + pos = 0 + while True: + # search occurences of the common part between s1 and s2 + pos = buf.find(common,pos) + if pos == -1: + break + if pos % bl == 0: + # pos is a block start + block = buf[pos:pos+bl] + # rest of the block + rest = buf[pos+lc:pos+bl] + # compare rest of block to Min and Max + if Min <= rest <= Max: + ranks[pos/bl] = block + pos += 1 + return ranks + + else: + v = db.f_encode[db.fields[field]](value) + + def _search(buf): + """Function searching blocks in the buffer such that + block == v + Return a dictionary mapping rank of the block to the block + + The algorithm searches occurences of the block v in the + buffer + """ + ranks = {} + pos = 0 + while True: + pos = buf.find(v,pos) + if pos>-1: + if pos % bl == 0: + # pos is a block start + ranks[pos/bl] = buf[pos:pos+bl] + pos += 1 + else: + break + return ranks + + return _search + +def fast_select(db,names,**args): + """Handles requests like select(['name'],age=23,name='pierre') when + one of the arg keys is fixed length type ; uses a fast search algo + instead of browsing all the records + + The search functions are defined for all fixed-length arguments and + used to select a subset of record rows in field files + """ + # fixed and variable length fields + f_args = [ (k,v) for k,v in args.iteritems() + if hasattr(db._file[k],'block_len') ] + v_args = [ (k,v) for (k,v) in args.iteritems() + if not hasattr(db._file[k],'block_len') ] + arg_names = [ k for k,v in f_args + v_args ] + no_args = [ n for n in names if not n in arg_names ] + names = arg_names + no_args + + [ db._file[k].seek(0) for k in names + args.keys() ] + max_len = max([ db._file[k[0]].block_len for k in f_args ]) + num_blocks = db.BLOCKSIZE / max_len + funcs = dict([(k,make_search_func(db,k,v)) + for (k,v) in f_args]) + fl_ranks = [] # absolute ranks in fixed length files + bl_offset = 0 # offset of current chunck + res = {} + while True: + buf = {} + ranks = {} + # read a chunk of num_blocks blocks in each fixed-length file + for i,(k,v) in enumerate(f_args): + # rank[field] stores the rank of found values in + # the buffer, between 0 and num_blocks-1 + bl = db._file[k].block_len + buf[k] = db._file[k].read(num_blocks*bl) + ranks[k] = funcs[k](buf[k]) + # test end of files + if not buf[f_args[0][0]]: + break + # valid records are those with the same rank in all files + rank_set=set(ranks[f_args[0][0]].keys()) + if len(f_args)>1: + for (k,v) in f_args[1:]: + rank_set = rank_set.intersection(set(ranks[k].keys())) + for c in rank_set: + res[bl_offset+c] = [ ranks[k][c] for k,v in f_args ] + bl_offset += num_blocks + + fl_ranks = res.keys() + fl_ranks.sort() + + # The field files for the other arguments are browsed ; if their + # row is in the subset, test if the value for variable length arguments + # is equal to the keyword value + vl_files = [ db._file[k] for k,v in v_args ] + nbvl = len(vl_files) + vl_values = tuple([ db._file[k].to_block(v) for (k,v) in v_args ]) + no_args_files = [ db._file[k] for k in no_args ] + other_files = vl_files + no_args_files + for f in other_files: + f.seek(0) + + for i,lines in enumerate(itertools.izip(*other_files)): + try: + if i == fl_ranks[0]: + fl_ranks.pop(0) + if lines[:nbvl] == 
vl_values: + res[i]+=list(lines) + else: + del res[i] + except IndexError: + break + return res,names diff --git a/buzhug/buzhug_files.py b/buzhug/buzhug_files.py new file mode 100644 index 00000000..3fe1f454 --- /dev/null +++ b/buzhug/buzhug_files.py @@ -0,0 +1,583 @@ +"""This module defines the classes used to modelize the files in which +information is stored + +One file is used for each field of the base. The values stored are first +converted into "blocks", which are bytestrings ready to be written in +physical files in the file system. Symmetrically, data is read from the +physical file as a bytestring, and can be converted into a value + +To optimize the speed of the select() method, the comparison between +a searched value and a record value is made by converting the searched +value into a "block", then compare it to the blocks in the file : this is +much faster than converting each block in the file to a value + +A consequence of this is that the conversion between value and block must +preserve the order : if value1 > value2 then block1 > block2. For instance +we can't convert an integer into its string representation by str(), +because 10 > 2 (integers) but '10' < '2' (strings). The function used here +is block = struct('>i',value+sys.maxint) + +Since the "for line in _file" loop is extremely fast, whenever possible the +blocks are stored on one line (lines are separated by \n). Storage of Python +bytestrings and of Unicode objects use this format (characters \n and \r must +be escaped to keep the block on one line) ; so do date and datetime + +Integers are converted into blocks of 4 characters, since one of them can be +one of the line break characters we can't use the "for line in _file" loop. +Browsing the file consists in reading 4096 blocks at a time and yielding the +blocks one after the other + +Deleted blocks begin with "#", uninitialized values with '!', valid valued +with '-' +""" +import sys +import os +import tempfile +import shutil + +class File: + + def __init__(self,base='',name=''): + self.name = name + self.base = base + self.path = os.path.join(base,name) + + def create(self): + if not os.path.isdir(self.base): + os.mkdir(self.base) + file(self.path,'w').close() + self.fileobj = open(self.path,'r+b') + return self + + def open(self): + self.fileobj = open(self.path,'r+b') + return self + + def get_end_pos(self): + self.fileobj.seek(0,2) + return self.fileobj.tell() + + def get_pos(self): + return self.fileobj.tell() + + def insert(self,value): + self.fileobj.seek(0,2) + self.fileobj.write(self.to_block(value)) + self.fileobj.seek(0,2) + + def close(self): + self.fileobj.close() + + def mark_as_deleted(self,pos): + """mark the block at position pos as deleted""" + self.fileobj.seek(pos) + self.fileobj.write('#') + self.fileobj.seek(pos) + + def get_value_at_pos(self,pos): + return self.from_block(self.get_block_at_pos(pos)) + + def write_value_at_pos(self,pos,value): + self.fileobj.seek(pos) + self.fileobj.write(self.to_block(value)) + self.fileobj.seek(pos) + + def tell(self): + return self.fileobj.tell() + + def seek(self,*args): + return self.fileobj.seek(*args) + + def read(self,size=-1): + return self.fileobj.read(size) + + def write(self,data): + self.fileobj.write(data) + +class VariableLengthFile(File): + """For variable length data (strings, unicode) blocks are strings + on one line""" + + def get_block_at(self,num): + self.fileobj.seek(0) + for i,line in enumerate(self.fileobj): + if i == num: + return line + + def get_block_at_pos(self,pos): + 
self.fileobj.seek(pos) + return self.fileobj.readline() + + def read_block(self): + return self.fileobj.readline() + + def __iter__(self): + self.fileobj.seek(0) + for line in self.fileobj: + yield line + +class FixedLengthFile(File): + """For fixed length data blocks are strings of length block_len""" + + def get_block_at(self,num): + self.fileobj.seek(self.block_len*num) + return self.fileobj.read(self.block_len) + + def read_block(self): + return self.fileobj.read(self.block_len) + + def get_block_at_pos(self,pos): + self.fileobj.seek(pos) + return self.fileobj.read(self.block_len) + + def get_block_at(self,num): + return self.get_block_at_pos(self.block_len*num) + + def __iter__(self): + self.fileobj.seek(0) + chunk_size = self.block_len*(131072/self.block_len) + while True: + buf = self.fileobj.read(chunk_size) + if not buf: + raise StopIteration + for i in range(len(buf)/self.block_len): + yield buf[self.block_len*i:self.block_len*(i+1)] + +class StringFile(VariableLengthFile): + + def to_block(self,value): + if value is None: + return '!\n' + elif not isinstance(value,str): + raise ValueError,'Bad type : expected str, got %s %s' %(value, + value.__class__) + else: + # escape CR & LF so that the block is on one line + value = value.replace('\\','\\\\') + value = value.replace('\n','\\n') + value = value.replace('\r','\\r') + return '-' + value + '\n' + + def from_block(self,block): + if block == '!\n': + return None + else: + # this is the fastest algo I've found to unescape CR & LF + # patched by Jorge Vargas + b = block[1:-1] + res = '' + i = 0 + while i=1900: + return value.strftime('-%Y%m%d')+'\n' + else: + # strftime doesn't work for year<1900 + return "-%04d%02d%02d\n" %(value.year,value.month,value.day) + + def from_block(self,block): + if block[0] == '!': + return None + else: + return date(int(block[1:5]),int(block[5:7]),int(block[7:-1])) + +class DateTimeFile(VariableLengthFile): + + block_len = 16 # value set to force use of the fast select algos + + def to_block(self,value): + if value is None: + return '!xxxxxxxxxxxxxx\n' + elif not isinstance(value,date): + raise ValueError,'Bad type : expected datetime.date, got %s %s' \ + %(value,value.__class__) + else: + if value.year>=1900: + return value.strftime('-%Y%m%d%H%M%S')+'\n' + else: + # strftime doesn't work for year<1900 + _date = "-%04d%02d%02d%02d%02D%02d\n" %(value.year, + value.month,value.day,value.hour,value.minute, + value.second) + return _date + + def from_block(self,block): + if block[0] == '!': + return None + else: + return datetime(int(block[1:5]),int(block[5:7]),int(block[7:9]), + int(block[9:11]),int(block[11:13]),int(block[13:15])) + +class TimeFile(VariableLengthFile): + + # code by Nicolas Pinault + + block_len = 8 # value set to force use of the fast select algos + + def to_block(self,value): + if value is None: + return '!xxxxxx\n' + elif not isinstance(value, dtime): + raise ValueError,'Bad type : expected datetime.time, got %s %s' \ + %(value,value.__class__) + else: + return value.strftime('-%H%M%S')+'\n' + + def from_block(self,block): + if block[0] == '!': + return None + else: + return dtime(int(block[1:3]),int(block[3:5]),int(block[5:7])) + +class BooleanFile(FixedLengthFile): + + block_len = 2 + + def to_block(self,value): + if value is None: + return '!'+chr(0) + elif not isinstance(value,bool): + raise ValueError,'Bad type : expected bool, got %s %s' \ + %(value,value.__class__) + else: + if value: + return '-1' + else: + return '-0' + def from_block(self,block): + if block[0]=='!': + 
return None + elif block == "-0": + return False + else: + return True + +import struct + +class IntegerFile(FixedLengthFile): + + MIDINT = 2**30 + block_len = 5 + + def to_block(self,value): + if value is None: + return '!'+chr(0)*4 + elif not isinstance(value,int): + raise ValueError,'Bad type : expected int, got %s %s' \ + %(value,value.__class__) + else: + if value <= -sys.maxint/2: + raise OverflowError,"Integer value must be > %s, got %s" \ + %(-sys.maxint/2,value) + if value > sys.maxint/2: + raise OverflowError,"Integer value must be <= %s, got %s" \ + %(sys.maxint/2,value) + return '-'+struct.pack('>i',value+self.MIDINT) + + def from_block(self,block): + if block[0]=='!': + return None + else: + return struct.unpack('>i',block[1:])[0]-self.MIDINT + +import math + +class FloatFile(FixedLengthFile): + + """Conversion of float numbers : + 1. take the mantissa and exponent of value : value = mant * 2**exp + Mantissa is always such that 0.5 <= abs(mant) < 1 + The range for exp is (probably) platform-dependant ; typically from -2048 + to +2048 + 2. exponent is converted to a positive integer e1 : 0<=e1<=65535 + If value is negative : e1 = 16384 - exp (decreases when mantissa + increases, to preserve order) + If value is positive : e1 = 16384*3 + exp + + This conversion will work in all cases if abs(exp) < 16384 + + 3. e1 is converted into a 2-byte string by struct.pack('>H',e1) + + 4. mantissa conversion : + - if value is positive : struct.pack('>d',mant) + - if value is negative : struct.pack('>d',1.1 + mant) + This conversion preserves order, and since all results begin with the same + byte chr(63), this first byte can be stripped + + This implementation has changed in version 1.1. Use script conversion_float + to upgrade databases made with older versions + """ + + block_len = 10 + offsetneg = 16384 + offsetpos = 16384*3 + + def to_block(self,value): + if value is None: + return '!'+chr(0)*9 + elif not isinstance(value,float): + raise ValueError,'Bad type : expected float, got %s %s' \ + %(value,value.__class__) + elif value == 0.0: + return '-'+chr(128)+chr(0)*8 + else: + # get mantissa and exponent + # f = mant*2**exp, 0.5 <= abs(mant) < 1 + mant,exp = math.frexp(value) + if value>=0: + pack_exp = struct.pack('>H',exp+self.offsetpos) + return '-'+pack_exp+struct.pack('>d',mant)[1:] + else: + pack_exp = struct.pack('>H',self.offsetneg-exp) + return '-'+pack_exp+struct.pack('>d',1.1+mant)[1:] + + def from_block(self,block): + if block[0]=='!': + return None + else: + s = block[1:] + if ord(s[0])==128: + return 0.0 + elif ord(s[0])<128: + # negative number + exp = self.offsetneg-struct.unpack('>H',s[:2])[0] + mant = struct.unpack('>d',chr(63)+s[2:])[0] - 1.1 + else: + exp = struct.unpack('>H',s[:2])[0]-self.offsetpos + mant = struct.unpack('>d',chr(63)+s[2:])[0] + return math.ldexp(mant,exp) + +class PositionFile(FixedLengthFile): + """A position file is used to reference records by their id + The information stored about a record is the position of the + record fields in the respective field files + """ + + def __init__(self,baseobj): + """Creates a position file for baseobj, an instance of buzhug.Base + """ + self.baseobj = baseobj + self.base = baseobj.name + self.path = os.path.join(self.base,'__pos__') + self.deleted_lines = [] + self.block_len = 1+4*len(baseobj.field_names) + self._count = 0 # number of records in the base + self.next_id = 0 + + def open(self): + self.fileobj = open(self.path,'r+b') + # get deleted items, identified by a leading '#' + self.deleted_lines, 
self._count = [],0 + for line_num,line in enumerate(self): + if line[0]=='#': + self.deleted_lines.append(line_num) + else: + self._count += 1 + # the file with a mapping between id and line in the + # position file. Has as many blocks of 5 bytes as already + # attributed ids + _id_pos = self.baseobj._id_pos + _id_pos.seek(0,2) + self.next_id = _id_pos.tell()/5 + return self + + def insert(self,value): + """Method called when a record is inserted in the base. value + is the list of the positions in field files + Return the id of the inserted record and the line number in + the position file + """ + if self.deleted_lines: + # reuse the first deleted record available + num = self.deleted_lines.pop(0) + pos = num*self.block_len + block = self.get_block_at(num) + else: + # append a new record at the end of the file + self.fileobj.seek(0,2) + pos = self.fileobj.tell() + num = pos/self.block_len + _id = self.next_id + self.fileobj.seek(pos) + self.fileobj.write(self.to_block(value)) + self.fileobj.seek(0,2) + self._count += 1 + self.next_id += 1 + return _id,num + + def update(self,_line,new_positions): + """Method used if the record identified by _line has changed with + variable length fields modified : in this case the new fields are + appended at the end of the field files and their new positions must + be updated""" + pos = _line*self.block_len + self.fileobj.seek(pos) + self.fileobj.write(self.to_block(new_positions)) + self.fileobj.seek(0,2) + + def update_positions(self,_line,new_positions): + """Only update positions in field files for record at _line""" + pos = _line*self.block_len + # skip flag + self.fileobj.seek(pos+1) + self.fileobj.write(''.join([struct.pack('>i',v) + for v in new_positions])) + self.fileobj.seek(pos+3) + + def remove(self,_line): + self.fileobj.seek(_line*self.block_len) + if self.fileobj.read(1) == '#': + return # if record is already removed, ignore silently + self.fileobj.seek(_line*self.block_len) + self.fileobj.write('#') + self.fileobj.seek(_line*self.block_len) + self.deleted_lines.append(_line) + self._count -= 1 + + def add_field(self,field_name,indx,default): + """Update the file to insert the new field at specified index""" + ff = self.baseobj._file[field_name] + tf = tempfile.TemporaryFile() + self.fileobj.seek(0) + pos = 1 + 4*indx # the place to insert positions in the field file + while True: + line = self.fileobj.read(self.block_len) + if not line: + break + line = line[:pos] + struct.pack('>i',ff.tell()) + line[pos:] + tf.write(line) + ff.insert(default) + tf.seek(0) + self.create() + shutil.copyfileobj(tf,self.fileobj) + tf.close() + self.block_len += 4 + + def drop_field(self,field_name,indx): + """Update the file to remove the field""" + tf = tempfile.TemporaryFile() + self.fileobj.seek(0) + pos = 1 + 4*indx # the position for the field in the block + while True: + line = self.fileobj.read(self.block_len) + if not line: + break + line = line[:pos] + line[pos+4:] + tf.write(line) + tf.seek(0) + self.create() + shutil.copyfileobj(tf,self.fileobj) + tf.close() + self.block_len -= 4 + + def to_block(self,value): + # value = positions in field files + return '-'+''.join([struct.pack('>i',v) for v in value]) + + def from_block(self,block): + """Returns a list : position of field in their files""" + return list(struct.unpack('>'+'i'*(len(block[1:])/4),block[1:])) + +class DeletedRowsFile(VariableLengthFile): + """File that references the deleted rows. 
+class DeletedRowsFile(VariableLengthFile):
+    """File that references the deleted rows. Stores integers in a
+    variable-length format, because it's faster and no order-preserving
+    conversion is needed"""
+
+    def create(self):
+        VariableLengthFile.create(self)
+        self.deleted_rows = []
+        return self
+
+    def open(self):
+        self.fileobj = open(self.path,'r+b')
+        self.deleted_rows = [ int(line[:-1]) for line in self ]
+        return self
+
+    def insert(self,value):
+        VariableLengthFile.insert(self,value)
+        self.deleted_rows.append(value)
+
+    def to_block(self,value):
+        return str(value)+'\n'
+
+    def from_block(self,block):
+        return int(block[:-1])
+
+class ExternalFile(FixedLengthFile):
+    """Class for references to another base"""
+
+    block_len = 5
+
+    def to_block(self,value):
+        if value is None:
+            return '!'+chr(0)*4
+        else:
+            return '-'+struct.pack('>i',value.__id__)
+
+    def from_block(self,block):
+        if block[0]=='!':
+            return None
+        _id = struct.unpack('>i',block[1:])[0]
+        try:
+            return self.db[_id]
+        except IndexError:
+            # if the referenced record has been deleted, return
+            # an uninitialized record (all fields set to None,
+            # including __id__)
+            rec = ['!']*len(self.db.field_names)
+            return self.db._full_rec(rec)
diff --git a/buzhug/buzhug_info.py b/buzhug/buzhug_info.py
new file mode 100644
index 00000000..53ac5939
--- /dev/null
+++ b/buzhug/buzhug_info.py
@@ -0,0 +1,88 @@
+"""Manage general information about buzhug bases :
+field definitions with types and default values"""
+
+import os
+import urllib
+
+def set_info(base,fields):
+    base.defaults = {}
+    for field in fields:
+        validate_field(base,field)
+
+def validate_field(base,field_def):
+    """Validate field definition"""
+    name,typ = field_def[:2]
+    if name in ['__id__','__version__']:
+        raise ValueError,'Field name "%s" is reserved' %name
+    elif name.startswith('_'):
+        raise ValueError,"Error for %s : names can't begin with _" \
+            % name
+    if typ not in base.types.values():
+        if isinstance(typ,base.__class__): # external link
+            base._register_base(typ)
+        else:
+            raise TypeError,"type %s not allowed" %typ
+    if len(field_def)>2:
+        # if a default value is provided, check if it is valid
+        default = field_def[2]
+        if isinstance(typ,base.__class__):
+            if not hasattr(default.__class__,"db") or \
+                not default.__class__.db is typ:
+                raise ValueError,'Incorrect default value for field "%s"' \
+                    " : expected %s, got %s (class %s)" %(name,typ,
+                    default,default.__class__)
+        elif not isinstance(default,typ):
+            raise ValueError,'Incorrect default value for field "%s"' \
+                " : expected %s, got %s (class %s)" %(name,typ,
+                default,default.__class__)
+        base.defaults[name] = default
+    else:
+        base.defaults[name] = None
+
+def save_info(base):
+    """Save field information in files __info__ and __defaults__"""
+    _info = open(base.info_name,'wb')
+    fields = []
+    for k in base.field_names:
+        if isinstance(base.fields[k],base.__class__):
+            fields.append((k,''+urllib.quote(base.fields[k].name)))
+        else:
+            fields.append((k,base.fields[k].__name__))
+    _info.write(' '.join(['%s:%s' %(k,v) for (k,v) in fields]))
+    _info.close()
+    out = open(os.path.join(base.name,"__defaults__"),"wb")
+    for field_name,default_value in base.defaults.iteritems():
+        if field_name in ["__id__","__version__"]:
+            continue
+        value = base._file[field_name].to_block(default_value)
+        out.write("%s %s" %(field_name,value))
+    out.close()
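+# A usage sketch (editorial, not part of the original module) of how the
+# defaults managed here reach the public API: create() accepts an optional
+# third element per field tuple and set_default() changes it later; the
+# directory name 'people' is just an example:
+#
+#   >>> from buzhug import Base
+#   >>> db = Base('people')
+#   >>> db.create(('name', str, 'anonymous'), ('age', int), mode='override')
+#   >>> db.insert(age=30)           # no name given
+#   >>> db[-1].name                 # falls back to the default
+#   'anonymous'
+#   >>> db.set_default('name', 'guest')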
+def read_defaults(base):
+    import buzhug_files
+    defaults = dict([(f,None) for f in base.field_names[2:]])
+    if os.path.exists(os.path.join(base.name,"__defaults__")):
+        defs = open(os.path.join(base.name,"__defaults__"),"rb").read()
+        ix = 0
+        f_name = ""
+        while ix 0.0 ?",afloat>0.0
+        print "blocks ?",f.to_block(afloat)>f.to_block(0.0)
+        print all(f.to_block(afloat)),all(f.to_block(0.0))
+        raise
+
+    assert db.defaults["age"] == None
+    assert db.defaults["size"] == 300
+    assert db.defaults["afloat"] == 1.0
+    assert db.defaults["birth_hour"] == dtime(10,10,10)
+    assert db.defaults["birth"] == date(1994,1,14)
+
+    for i in range(100):
+        db.insert(name=random.choice(names),
+            fr_name = unicode(random.choice(fr_names),'latin-1'),
+            age=random.randint(7,47),size=random.randint(110,175),
+            birth=date(random.randint(1858,1999),random.randint(1,12),10),
+            afloat = random.uniform(-10**random.randint(-307,307),
+                10**random.randint(-307,307)),
+            birth_hour = dtime(random.randint(0, 23), random.randint(0, 59),
+                random.randint(0, 59)))
+
+    assert len(db)==100
+    assert isinstance(db[50].fr_name,unicode)
+    print db[50].fr_name.encode('latin-1')
+
+    db.open()
+    # test if default values have not been modified after open()
+    assert db.defaults["age"] == None
+    assert db.defaults["size"] == 300
+    assert db.defaults["afloat"] == 1.0
+    assert db.defaults["birth_hour"] == dtime(10,10,10)
+    assert db.defaults["birth"] == date(1994,1,14)
+
+    for i in range(5):
+        # insert a list
+        db.insert(random.choice(names),
+            unicode(random.choice(fr_names),'latin-1'),
+            random.randint(7,47),random.randint(110,175),
+            date(random.randint(1958,1999),random.randint(1,12),10),
+            random.uniform(-10**random.randint(-307,307),
+                10**random.randint(-307,307)),
+            dtime(random.randint(0, 23), random.randint(0, 59),
+                random.randint(0, 59)))
+    db.insert(name=random.choice(names)) # missing fields
+    for field in db.field_names[2:]:
+        if field == "name":
+            continue
+        try:
+            assert getattr(db[-1],field) == db.defaults[field]
+        except:
+            print "attribute %s not set to default value %s" \
+                %(field,db.defaults[field])
+            raise
+
+    # insert as string
+    db.set_string_format(unicode,'latin-1')
+    db.set_string_format(date,'%d-%m-%y')
+    db.set_string_format(dtime,'%H-%M-%S')
+    db.insert_as_strings(name="testname",fr_name=random.choice(fr_names),
+        age=10,size=123,birth="07-10-95", birth_hour="20-53-3")
+
+    assert db[-1].birth == date(1995,10,7)
+    assert db[-1].name == "testname"
+    assert db[-1].age == 10
+    assert db[-1].afloat == db.defaults["afloat"]
+
+    db.insert_as_strings("testname",random.choice(fr_names),
+        11,134,"09-12-94",1.0, "5-6-13")
+
+    assert db[len(db)-1].birth == date(1994,12,9)
+    assert db[-1].name == "testname"
+    assert db[-1].age == 11
+    assert db[-1].size == 134
+    assert db[-1].afloat == 1.0
+
+    # search between 2 dates
+    print '\nBirth between 1960 and 1970'
+    for r in db.select(None,birth=[date(1960,1,1),date(1970,12,13)]):
+        print r.name,r.birth
+
+    print "sorted"
+    for r in db.select(None,
+            birth=[date(1960,1,1),date(1970,12,13)]).sort_by('+name-birth'):
+        print r.name,r.birth
+
+    f = buzhug_files.FloatFile().to_block
+    def all(v):
+        return [ord(c) for c in f(v)]
+
+    # search between 2 floats
+
+    # selection by list comprehension
+    s1 = [ r for r in db if 0.0 <= r.afloat <= 1e50 ]
+    # selection by select
+    s2 = db.select(None,'x<=afloat<=y',x=0.0,y=1e50)
+    # selection by select with interval
+    s3 = db.select(None,afloat=[0.0,1e50])
+
+    try:
+        assert len(s1) == len(s2) == len(s3)
+    except:
+        print "%s records by list comprehension, " %len(s1)
+        print "%s by select by formula," %len(s2)
+        print "%s by select by interval" %len(s3)
+
+    for r in s1:
+        try:
+            assert r in s2
+        except:
+            print all(r.afloat)
+
+    for r in s2:
+        try:
+            assert r in s1
+        except:
+            print "in select but not in list comprehension",r
+            raise
+    r = db[0]
+    assert r.__class__.db is db
+
+    fr = random.choice(fr_names)
+    s1 = [ r for r in db if r.age == 30 and r.fr_name == unicode(fr,'latin-1')]
+    s2 = db.select(['name','fr_name'],age=30,fr_name = unicode(fr,'latin-1'))
+
+    assert len(s1)==len(s2)
+
+    # different ways to count the number of items
+    assert len(db) == sum([1 for r in db]) == len(db.select(['name']))
+
+    # check if version number is correctly incremented
+    for i in range(5):
+        recs = db.select_for_update(['name'],'True')
+        version = recs[0].__version__
+        recs[0].update()
+        assert db[0].__version__ == version + 1
+
+    # check if cleanup doesn't change db length
+    length_before = len(db)
+    db.cleanup()
+    assert len(db) == length_before
+
+    # check if selection by select on __id__ returns the same as direct
+    # access by id
+    recs = db.select([],'__id__ == c',c=20)
+    assert recs[0] == db[20]
+
+    # check that has_key returns False for an invalid key
+    assert not db.has_key(1000)
+
+    # drop field
+    db.drop_field('name')
+    # check if field was actually removed from base definition and rows
+    assert not "name" in db.fields
+    assert not hasattr(db[20],"name")
+
+    # add field
+    db.add_field('name',str,default="marcel")
+    # check if field was added with the correct default value
+    assert "name" in db.fields
+    assert hasattr(db[20],"name")
+    assert db[20].name == "marcel"
+
+    # change default value
+    db.set_default("name","julie")
+    db.insert(age=20)
+    assert db[-1].name == "julie"
+
+    # delete a record
+
+    db.delete([db[10]])
+    # check if record has been deleted
+    try:
+        print db[10]
+        raise Exception,"Row 10 should have been deleted"
+    except IndexError:
+        pass
+
+    assert 10 not in db
+    assert len(db) == length_before
+
+    # selections
+
+    # selection by generator expression
+    # age between 30 and 32
+    d_ids = []
+    for r in [r for r in db if 33 > r.age >= 30]:
+        d_ids.append(r.__id__)
+
+    length = len(db)
+    # remove these items
+    db.delete([r for r in db if 33 > r.age >= 30])
+    # check if correct number of records removed
+    assert len(db) == length - len(d_ids)
+    # check if all records have been removed
+    assert not [r for r in db if 33 > r.age >= 30]
+
+    # updates
+    # select name = pierre
+    s1 = db.select(['__id__','name','age','birth'],name='pierre')
+    # make 'pierre' uppercase
+    for record in db.select_for_update(None,'name == x',x='pierre'):
+        db.update(record,name = record.name.upper())
+    # check if attribute was correctly updated
+    for rec in s1:
+        assert db[rec.__id__].name == "PIERRE"
+
+    # increment ages
+    for record in db.select_for_update([],'True'):
+        age = record.age
+        if not record.age is None:
+            db.update(record,age = record.age+1)
+            # check
+            assert db[record.__id__].age == age + 1
+
+    for record in [r for r in db]:
+        age = record.age
+        if not record.age is None:
+            db.update(record,age = record.age+1)
+            # check
+            assert db[record.__id__].age == age + 1
+
+    # change dates
+    for record in db.select_for_update([],'age>v',v=35):
+        db.update(record,birth = date(random.randint(1958,1999),
+            random.randint(1,12),10))
+
+    db.commit()
+
+    # check length after commit
+    assert sum([1 for r in db]) == len(db)
+
+    # insert new records
+    for i in range(50):
+        db.insert(name=random.choice(names),
+            age=random.randint(7,47),size=random.randint(110,175))
+
+    # check that record 10 is still deleted
+    try:
+        print db[10]
+        raise Exception,"Row 10 should have been deleted"
+    except IndexError:
+        pass
+
+    print db.keys()
?",db.has_key(10) + assert 10 not in db + #raw_input() + + # check that deleted_lines was cleared by commit() + assert not db._pos.deleted_lines + print db._del_rows.deleted_rows + + length = len(db) # before cleanup + + # physically remove the deleted items + db.cleanup() + # check that deleted_lines and deleted_rows are clean + assert not db._pos.deleted_lines + assert not db._del_rows.deleted_rows + + # check that record 10 is still deleted + try: + print db[10] + raise Exception,"Row 10 should have been deleted" + except IndexError: + pass + + assert 10 not in db + + # check that length was not changed by cleanup + assert len(db) == length + assert len([ r for r in db]) == length + + # age > 30 + for r in db.select(['__id__','name','age'], + 'name == c1 and age > c2', + c1 = 'pierre',c2 = 30): + assert r.name == "pierre" + assert r.age > 30 + + # name =="PIERRE" and age > 30 + for r in db.select(['__id__','name','age','birth'], + 'name == c1 and age > c2', + c1 = 'PIERRE',c2 = 30): + assert r.name == 'PIERRE' + assert r.age > 30 + + # test with != + for r in db.select(['__id__'],'name != c1',c1='claire'): + assert r.name != 'claire' + + # age > id + # with select + s1 = db.select(['name','__id__','age'],'age > __id__') + for r in s1: + assert r.age > r.__id__ + # with iter + s2 = [ r for r in db if r.age > r.__id__ ] + for r in s2: + assert r.age > r.__id__ + + assert len(s1) == len(s2) + + # birth > date(1978,1,1) + # with select + s1 = db.select(['name','__id__','age'],'birth > v',v=date(1978,1,1)) + for r in s1: + assert r.birth > date(1978,1,1) + # with iter + + s2 = [ r for r in db if r.birth and r.birth > date(1978,1,1) ] + for r in s2: + assert r.birth > date(1978,1,1) + + assert len(s1) == len(s2) + + # test with floats + for i in range(10): + x = random.uniform(-10**random.randint(-307,307), + 10**random.randint(-307,307)) + s1 = [ r for r in db if r.afloat > x ] + s2 = db.select(['name'],'afloat > v',v=x) + assert len(s1)==len(s2) + + # base with external link + houses = Base('houses') + houses.create(('address',str),('flag',bool),('resident',db,db[0]),mode="override") + + addresses = ['Giono','Proust','Mauriac','Gide','Bernanos','Racine', + 'La Fontaine'] + ks = db.keys() + for i in range(50): + x = random.choice(ks) + address = random.choice(addresses) + houses.insert(address=address,flag = address[0]>"H",resident=db[x]) + + # houses with jean + s1 = [] + for h in houses: + if h.resident.name == 'jean': + s1.append(h) + + # by select : ??? + #s2 = houses.select([],'resident.name == v',v='jean') + # assert len(s1) == len(s2) + + h1 = Base('houses') + h1.open() + + l1 = len(h1.select([],flag=True)) + l2 = len(h1.select([],flag=False)) + assert l1 + l2 == len(h1) + + class DictRecord(Record): + def __getitem__(self, k): + item = self + names = k.split('.') + for name in names: + item = getattr(item, name) + return item + + h1.set_record_class(DictRecord) + print '\nrecord_class = DictRecord, h1[0]' + print h1[0] + print "\nResident name: %(resident.name)s\nAddress: %(address)s" % h1[0] + +if __name__ == "__main__": + run_test(thread_safe = True) + run_test(thread_safe = False) \ No newline at end of file diff --git a/buzhug/conversion_float.py b/buzhug/conversion_float.py new file mode 100644 index 00000000..ba2d037f --- /dev/null +++ b/buzhug/conversion_float.py @@ -0,0 +1,131 @@ +""" +Conversion program to upgrade databases with float fields for +version 1.1 + +The implementation in versions <= 1.0 caused a DeprecationWarning +for Python version 2.5. 
diff --git a/buzhug/conversion_float.py b/buzhug/conversion_float.py
new file mode 100644
index 00000000..ba2d037f
--- /dev/null
+++ b/buzhug/conversion_float.py
@@ -0,0 +1,131 @@
+"""
+Conversion program to upgrade databases with float fields for
+version 1.1
+
+The implementation in versions <= 1.0 caused a DeprecationWarning
+under Python 2.5. The conversion function had to be changed, which
+makes databases built with older versions incompatible
+
+Use this script to upgrade : select the database directory in the
+dialog window ; all float fields will be upgraded
+
+For safety reasons, a backup copy of the old file for each of these
+fields is saved in the directory, with the current datetime appended
+to the file name. In case of any problem, remove the new file for the
+field and rename the backup file by removing the datetime string
+"""
+import os
+import struct
+import random
+import math
+
+class OldFloatFile:
+
+    block_len = 10
+    MIDSHORT = 3000 + 128*256
+    MAXSHORT = 256*256
+    X = MAXSHORT - MIDSHORT
+
+    def from_block(self,block):
+        if block[0]=='!':
+            return None
+        else:
+            s = block[1:]
+            if ord(s[0]) < 128:
+                # negative number
+                pack_exp = s[:2]
+                exp = 3000 - struct.unpack('>h',pack_exp)[0]
+                mant = struct.unpack('>d',chr(63)+s[2:])[0] - 1.1
+            else:
+                exp = self.X + struct.unpack('>h',s[:2])[0]
+                mant = struct.unpack('>d',chr(63)+s[2:])[0]
+            return math.ldexp(mant,exp)
+
+class FloatFile:
+
+    block_len = 10
+    offsetneg = 16384
+    offsetpos = 16384*3
+
+    def to_block(self,value):
+        if value is None:
+            return '!'+chr(0)*9
+        elif not isinstance(value,float):
+            raise ValueError,'Bad type : expected float, got %s %s' \
+                %(value,value.__class__)
+        else:
+            # get mantissa and exponent
+            # f = mant*2**exp, 0.5 <= abs(mant) < 1
+            mant,exp = math.frexp(value)
+            if value>=0:
+                pack_exp = struct.pack('>H',exp+self.offsetpos)
+                return '-'+pack_exp+struct.pack('>d',mant)[1:]
+            else:
+                pack_exp = struct.pack('>H',self.offsetneg-exp)
+                return '-'+pack_exp+struct.pack('>d',1.1+mant)[1:]
+
+    def from_block(self,block):
+        if block[0]=='!':
+            return None
+        else:
+            s = block[1:]
+            if ord(s[0])<128:
+                # negative number
+                exp = self.offsetneg-struct.unpack('>H',s[:2])[0]
+                mant = struct.unpack('>d',chr(63)+s[2:])[0] - 1.1
+            else:
+                exp = struct.unpack('>H',s[:2])[0]-self.offsetpos
+                mant = struct.unpack('>d',chr(63)+s[2:])[0]
+            return math.ldexp(mant,exp)
+
+def conv(db):
+    # update base to new version
+    of = OldFloatFile()
+    nf = FloatFile()
+    for (f,t) in db.fields.iteritems():
+        if t is float:
+            old_path = db._file[f].path
+            new_path = os.path.join(db._file[f].base,"new_"+db._file[f].name)
+            new_file = open(new_path,"wb")
+            for i,r in enumerate(db._file[f]):
+                v = of.from_block(r)
+                if v is None:
+                    new_block = r
+                else:
+                    new_block = nf.to_block(v)
+                    if nf.from_block(new_block) != v:
+                        raise ValueError,"conversion error : %s != %s" \
+                            %(v,nf.from_block(new_block))
+                new_file.write(new_block)
+            print i,"lines"
+            new_file.close()
+
+            # double-check if values are the same between old and new file
+            db._file[f].open()
+            new_file = open(new_path,"rb")
+            bl = db._file[f].block_len
+            while True:
+                old = db._file[f].read(bl)
+                if not old:
+                    break
+                new = new_file.read(bl)
+                if not of.from_block(old) == nf.from_block(new):
+                    raise ValueError, "conversion error : %s != %s" \
+                        %(of.from_block(old),nf.from_block(new))
+
+            new_file.close()
+            # replace old file
+            db.close()
+            # for safety, backup old file
+            import datetime
+            backup_name = db._file[f].name + \
+                datetime.datetime.now().strftime("%y%m%d%H%M%S")
+            os.rename(db._file[f].path,
+                os.path.join(db._file[f].base,backup_name))
+            os.rename(new_path,old_path)
+
+import buzhug
+import tkFileDialog
+
+path = tkFileDialog.askdirectory()
+if path:
+    db = buzhug.Base(path).open()
+    conv(db)
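If a converted field turns out to be broken, the recovery procedure described
in the docstring above amounts to the following sketch (the field name
'afloat', the base directory 'dummy' and the timestamp suffix are all
hypothetical):

    import os

    base_dir = 'dummy'
    # discard the newly converted field file...
    os.remove(os.path.join(base_dir, 'afloat'))
    # ...and restore the backup by stripping the datetime suffix
    os.rename(os.path.join(base_dir, 'afloat100712103000'),
              os.path.join(base_dir, 'afloat'))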
diff --git a/sublimerepl.py b/sublimerepl.py
index ae2aa719..19738cf4 100644
--- a/sublimerepl.py
+++ b/sublimerepl.py
@@ -9,11 +9,13 @@
 import sublime_plugin
 import repl
 import os
+import buzhug
 
 repl_views = {}
 
 PLATFORM = sublime.platform().lower()
 SUBLIMEREPL_DIR = os.getcwdu()
+SETTINGS_FILE = 'SublimeREPL.sublime-settings'
 
 def repl_view(view):
     id = view.settings().get("repl_id")
@@ -54,7 +56,7 @@ def subst_for_translate(window):
     res["file_path"] = os.path.dirname(filename)
     res["file_basename"] = os.path.basename(filename)
 
-    settings = sublime.load_settings('SublimeREPL.sublime-settings')
+    settings = sublime.load_settings(SETTINGS_FILE)
     for key in ["win_cmd_encoding"]:
         res[key] = settings.get(key)
     return res
@@ -131,12 +133,27 @@ def next_command(self):
 
 class History(object):
     def __init__(self):
-        self._stack = []
+        self._last = None
 
     def push(self, command):
        cmd = command.rstrip()
-        if not cmd:
+        if not cmd or cmd == self._last:
             return
+        self.append(cmd)
+        self._last = cmd
+
+    def append(self, cmd):
+        raise NotImplementedError
+
+    def match(self, command_prefix):
+        raise NotImplementedError
+
+class MemHistory(History):
+    def __init__(self):
+        super(MemHistory, self).__init__()
+        self._stack = []
+
+    def append(self, cmd):
         self._stack.append(cmd)
 
     def match(self, command_prefix):
@@ -146,6 +163,28 @@ def match(self, command_prefix):
                 matching_commands.append(cmd)
         return HistoryMatchList(command_prefix, matching_commands)
 
+
+class PersistentHistory(History):
+    def __init__(self, external_id):
+        import datetime
+        super(PersistentHistory, self).__init__()
+        path = os.path.join(sublime.packages_path(), "User", "SublimeREPLHistory")
+        self._db = buzhug.TS_Base(path)
+        self._external_id = external_id
+        self._db.create(("external_id", unicode), ("command", unicode), ("ts", datetime.datetime), mode="open")
+
+    def append(self, cmd):
+        from datetime import datetime
+        self._db.insert(external_id=self._external_id, command=cmd, ts=datetime.now())
+
+    def match(self, command_prefix):
+        import re
+        pattern = re.compile("^" + re.escape(command_prefix) + ".*")
+        results = self._db.select(None, 'external_id==eid and p.match(command)', eid=self._external_id, p=pattern)
+        results.sort_by("+ts")
+        return HistoryMatchList(command_prefix, [x.command for x in results])
+
+
 class ReplView(object):
     def __init__(self, view, repl, syntax):
         view.settings().set("repl_id", repl.id)
@@ -160,7 +199,10 @@ def __init__(self, view, repl, syntax):
         self._repl_reader = ReplReader(repl)
         self._repl_reader.start()
 
-        self._history = History()
+        if self.external_id and sublime.load_settings(SETTINGS_FILE).get("presistent_history_enabled"):
+            self._history = PersistentHistory(self.external_id)
+        else:
+            self._history = MemHistory()
         self._history_match = None
 
         # begin refreshing attached view
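For reference, a minimal sketch of the contract shared by the History
subclasses, driven through MemHistory since it needs no Sublime state (the
commands are arbitrary examples):

    h = MemHistory()
    h.push("print 'a'")
    h.push("print 'a'")         # consecutive duplicate, dropped by push()
    h.push("print 'b'")
    matches = h.match("print")  # HistoryMatchList over both stored commands

PersistentHistory honours the same push()/match() contract, but append()
writes each command to a buzhug TS_Base under Packages/User/SublimeREPLHistory
together with the view's external_id and a timestamp, and match() replays the
matching commands sorted by timestamp, so history survives restarts.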