# The BSTree data structure

## Agenda

- API
- Implementation
    - Search
    - Addition
    - Removal
    - Iteration / Traversal
- Runtime complexity

## API

In [None]:
class BSTree:
    """A binary search tree holding unique, mutually comparable values.

    This cell declares the API only: `__contains__`, `add`, `__delitem__`
    and `__iter__` are placeholders whose bodies are still to be written.
    `__len__`, `height` and `pprint` are fully functional.
    """

    class Node:
        """A single tree node: a value plus optional left/right subtrees."""

        def __init__(self, val, left=None, right=None):
            self.val = val
            self.left = left
            self.right = right

    def __init__(self):
        """Creates an empty tree."""
        self.size = 0     # number of values stored; reported by len()
        self.root = None  # root Node, or None while the tree is empty

    def __contains__(self, val):
        """Returns `True` if val is in this tree and `False` otherwise."""
        pass

    def add(self, val):
        """Adds `val` to this tree while maintaining BSTree properties."""
        assert val not in self
        pass

    def __delitem__(self, val):
        """Removes `val` from this tree while maintaining BSTree properties."""
        assert val in self
        pass

    def __iter__(self):
        """Returns an iterator over all the values in the tree, in ascending order."""
        pass

    def __len__(self):
        """Returns the number of values recorded in `self.size`."""
        return self.size

    def height(self):
        """Returns the height of the root of the tree.

        Height is counted in levels: an empty tree has height 0 and a tree
        consisting of just a root has height 1.
        """
        def height_rec(t):
            if not t:
                return 0
            else:
                return 1 + max(height_rec(t.left), height_rec(t.right))
        return height_rec(self.root)

    def pprint(self, width=64):
        """Attempts to pretty-print this tree's contents.

        One text row is printed per level. Level `k` is split into cells of
        `width // 2**k` characters, each holding a centred value or `-` for
        an empty position. Empty positions above the deepest level are
        expanded into two empty children so that lower rows stay aligned.
        """
        height = self.height()
        rows = []
        level = 0
        current = [self.root]  # every slot of the current level, left to right
        while current:
            cell = width // 2**level
            # Only levels above the deepest one need placeholder children.
            pad_missing = level < height - 1
            rows.append(''.join(
                '{val:^{width}}'.format(val='-' if n is None else n.val,
                                        width=cell)
                for n in current))
            following = []
            for n in current:
                if n is None:
                    if pad_missing:
                        following.extend((None, None))
                else:
                    if n.left or pad_missing:
                        following.append(n.left)
                    if n.right or pad_missing:
                        following.append(n.right)
            current = following
            level += 1
        print('\n'.join(rows))

In [None]:
# Hand-build a three-node tree (5 at the root, 2 and 10 as its children)
# without going through add(), then set the size to match.
t = BSTree()
t.root = BSTree.Node(5, left=BSTree.Node(2), right=BSTree.Node(10))
t.size = 3

In [None]:
# Height counts levels (an empty tree is 0), so the root-plus-two-leaves
# tree built in the previous cell has height 2.
t.height()

In [None]:
# Print the tree one row per level; '-' marks an empty position.
t.pprint()

## Implementation

### Search

In [None]:
class BSTree(BSTree):
    def __contains__(self, val):
        """Returns `True` if val is in this tree and `False` otherwise.

        Follows a single root-to-leaf path: go left when `val` is smaller
        than the current node's value, right when it is larger. The number
        of recursive calls is therefore bounded by the height of the tree.
        """
        def contains_rec(node):
            if not node:
                # Fell off the tree: val is not stored anywhere.
                return False
            elif val < node.val:
                return contains_rec(node.left)
            elif val > node.val:
                return contains_rec(node.right)
            else:
                return True
        return contains_rec(self.root)

In [None]:
# Same hand-built tree as before: root 5 with children 2 and 10.
t = BSTree()
t.root = BSTree.Node(5, BSTree.Node(2), BSTree.Node(10))
t.size = 3

In [None]:
# `in` dispatches to BSTree.__contains__; 5 is the root value of the tree
# built in the previous cell.
5 in t

### Addition

In [None]:
class BSTree(BSTree):
    def add(self, val):
        """Adds `val` to this tree while maintaining BSTree properties.

        The new value always becomes a leaf: the search path for `val` is
        followed until an empty position is found and a node is created
        there. No rebalancing is performed. `val` must not already be in
        the tree.
        """
        assert val not in self

        def add_rec(node):
            if not node:
                # Empty position reached: this is where val belongs.
                return self.Node(val)
            if val < node.val:
                node.left = add_rec(node.left)
            else:
                node.right = add_rec(node.right)
            return node

        # Re-assigning on the way back up also covers the empty-tree case.
        self.root = add_rec(self.root)
        self.size += 1

In [None]:
import random

# Insert the values 0..4 in random order and show the resulting shape.
t = BSTree()
vals = [*range(5)]
random.shuffle(vals)
for x in vals:
    t.add(x)
t.pprint()

### Removal

In [None]:
class BSTree(BSTree):
    def __delitem__(self, val):
        """Removes `val` from this tree while maintaining BSTree properties.

        Three situations arise once the node holding `val` is found:
        - it has no left child: its right subtree (possibly empty) takes
          its place;
        - it has no right child: its left subtree takes its place;
        - it has two children: it takes over the largest value of its left
          subtree, and that value is then removed from the left subtree.
        `val` must be in the tree.
        """
        assert val in self

        def delitem_rec(node, target):
            if target < node.val:
                node.left = delitem_rec(node.left, target)
            elif target > node.val:
                node.right = delitem_rec(node.right, target)
            elif not node.left:
                return node.right
            elif not node.right:
                return node.left
            else:
                # The largest value on the left is the rightmost node there.
                pred = node.left
                while pred.right:
                    pred = pred.right
                node.val = pred.val
                # That node has no right child, so removing it is a simple case.
                node.left = delitem_rec(node.left, pred.val)
            return node

        self.root = delitem_rec(self.root, val)
        self.size -= 1

In [None]:
# Fresh five-value tree for the removal demonstration below.
t = BSTree()
for x in (10, 5, 15, 2, 17):
    t.add(x)
t.pprint()

In [None]:
# Removal case: a node without children. Assuming add() does ordinary BST
# insertion in the order used above, 2 ends up as a leaf.
del t[2]
t.pprint()

In [None]:
# Rebuild the same five-value tree so the next removal starts from scratch.
t = BSTree()
for x in (10, 5, 15, 2, 17):
    t.add(x)
t.pprint()

In [None]:
# Removal case: a node with only a left child. Assuming ordinary BST
# insertion in the order used above, 5 has the single child 2.
del t[5]
t.pprint()

In [None]:
# Same starting tree again, this time for removing a node with a right child.
t = BSTree()
for x in (10, 5, 15, 2, 17):
    t.add(x)
t.pprint()

In [None]:
# Removal case: a node with only a right child. Assuming ordinary BST
# insertion in the order used above, 15 has the single child 17.
del t[15]
t.pprint()

In [None]:
# Same starting tree once more, for removing a node that has two children.
t = BSTree()
for x in (10, 5, 15, 2, 17):
    t.add(x)
t.pprint()

In [None]:
# Removal case: a node with two children. 10 was inserted first, so it is
# the root; assuming ordinary BST insertion its children are 5 and 15.
del t[10]
t.pprint()

In [None]:
class BSTree(BSTree):
    def __delitem__(self, val):
        """Removes `val` from this tree while maintaining BSTree properties.

        `delitem_rec` walks down to the node holding `val` and returns the
        subtree that should replace the one it was given, so each parent
        simply re-assigns its child link on the way back up. `val` must be
        in the tree.
        """
        assert val in self
        def delitem_rec(node):
            if val < node.val:
                node.left = delitem_rec(node.left)
                return node
            elif val > node.val:
                node.right = delitem_rec(node.right)
                return node
            else:
                if not node.left and not node.right:
                    # Leaf: the subtree simply disappears.
                    return None
                elif node.left and not node.right:
                    # Only a left child: it moves up into this position.
                    return node.left
                elif node.right and not node.left:
                    # Only a right child: it moves up into this position.
                    return node.right
                else:
                    # Two children: take over the largest value of the left
                    # subtree (its rightmost node), then unlink that node.
                    # Being rightmost it has no right child, so its left
                    # subtree can take its place directly.
                    parent, pred = node, node.left
                    while pred.right:
                        parent, pred = pred, pred.right
                    node.val = pred.val
                    if parent is node:
                        parent.left = pred.left
                    else:
                        parent.right = pred.left
                    return node

        self.root = delitem_rec(self.root)
        self.size -= 1

In [None]:
# Larger ten-value tree used to exercise removal of nodes with two children.
t = BSTree()
for x in (10, 5, 2, 7, 9, 8, 1, 15, 12, 18):
    t.add(x)
t.pprint()

In [None]:
# Assuming ordinary BST insertion in the order used above, 15 has two
# children (12 and 18), both of them leaves.
del t[15]
t.pprint()

In [None]:
# Rebuild the ten-value tree so the next removal starts from scratch.
t = BSTree()
for x in (10, 5, 2, 7, 9, 8, 1, 15, 12, 18):
    t.add(x)
t.pprint()

In [None]:
# Assuming ordinary BST insertion in the order used above, 5 has two
# children (2 and 7), each of which has descendants of its own.
del t[5]
t.pprint()

In [None]:
# Same ten-value tree again, this time for removing the root.
t = BSTree()
for x in (10, 5, 2, 7, 9, 8, 1, 15, 12, 18):
    t.add(x)
t.pprint()

In [None]:
# 10 was inserted first, so it is the root; assuming ordinary BST insertion
# it has two non-empty subtrees.
del t[10]
t.pprint()

### Iteration / Traversal

In [None]:
class BSTree(BSTree):
    def __iter__(self):
        """Returns an iterator over all the values in the tree, in ascending order.

        This is an in-order traversal: everything in a node's left subtree
        is yielded first, then the node's own value, then everything in its
        right subtree.
        """
        def iter_rec(node):
            if node:
                yield from iter_rec(node.left)
                yield node.val
                yield from iter_rec(node.right)
        return iter_rec(self.root)

In [None]:
import random

# Insert 0..19 in random order, then print whatever iterating the tree yields.
t = BSTree()
vals = [*range(20)]
random.shuffle(vals)
for x in vals:
    t.add(x)
for x in t:
    print(x)

### Iteration by Level

In [None]:
class BSTree(BSTree):
    def __iter__(self):
        """Returns an iterator over all the values in the tree, level by level.

        Values are yielded breadth-first: the root, then its children from
        left to right, then their children, and so on. Empty positions are
        skipped.
        """
        level = [self.root] if self.root else []
        while level:
            below = []  # nodes of the next level, collected left to right
            for node in level:
                yield node.val
                if node.left:
                    below.append(node.left)
                if node.right:
                    below.append(node.right)
            level = below

In [None]:
import random

# Insert 0..9 in random order and show the tree that iteration will walk.
t = BSTree()
vals = [*range(10)]
random.shuffle(vals)
for x in vals:
    t.add(x)
t.pprint()

In [None]:
# Iterate the tree through BSTree.__iter__ and print one value per line.
for x in t:
    print(x)

## Runtime Complexity

The runtime complexities of the search, add, and delete methods of the binary search tree ultimately depend on the depth of recursion in their implementations. The depth of recursion, in turn, depends on the height of the binary search tree.

Given $N$ nodes, the worst-case height of a binary search tree = ?

This gives us the following worst-case runtime complexities:

- Search = O(?)
- Add = O(?)
- Delete = O(?)

How can we improve this runtime complexity? What should be our target runtime complexity?