# Task 1 
## Implementing a Simple Hash Table with Collision Handling 

In [1]:
import math

class HashTable:
    """Fixed-size hash table mapping keys to values.

    Two collision strategies are supported:

    * ``"chaining"`` - every occupied slot holds a Python list of
      ``(key, value)`` pairs that hash to that slot.
    * ``"linear_probing"`` - every occupied slot holds a single
      ``(key, value)`` tuple; a colliding key is stored in the next free
      slot (wrapping around the end of the table).

    Empty slots are ``None`` in both modes.
    """

    _METHODS = ("chaining", "linear_probing")

    def __init__(self, size=10, collision_method="chaining"):
        """Create an empty table.

        Args:
            size: Number of slots; must be positive.
            collision_method: ``"chaining"`` or ``"linear_probing"``.

        Raises:
            ValueError: If ``size`` is not positive or the collision method
                is unknown (previously such a table silently ignored every
                operation or failed later with an unrelated error).
        """
        if size <= 0:
            raise ValueError("size must be a positive integer")
        if collision_method not in self._METHODS:
            raise ValueError(
                f"collision_method must be one of {self._METHODS}, "
                f"got {collision_method!r}"
            )
        self.size = size
        self.table = [None] * self.size
        self.collision_method = collision_method

    def _hash(self, key):
        """Return the home slot index of ``key``."""
        return hash(key) % self.size

    def _probe(self, key):
        """Yield every slot index once, starting at the home slot of ``key``."""
        start = self._hash(key)
        for offset in range(self.size):
            yield (start + offset) % self.size

    def insert(self, key, value):
        """Store ``value`` under ``key``, replacing any existing value.

        Raises:
            Exception: In linear-probing mode, when every slot is occupied
                by a different key.
        """
        if self.collision_method == "chaining":
            index = self._hash(key)
            bucket = self.table[index]
            if bucket is None:
                self.table[index] = [(key, value)]
                return
            for i, (k, _) in enumerate(bucket):
                if k == key:
                    bucket[i] = (key, value)
                    return
            bucket.append((key, value))
        elif self.collision_method == "linear_probing":
            for index in self._probe(key):
                entry = self.table[index]
                # First free slot, or the slot already holding this key.
                if entry is None or entry[0] == key:
                    self.table[index] = (key, value)
                    return
            raise Exception("Hash table is full")

    def get(self, key):
        """Return the value stored under ``key``, or ``None`` if absent."""
        if self.collision_method == "chaining":
            bucket = self.table[self._hash(key)]
            if bucket is not None:
                for k, v in bucket:
                    if k == key:
                        return v
            return None

        elif self.collision_method == "linear_probing":
            for index in self._probe(key):
                entry = self.table[index]
                if entry is None:
                    # An empty slot ends the cluster: the key is not stored.
                    return None
                if entry[0] == key:
                    return entry[1]
            return None

    def delete(self, key):
        """Remove ``key`` from the table.

        Returns:
            ``True`` if the key was present and removed, ``False`` otherwise.
        """
        if self.collision_method == "chaining":
            bucket = self.table[self._hash(key)]
            if bucket is not None:
                for i, (k, _) in enumerate(bucket):
                    if k == key:
                        del bucket[i]
                        return True
            return False

        elif self.collision_method == "linear_probing":
            for index in self._probe(key):
                entry = self.table[index]
                if entry is None:
                    return False
                if entry[0] == key:
                    self.table[index] = None
                    # Simply leaving a hole would cut the probe chain and
                    # hide every colliding key stored after it.
                    self._reinsert_cluster_after(index)
                    return True
            return False

    def _reinsert_cluster_after(self, hole):
        """Re-insert the entries that follow a freshly emptied slot.

        Each entry up to the next empty slot is taken out and inserted again
        so that no key is left behind a gap on its probe path. Every
        relocation moves an entry closer to its home slot, so the walk
        terminates even when the table was completely full.
        """
        index = (hole + 1) % self.size
        while self.table[index] is not None:
            key, value = self.table[index]
            self.table[index] = None
            self.insert(key, value)
            index = (index + 1) % self.size

    def __str__(self):
        """Return the string form of the raw slot list."""
        return str(self.table)


# Demo data shared by both runs: "banana" appears twice so the second
# insert exercises the update-in-place path.
fruit_values = [("apple", 1), ("banana", 2), ("orange", 3), ("grape", 4), ("banana", 5)]
# "pear" is never inserted, so its lookup shows the missing-key result.
lookup_keys = ("banana", "grape", "pear")

# --- Separate chaining ---
print("Testing HashTable with Chaining (Linked List) Collision Handling:")
ht_chaining = HashTable(collision_method="chaining")
for fruit, amount in fruit_values:
    ht_chaining.insert(fruit, amount)

print("Table after insertions:", ht_chaining)
for fruit in lookup_keys:
    print(f"Get '{fruit}':", ht_chaining.get(fruit))

ht_chaining.delete("banana")
print("Table after deleting 'banana':", ht_chaining)

# --- Linear probing ---
print("\nTesting HashTable with Linear Probing Collision Handling:")
ht_probing = HashTable(collision_method="linear_probing")
for fruit, amount in fruit_values:
    ht_probing.insert(fruit, amount)

print("Table after insertions:", ht_probing)
for fruit in lookup_keys:
    print(f"Get '{fruit}':", ht_probing.get(fruit))

ht_probing.delete("banana")
print("Table after deleting 'banana':", ht_probing)

Testing HashTable with Chaining (Linked List) Collision Handling:
Table after insertions: [None, None, [('apple', 1)], [('orange', 3)], None, [('grape', 4)], None, None, None, [('banana', 5)]]
Get 'banana': 5
Get 'grape': 4
Get 'pear': None
Table after deleting 'banana': [None, None, [('apple', 1)], [('orange', 3)], None, [('grape', 4)], None, None, None, []]

Testing HashTable with Linear Probing Collision Handling:
Table after insertions: [None, None, ('apple', 1), ('orange', 3), None, ('grape', 4), None, None, None, ('banana', 5)]
Get 'banana': 5
Get 'grape': 4
Get 'pear': None
Table after deleting 'banana': [None, None, ('apple', 1), ('orange', 3), None, ('grape', 4), None, None, None, None]


# Task 2  
## Implementing a Custom Hash Function and Analyzing Collisions 

In [None]:
pip install matplotlib

In [None]:
import random
import matplotlib.pyplot as plt

class HashTable:
    """Linear-probing table of bare keys that counts probe collisions.

    ``hash_function`` selects how the home slot is computed: ``"custom"``
    uses :meth:`custom_hash`, any other value uses :meth:`python_hash`.
    """

    def __init__(self, size=100, hash_function="custom"):
        self.size = size
        self.hash_function = hash_function
        self.collisions = 0
        self.table = [None] * self.size

    def custom_hash(self, key):
        """Return the slot for ``key`` using a base-31 polynomial hash.

        Integers map directly to ``key % size``; every other key is hashed
        character by character over its ``str()`` form.
        """
        if isinstance(key, int):
            return key % self.size
        accumulator = 0
        for symbol in str(key):
            accumulator = (accumulator * 31 + ord(symbol)) % self.size
        return accumulator

    def python_hash(self, key):
        """Return the slot for ``key`` using the built-in ``hash``."""
        return hash(key) % self.size

    def insert(self, key):
        """Place ``key`` in the first free slot at or after its home slot.

        Every occupied slot visited on the way adds one to ``collisions``.

        Raises:
            Exception: When no free slot exists.
        """
        hasher = self.custom_hash if self.hash_function == "custom" else self.python_hash
        home = hasher(key)

        for step in range(self.size):
            slot = (home + step) % self.size
            if self.table[slot] is None:
                self.table[slot] = key
                return
            self.collisions += 1
        raise Exception("Hash table is full")

    def reset(self):
        """Empty the table and zero the collision counter."""
        self.collisions = 0
        self.table = [None] * self.size

    def get_collision_count(self):
        """Return the number of collisions recorded so far."""
        return self.collisions

    def get_table(self):
        """Return the underlying slot list (``None`` marks a free slot)."""
        return self.table

def insert_large_dataset(hash_table, dataset_size, seed=42, key_range=(1, 1000000)):
    """Insert ``dataset_size`` pseudo-random integer keys into ``hash_table``.

    A private generator seeded with ``seed`` is used, so repeated calls with
    the same arguments feed the same key sequence to every table without
    reseeding (and thereby disturbing) the module-level ``random`` state.

    Args:
        hash_table: Object exposing ``insert(key)``.
        dataset_size: Number of keys to insert.
        seed: Seed for the private generator.
        key_range: Inclusive ``(low, high)`` bounds for the generated keys.
    """
    rng = random.Random(seed)
    low, high = key_range
    for _ in range(dataset_size):
        hash_table.insert(rng.randint(low, high))

def plot_histogram(hash_table, hash_function):
    """Plot a 30-bin histogram of the home slots of all stored keys.

    Args:
        hash_table: Table whose stored keys are re-hashed for the plot.
        hash_function: ``"custom"`` to use ``custom_hash``; any other value
            uses ``python_hash``. Also shown in the plot title.
    """
    if hash_function == "custom":
        hasher = hash_table.custom_hash
    else:
        hasher = hash_table.python_hash

    # Free slots are None and carry no key to hash.
    hash_values = [
        hasher(stored_key)
        for stored_key in hash_table.get_table()
        if stored_key is not None
    ]

    plt.hist(hash_values, bins=30, edgecolor="black")
    plt.title(f"Distribution of Hash Values using {hash_function} Hash Function")
    plt.xlabel("Hash Value")
    plt.ylabel("Frequency")
    plt.show()

dataset_size = 1000
# The table uses linear probing, so it can never hold more keys than it has
# slots: with only 100 slots the 101st insert raised "Hash table is full".
# Size the table from the dataset (load factor 0.5) so every key fits.
table_size = 2 * dataset_size

# Same dataset, hashed with the hand-written hash function.
ht_custom = HashTable(size=table_size, hash_function="custom")
insert_large_dataset(ht_custom, dataset_size)
print(f"Collisions with custom hash function: {ht_custom.get_collision_count()}")
plot_histogram(ht_custom, "custom")

# Same dataset, hashed with Python's built-in hash().
ht_python = HashTable(size=table_size, hash_function="python")
insert_large_dataset(ht_python, dataset_size)
print(f"Collisions with Python hash function: {ht_python.get_collision_count()}")
plot_histogram(ht_python, "python")

# Task 3 
## Implementing a Caching Mechanism using Hashing (LRU Cache)  

In [4]:
class Node:
    """Doubly linked list node holding one cache entry."""

    def __init__(self, key, value):
        self.key = key
        self.value = value
        self.prev = None
        self.next = None


class LRUCache:
    """Least-recently-used cache backed by a dict and a doubly linked list.

    The dict maps each key to its list node. The list is ordered from most
    recently used (right after ``head``) to least recently used (right
    before ``tail``); ``head`` and ``tail`` are sentinels that never hold
    real entries.
    """

    def __init__(self, capacity: int):
        """Create an empty cache holding at most ``capacity`` entries."""
        self.capacity = capacity
        self.cache = {}
        self.head = Node(0, 0)
        self.tail = Node(0, 0)
        self.head.next = self.tail
        self.tail.prev = self.head

    def _remove(self, node: Node):
        """Unlink ``node`` from the list by joining its two neighbours."""
        prev_node = node.prev
        next_node = node.next
        prev_node.next = next_node
        next_node.prev = prev_node

    def _add_to_front(self, node: Node):
        """Link ``node`` directly after ``head`` (most recently used spot)."""
        node.prev = self.head
        node.next = self.head.next
        self.head.next.prev = node
        self.head.next = node

    def get(self, key: int) -> int:
        """Return the value for ``key`` and mark it most recently used.

        Returns ``-1`` when the key is not cached.
        """
        if key in self.cache:
            node = self.cache[key]
            self._remove(node)
            self._add_to_front(node)
            return node.value
        return -1

    def put(self, key: int, value: int) -> None:
        """Insert or update ``key`` and mark it most recently used.

        When the cache is full, the least recently used entry is evicted
        first. A cache whose capacity is zero or negative stores nothing.
        """
        if self.capacity <= 0:
            # Nothing may be stored; without this guard the eviction below
            # would try to unlink the head sentinel and crash.
            return
        if key in self.cache:
            node = self.cache[key]
            node.value = value
            self._remove(node)
            self._add_to_front(node)
        else:
            if len(self.cache) >= self.capacity:
                lru_node = self.tail.prev
                self._remove(lru_node)
                del self.cache[lru_node.key]
            new_node = Node(key, value)
            self.cache[key] = new_node
            self._add_to_front(new_node)

def test_lru_cache():
    """Walk a capacity-3 cache through fills, hits and evictions, printing each lookup."""
    cache = LRUCache(3)

    # Fill the cache to capacity with keys 1..3 (value equals key).
    for key in (1, 2, 3):
        cache.put(key, key)

    print(cache.get(1))  # hit: prints 1 and makes key 1 most recently used

    cache.put(4, 4)  # over capacity: key 2 is now least recently used and is evicted
    for key in (2, 3):
        print(cache.get(key))  # 2 -> -1 (evicted), 3 -> 3

    cache.put(5, 5)  # over capacity again: key 1 is evicted
    for key in (1, 4):
        print(cache.get(key))  # 1 -> -1 (evicted), 4 -> 4


test_lru_cache()

1
-1
3
-1
4
