In [9]:
import numpy as np

def read_data(file_path):
    """Load a nearest-neighbour problem from a whitespace-separated text file.

    Expected layout of the file:
        line 1: ``k`` as an integer
        line 2: two integers; the first is ignored, the second is returned
                as ``dim``
        line 3: the coordinates of the target point
        rest:   one data row per line -- coordinates followed by a class
                label as the last token

    Blank lines among the data rows (for example a trailing empty line) are
    skipped instead of raising ``IndexError``.

    Args:
        file_path: Path of the file to read.

    Returns:
        A tuple ``(k, dim, target, data)`` where ``target`` is a NumPy array
        and ``data`` is a list of ``(index, point, label)`` tuples. ``index``
        is the 0-based position of the row among the data rows, ``point`` is
        a NumPy array of floats and ``label`` is kept as the raw string.

    Raises:
        ValueError: If a header value or a coordinate is not numeric.
    """
    with open(file_path, 'r') as file:
        k = int(file.readline().strip())
        _, dim = map(int, file.readline().strip().split())
        target = np.array([float(token) for token in file.readline().split()])
        data = []
        for line in file:
            elements = line.split()
            if not elements:
                # Blank line: there is no label token to split off.
                continue
            *coords, label = elements
            # len(data) numbers rows by their position among real data rows.
            data.append((len(data), np.array([float(c) for c in coords]), label))
        return k, dim, target, data

def euclidean_distance(point1, point2):
    """Return the Euclidean (L2) distance between ``point1`` and ``point2``."""
    offset = point1 - point2
    return np.linalg.norm(offset)

def nearest_neighbors(k, target, data):
    """Return the ``k`` entries of ``data`` closest to ``target``.

    Args:
        k: Number of neighbours to return. Values <= 0 yield an empty list.
        target: The query point.
        data: Iterable of ``(index, point, cls)`` tuples.

    Returns:
        A list of at most ``k`` tuples ``(distance, index, point, cls)``
        ordered by ascending distance, with ties broken by ascending index.
    """
    import heapq
    from operator import itemgetter

    # Feed candidates lazily so only the k best are held at once, rather
    # than building and sorting a list with one tuple per data point.
    candidates = (
        (euclidean_distance(target, point), i, point, cls)
        for i, point, cls in data
    )
    # Order on (distance, index) only: comparing the full tuples would fall
    # through to the NumPy point arrays whenever distance and index both
    # tie, and an array comparison has no single truth value.
    return heapq.nsmallest(k, candidates, key=itemgetter(0, 1))

def main(file_path='../tests/test_10000000_2.txt'):
    """Read a nearest-neighbour problem file and print its k nearest neighbours.

    Args:
        file_path: Path of the input file, in the format ``read_data``
            parses. Defaults to the path that used to be hard-coded here,
            so ``main()`` with no arguments behaves as before.
    """
    # The dimensionality returned by read_data is not needed for the search.
    k, _, target, data = read_data(file_path)
    neighbors = nearest_neighbors(k, target, data)
    print(f"The {k} nearest neighbors to the target {target} are:")
    # Ranks are reported 1-based.
    for rank, (distance, index, point, cls) in enumerate(neighbors, start=1):
        print(f"Neighbor {rank}: Index = {index}, Distance = {distance}, Point = {point}, Class = {cls}")

# Run the search only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()


The 5 nearest neighbors to the target [0.52779334 0.16805235] are:
Neighbor 1: Index = 5385596, Distance = 7.321434342576356e-05, Point = [0.52781698 0.16798306], Class = 0
Neighbor 2: Index = 5586861, Distance = 0.00014039886092114093, Point = [0.52790922 0.16797308], Class = 0
Neighbor 3: Index = 1440551, Distance = 0.00021854587389177028, Point = [0.52798451 0.16815825], Class = 0
Neighbor 4: Index = 4352519, Distance = 0.000306072581994888, Point = [0.52763685 0.16778931], Class = 0
Neighbor 5: Index = 7116525, Distance = 0.00039872494989017096, Point = [0.52803572 0.16836895], Class = 1
