# In [24]:
import numpy as np

def read_data(file_path):
    """Parse a k-nearest-neighbour problem file.

    File layout, as consumed by this function:

    * line 1: a single integer, ``k``;
    * line 2: two whitespace-separated integers; the first is ignored and
      the second is returned as ``dim``;
    * line 3: whitespace-separated floats forming the target point;
    * every following non-blank line: whitespace-separated floats followed
      by one final token that is kept verbatim as the class label.

    Blank lines in the data section (typically a trailing empty line at the
    end of the file) are skipped instead of raising ``IndexError``.

    Args:
        file_path: Path of the text file to read.

    Returns:
        A tuple ``(k, dim, target, data)`` where ``target`` is a NumPy array
        and ``data`` is a list of ``(index, point, label)`` triples.
        ``index`` is the zero-based position of the row within ``data``,
        ``point`` is a NumPy array and ``label`` is a string.

    Raises:
        ValueError: If a header line or a coordinate cannot be parsed.
    """
    with open(file_path, 'r') as file:
        k = int(file.readline().strip())
        _, dim = map(int, file.readline().strip().split())
        target = np.array(list(map(float, file.readline().strip().split())))
        data = []
        for line in file:
            elements = line.split()
            if not elements:
                # Blank line: nothing to parse, and elements[-1] would fail.
                continue
            *coords, label = elements
            # len(data) keeps the index equal to the row's position in the
            # returned list even when blank lines were skipped.
            data.append((len(data), np.array([float(c) for c in coords]), label))
    return k, dim, target, data

def euclidean_distance(point1, point2):
    """Return the Euclidean (L2) distance between ``point1`` and ``point2``.

    The two points are subtracted with ``-`` and the norm of the difference
    is computed by ``np.linalg.norm``.
    """
    offset = point1 - point2
    return np.linalg.norm(offset)

def nearest_neighbors(k, target, data):
    """Return the ``k`` entries of ``data`` closest to ``target``.

    Distance is Euclidean, computed with ``np.linalg.norm(target - point)``.

    Args:
        k: Number of neighbours to return. Values ``<= 0`` yield an empty
            list; values larger than the data set return every entry.
        target: Query point as a NumPy array.
        data: Iterable of ``(index, point, cls)`` triples, where ``point``
            is a NumPy array that can be subtracted from ``target``.

    Returns:
        A list of ``(distance, index, point, cls)`` tuples ordered by
        ascending distance, with ties broken by ``index``. Entries that tie
        on both keep their input order.
    """
    if k <= 0:
        # A negative k would otherwise slice [:k] and silently return
        # almost the whole data set.
        return []
    scored = [
        (np.linalg.norm(target - point), i, point, cls)
        for i, point, cls in data
    ]
    # Sort on (distance, index) only. Comparing whole tuples would fall
    # through to comparing NumPy arrays when both keys tie, which raises
    # "truth value of an array is ambiguous".
    scored.sort(key=lambda entry: entry[:2])
    return scored[:k]

def main(file_path='../tests/test_100000_2.txt'):
    """Load a k-NN problem file and print its nearest neighbours.

    Args:
        file_path: Path of the input file handed to ``read_data``. The
            default is the path that used to be hard-coded here, so calling
            ``main()`` with no arguments behaves as before.

    The value of ``k`` and the target point come from the file itself. One
    header line is printed, followed by one line per neighbour in the order
    returned by ``nearest_neighbors``.
    """
    k, _, target, data = read_data(file_path)
    neighbors = nearest_neighbors(k, target, data)
    print(f"The {k} nearest neighbors to the target {target} are:")
    # Ranks are 1-based for display; `index` is the row index from read_data.
    for rank, (distance, index, point, cls) in enumerate(neighbors, start=1):
        print(f"Neighbor {rank}: Index = {index}, Distance = {distance}, Point = {point}, Class = {cls}")

# Run the demo only when this file is executed directly, not when imported.
if __name__ == "__main__":
    main()


# The 5 nearest neighbors to the target [0.17065415 0.96277909] are:
# Neighbor 1: Index = 65157, Distance = 0.0009629712334354765, Point = [0.1709776  0.96187207], Class = 0
# Neighbor 2: Index = 6442, Distance = 0.0021316758904974128, Point = [0.17017819 0.96070123], Class = 1
# Neighbor 3: Index = 16515, Distance = 0.0028149433248297988, Point = [0.16904693 0.96046809], Class = 0
# Neighbor 4: Index = 83540, Distance = 0.0028761670564966366, Point = [0.16794506 0.9618131 ], Class = 0
# Neighbor 5: Index = 9957, Distance = 0.003253292292813717, Point = [0.17325854 0.96472873], Class = 1
