# In [1]:
import numpy as np

def read_data(file_path):
    """Load a k-nearest-neighbours problem from a whitespace-separated text file.

    The file layout, as consumed here, is:

    * line 1: ``k`` as an integer;
    * line 2: two integers, of which only the second (``dim``) is kept;
    * line 3: the target point's coordinates as floats;
    * remaining lines: one record per line -- float coordinates followed by a
      class label, which is kept as a string.

    Blank lines among the records (for example a trailing empty line) are
    skipped instead of raising ``IndexError``.

    Args:
        file_path: Path of the text file to read.

    Returns:
        A tuple ``(k, dim, target, data)``. ``target`` is a NumPy array and
        ``data`` is a list of ``(index, point, label)`` tuples, where ``index``
        is the zero-based position of the record among the non-blank record
        lines and ``point`` is a NumPy array.

    Raises:
        ValueError: If a header value or a coordinate cannot be parsed.
    """
    with open(file_path, 'r') as file:
        k = int(file.readline().strip())
        _, dim = map(int, file.readline().strip().split())
        target = np.array([float(value) for value in file.readline().split()])

        data = []
        for line in file:
            elements = line.split()
            if not elements:
                # Blank line: there is no label to take, so skip it.
                continue
            point = np.array([float(value) for value in elements[:-1]])
            # len(data) numbers the records consecutively from zero.
            data.append((len(data), point, elements[-1]))
    return k, dim, target, data

def euclidean_distance(point1, point2):
    """Return the distance between two points as ``np.linalg.norm`` of their difference.

    Args:
        point1: Coordinates of the first point (NumPy array or any array-like
            such as a list or tuple).
        point2: Coordinates of the second point, same length as ``point1``.

    Returns:
        The norm of ``point1 - point2``; for 1-D inputs this is the Euclidean
        (L2) distance.
    """
    # np.asarray leaves ndarrays untouched and lets plain sequences be
    # subtracted element-wise (list - list would raise TypeError).
    return np.linalg.norm(np.asarray(point1) - np.asarray(point2))

def nearest_neighbors(k, target, data):
    """Return the ``k`` entries of ``data`` closest to ``target``.

    Args:
        k: Number of neighbours to keep (applied as the slice ``[:k]``).
        target: Coordinates of the query point.
        data: Iterable of ``(index, point, label)`` tuples.

    Returns:
        A list of ``(distance, index, point, label)`` tuples ordered by
        increasing distance, with ties broken by index. Entries that tie on
        both keep their input order.
    """
    distances = [(euclidean_distance(target, point), i, point, cls) for i, point, cls in data]
    # Sort on (distance, index) only. Comparing whole tuples would fall
    # through to the NumPy point arrays when both distance and index tie, and
    # array comparison raises ValueError (ambiguous truth value).
    distances.sort(key=lambda entry: entry[:2])
    return distances[:k]

def main(file_path='../tests/test_1000000_2.txt'):
    """Read a k-NN problem file and print the nearest neighbours of its target.

    Args:
        file_path: Path of the input file. Defaults to the bundled test file,
            so calling ``main()`` with no argument behaves as before.
    """
    k, _, target, data = read_data(file_path)
    neighbors = nearest_neighbors(k, target, data)
    print(f"The {k} nearest neighbors to the target {target} are:")
    # Ranks are reported starting at 1.
    for i, (distance, index, point, cls) in enumerate(neighbors, start=1):
        print(f"Neighbor {i}: Index = {index}, Distance = {distance}, Point = {point}, Class = {cls}")

# Run the demo only when this file is executed as a script, not when imported.
if __name__ == "__main__":
    main()


# The 5 nearest neighbors to the target [0.05258246 0.3017383 ] are:
# Neighbor 1: Index = 634452, Distance = 0.00019202440194769063, Point = [0.05242023 0.30163556], Class = 0
# Neighbor 2: Index = 980052, Distance = 0.0012304294563180924, Point = [0.0525011  0.30296604], Class = 0
# Neighbor 3: Index = 764178, Distance = 0.0012470817447754164, Point = [0.05172992 0.30264846], Class = 0
# Neighbor 4: Index = 845420, Distance = 0.001249274059512119, Point = [0.05315436 0.30284898], Class = 0
# Neighbor 5: Index = 256456, Distance = 0.0013531954643986898, Point = [0.05204694 0.30298102], Class = 1
