# In [None]:
# Iris classification with K-Nearest Neighbors
# This notebook loads the local `dataset/iris.data`, trains a KNN classifier,
# evaluates it, and saves the trained model to `model.joblib`.

import pathlib
import numpy as np
import pandas as pd
from sklearn.model_selection import train_test_split, GridSearchCV
from sklearn.neighbors import KNeighborsClassifier
from sklearn.preprocessing import StandardScaler
from sklearn.pipeline import Pipeline
from sklearn.metrics import accuracy_score, classification_report, confusion_matrix
import joblib

# --- Load data ---------------------------------------------------------------
# The CSV is read with header=None, so the column names are assigned explicitly.
DATA_PATH = pathlib.Path('dataset') / 'iris.data'
df = pd.read_csv(DATA_PATH, header=None)
df.columns = ['sepal_length', 'sepal_width', 'petal_length', 'petal_width', 'class']
df['class'] = df['class'].astype(str)

# Quick look
print('Rows, cols:', df.shape)
print(df['class'].value_counts())
# A bare `df.head()` in the middle of a cell/script is evaluated and discarded;
# print it so the preview is actually shown.
print(df.head())

# First four columns are the features, the 'class' column is the target.
X = df.iloc[:, :4].values
y = df['class'].values

# --- Split -------------------------------------------------------------------
# 80/20 split with a fixed seed; stratify=y passes the labels so the split is
# stratified by class.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42, stratify=y
)

# --- Model -------------------------------------------------------------------
# Pipeline: scaling + KNN. Keeping the scaler inside the pipeline means it is
# fitted together with the classifier on whatever data the pipeline is fit on.
pipe = Pipeline([('scaler', StandardScaler()), ('knn', KNeighborsClassifier())])

# Grid search for best k, weighting scheme and distance metric
param_grid = {
    'knn__n_neighbors': [3, 5, 7, 9],
    'knn__weights': ['uniform', 'distance'],
    'knn__p': [1, 2],  # 1=Manhattan, 2=Euclidean
}
gs = GridSearchCV(pipe, param_grid, cv=5, n_jobs=-1)
gs.fit(X_train, y_train)

print('Best params:', gs.best_params_)

# --- Evaluate on the held-out test set ----------------------------------------
best = gs.best_estimator_
y_pred = best.predict(X_test)

print('Accuracy:', accuracy_score(y_test, y_pred))
# Per-class metrics and confusion matrix for the test-set predictions.
print('\nClassification report:\n', classification_report(y_test, y_pred))
print('Confusion matrix:\n', confusion_matrix(y_test, y_pred))

# Save model
joblib.dump(best, 'model.joblib')
print('Saved model to model.joblib')


# Small helper: predict on a custom sample
def predict_sample(sample):
    """Predict the class of a single sample using the saved model.

    Args:
        sample: iterable of 4 feature values.

    Returns:
        The first (only) element of the model's prediction for the sample.

    Note:
        The model is re-loaded from 'model.joblib' on every call.
        joblib files are pickle-based; only load files you trust.
    """
    model = joblib.load('model.joblib')
    # Reshape the flat sample into a single-row 2-D array for predict().
    sample_arr = np.array(sample).reshape(1, -1)
    return model.predict(sample_arr)[0]


# Example
example = [5.1, 3.5, 1.4, 0.2]  # expect Iris-setosa
print('Example prediction for', example, '->', predict_sample(example))