In [1]:
""" Q1. Write a Python code to implement the KNN classifier algorithm on load_iris dataset in
sklearn.datasets. """

from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split
from sklearn.neighbors import KNeighborsClassifier
from sklearn.metrics import accuracy_score

# Fetch the bundled iris data: feature matrix goes to X, class labels to y
iris = load_iris()
X = iris.data
y = iris.target

# Hold out 20% of the samples for testing; the fixed seed keeps the split repeatable
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
)

# Build a 3-nearest-neighbours classifier and train it in a single expression
# (fit() returns the estimator itself, so the name is bound to the fitted model)
knn_classifier = KNeighborsClassifier(n_neighbors=3).fit(X_train, y_train)

# Label the held-out samples, then score the predictions against the true labels
y_pred = knn_classifier.predict(X_test)
accuracy = accuracy_score(y_test, y_pred)

print(f'Accuracy: {accuracy}')

Accuracy: 1.0


In [6]:
""" Q3. Write a Python code snippet to find the optimal value of K for the KNN classifier algorithm using
cross-validation on load_iris dataset in sklearn.datasets. """

from sklearn.model_selection import GridSearchCV

# Relies on X_train / y_train produced by the earlier train/test split

# Candidate neighbour counts to evaluate: K = 1 .. 20
param_grid = dict(n_neighbors=range(1, 21))

# Unfitted estimator handed to the grid search
knn_classifier = KNeighborsClassifier()

# 5-fold cross-validated search over the candidates, run on the training data only
grid_search = GridSearchCV(estimator=knn_classifier, param_grid=param_grid, cv=5)
grid_search.fit(X_train, y_train)

# Report the neighbour count that the search selected
optimal_k = grid_search.best_params_['n_neighbors']
print(f'Optimal K: {optimal_k}')

Optimal K: 3


In [7]:
""" Q4. Implement the KNN regressor algorithm with feature scaling on load_boston dataset in
sklearn.datasets. """

# KNeighborsRegressor and mean_squared_error are imported here because no other
# visible cell brings them into scope; without these lines a fresh-kernel run of
# this cell stops with NameError.
from sklearn.metrics import mean_squared_error
from sklearn.neighbors import KNeighborsRegressor
from sklearn.preprocessing import StandardScaler

# NOTE(review): the prompt names load_boston, which was removed in scikit-learn 1.2.
# This cell loads no dataset itself; it regresses on whatever X_train, X_test,
# y_train, y_test are currently in scope (the iris split, going by the cells
# visible in this notebook) -- confirm that is the intended data.

# Standardize the features: the scaler is fitted on the training data only and the
# same fitted scaler is then applied to the test data
scaler = StandardScaler()
X_train_scaled = scaler.fit_transform(X_train)
X_test_scaled = scaler.transform(X_test)

# Initialize KNN regressor
knn_regressor = KNeighborsRegressor(n_neighbors=3)

# Fit the regressor to the scaled training data
knn_regressor.fit(X_train_scaled, y_train)

# Make predictions on the scaled test set
y_pred_scaled = knn_regressor.predict(X_test_scaled)

# Evaluate the mean squared error
mse_scaled = mean_squared_error(y_test, y_pred_scaled)
print(f'Mean Squared Error with Feature Scaling: {mse_scaled}')

Mean Squared Error with Feature Scaling: 0.007407407407407404


In [8]:
""" Q5. Write a Python code snippet to implement the KNN classifier algorithm with weighted voting on
load_iris dataset in sklearn.datasets. """

# Uses the train/test split already present in the notebook namespace

# 3-NN classifier configured with weights='distance', trained immediately through
# the chained fit() call (fit() returns the estimator itself)
knn_classifier_weighted = KNeighborsClassifier(
    n_neighbors=3,
    weights='distance',
).fit(X_train, y_train)

# Classify the held-out samples
y_pred_weighted = knn_classifier_weighted.predict(X_test)

# Compare the predictions with the true labels and report the accuracy
accuracy_weighted = accuracy_score(y_test, y_pred_weighted)
print(f'Accuracy with Weighted Voting: {accuracy_weighted}')

Accuracy with Weighted Voting: 1.0


In [9]:
""" Q6. Implement a function to standardise the features before applying KNN classifier. """

from sklearn.preprocessing import StandardScaler

def standardize_features(X_train, X_test):
    """Standardize two feature sets with a scaler fitted on the training set.

    A single StandardScaler is fitted on ``X_train`` and then applied to both
    inputs, so ``X_test`` plays no part in estimating the scaling parameters.

    Parameters
    ----------
    X_train : array-like
        Training features; used both to fit the scaler and to be transformed.
    X_test : array-like
        Test features; only transformed.

    Returns
    -------
    tuple
        ``(X_train_std, X_test_std)`` -- the transformed training and test features.
    """
    feature_scaler = StandardScaler().fit(X_train)
    return feature_scaler.transform(X_train), feature_scaler.transform(X_test)

# Usage:
# X_train_std, X_test_std = standardize_features(X_train, X_test)
# Then use X_train_std, X_test_std in the KNN classifier


In [10]:
""" Q7. Write a Python function to calculate the euclidean distance between two points. """

import numpy as np

def euclidean_distance(point1, point2):
    """Return the Euclidean (L2) distance between two points.

    Parameters
    ----------
    point1, point2 : array-like of real numbers
        Coordinates of the two points. Lists, tuples and NumPy arrays are all
        accepted; the two shapes must match or be broadcastable.

    Returns
    -------
    numpy.float64
        Square root of the sum of squared coordinate differences.
    """
    # Coerce to float arrays so plain lists/tuples can be subtracted, and so narrow
    # or unsigned integer dtypes cannot wrap around when differenced and squared.
    coords_a = np.asarray(point1, dtype=float)
    coords_b = np.asarray(point2, dtype=float)
    return np.sqrt(np.sum((coords_a - coords_b) ** 2))

# Usage:
# dist = euclidean_distance(point1, point2)

In [11]:
""" Q8. Write a Python function to calculate the manhattan distance between two points. """

def manhattan_distance(point1, point2):
    """Return the Manhattan (L1) distance between two points.

    Parameters
    ----------
    point1, point2 : array-like of numbers
        Coordinates of the two points. Lists, tuples and NumPy arrays are all
        accepted; the two shapes must match or be broadcastable.

    Returns
    -------
    numpy scalar
        Sum of the absolute coordinate differences. The dtype follows the inputs,
        so integer coordinates give an integer distance.

    Notes
    -----
    Input dtypes are preserved, so unsigned integer arrays still wrap around on
    subtraction; cast such inputs to a signed or floating dtype before calling.
    """
    # np.asarray lets plain lists/tuples be subtracted element-wise; arrays that
    # are passed in are used as they are.
    coords_a = np.asarray(point1)
    coords_b = np.asarray(point2)
    return np.sum(np.abs(coords_a - coords_b))

# Usage:
# dist_manhattan = manhattan_distance(point1, point2)