## import libarary

In [2]:
import numpy as np
import cv2
import tensorflow as tf
from sklearn.neighbors import KNeighborsClassifier
from sklearn.metrics import accuracy_score, confusion_matrix
from tensorflow.keras import datasets
import tensorflow_datasets as tfds
import matplotlib.pyplot as plot



##  Load the Caltech101 dataset


In [4]:
# Load the Caltech101 dataset
dataset, info = tfds.load('caltech101', with_info=True, as_supervised=True)

# Split the dataset into training and testing
train_data = dataset['train']
test_data = dataset['test']

## Convert train and test data into numpy arrays


In [6]:
def process_data(data, image_size=(32, 32)):
    images = []
    labels = []

    for image, label in data:
        # Resize image to the desired shape
        image_resized = cv2.resize(image.numpy(), image_size)
        images.append(image_resized)
        labels.append(label.numpy())
    
    return np.array(images), np.array(labels)

## Load and preprocess training and testing data


In [8]:
X_train, y_train = process_data(train_data)
X_test, y_test = process_data(test_data)

In [9]:
X_train.shape

(3059, 32, 32, 3)

## Convert images to grayscale


In [11]:
X_train_gray = np.array([cv2.cvtColor(img, cv2.COLOR_BGR2GRAY) for img in X_train])
X_test_gray = np.array([cv2.cvtColor(img, cv2.COLOR_BGR2GRAY) for img in X_test])


In [12]:
X_train_gray.shape

(3059, 32, 32)

##  Resize the images to (32, 32) for HOG computation


In [14]:
X_train_resized = np.array([cv2.resize(img, (32, 32)) for img in X_train_gray])
X_test_resized = np.array([cv2.resize(img, (32, 32)) for img in X_test_gray])

## Define HOG descriptor parameters

In [16]:
winSize = (32,32)
blockSize = (8,8)
blockStride = (4,4)
cellSize = (4,4)
nbins = 9

## Initialize the HOG descriptor

In [18]:
hog = cv2.HOGDescriptor(winSize,blockSize,blockStride,cellSize,nbins)

## Extract HOG features from the training data


In [20]:
hog_features_train = [hog.compute(image).flatten() for image in X_train_resized]
hog_features_test = [hog.compute(image).flatten() for image in X_test_resized]

## Convert the list of features into numpy arrays

In [22]:
hog_features_xtrain = np.array(hog_features_train)
hog_features_test = np.array(hog_features_test)

In [51]:
import numpy as np
from collections import Counter

def euclidean_distance(x1, x2):
    distance = np.sqrt(np.sum((x1-x2)**2))
    return distance

class KNN:
    def __init__(self, k=3):
        self.k = k

    def fit(self, X, y):
        self.X_train = X
        self.y_train = y

    def predict(self, X):
        predictions = [self._predict(x) for x in X]
        return predictions

    def _predict(self, x):
        # compute the distance
        distances = [euclidean_distance(x, x_train) for x_train in self.X_train]
    
        # get the closest k
        k_indices = np.argsort(distances)[:self.k]
        k_nearest_labels = [self.y_train[i] for i in k_indices]

        # majority voye
        most_common = Counter(k_nearest_labels).most_common()
        return most_common[0][0]

## Training the kNN model on the Training set


In [53]:
classifier = KNN(k=5)
classifier.fit(hog_features_xtrain, y_train.flatten())

## Make predictions on the test set

In [55]:
y_pred = classifier.predict(hog_features_test)


## Evaluate the classifier's performance


In [57]:
accuracy = accuracy_score(y_test.flatten(), y_pred)
print("Accuracy: ", accuracy)


Accuracy:  0.4714872637633525
