In [1]:
import numpy as np
from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score

In [2]:
# Load the iris data and hold out 30% of the samples for evaluation.
iris = load_iris()
X, y = iris.data, iris.target
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.3, random_state=42
)

# Per-class Gaussian Naive Bayes parameters, each dict keyed by class label.
classes = np.unique(y_train)
mean, var, prior = {}, {}, {}

for c in classes:
    X_c = X_train[y_train == c]              # training rows whose label is c
    prior[c] = len(X_c) / len(X_train)       # empirical class frequency
    mean[c] = X_c.mean(axis=0)               # per-feature mean
    var[c] = X_c.var(axis=0)                 # per-feature variance (NumPy default ddof=0)

def gaussian_density(x, mean, var, eps=1e-9):
    """Evaluate the univariate Gaussian probability density element-wise.

    Parameters
    ----------
    x : array_like
        Point(s) at which the density is evaluated.
    mean : array_like
        Mean of the Gaussian; must broadcast against ``x``.
    var : array_like
        Variance of the Gaussian; must broadcast against ``x``.
    eps : float, optional
        Lower bound applied to ``var`` before it is used. Variances at or
        above ``eps`` are left untouched, so results for non-degenerate
        inputs are unchanged.

    Returns
    -------
    numpy.ndarray or numpy scalar
        ``exp(-(x - mean)**2 / (2 * var)) / sqrt(2 * pi * var)`` computed
        with the floored variance.
    """
    # A constant feature has zero variance, which would turn the exponent
    # into 0/0 (NaN) and the normaliser into 0. Flooring keeps the density
    # finite instead of silently propagating NaN/inf into the posteriors.
    var = np.maximum(var, eps)
    numerator = np.exp(-(x - mean) ** 2 / (2 * var))
    denominator = np.sqrt(2 * np.pi * var)
    return numerator / denominator

def predict(X):
    """Predict a class label for every row of ``X``.

    For each sample, the unnormalised log-posterior
    ``log(prior[c]) + sum(log(gaussian_density(x, mean[c], var[c])))`` is
    computed for every class in the module-level ``classes`` array, using
    the module-level ``prior``, ``mean`` and ``var`` dictionaries. The
    label with the largest score is returned.

    Parameters
    ----------
    X : iterable of array_like
        Samples to classify, one feature vector per item.

    Returns
    -------
    numpy.ndarray
        Predicted labels drawn from ``classes``, one per sample.
    """
    preds = []
    for x in X:
        posteriors = [
            np.log(prior[c]) + np.sum(np.log(gaussian_density(x, mean[c], var[c])))
            for c in classes
        ]
        # argmax yields a position within `classes`, not a label. Index back
        # into `classes` so predictions stay correct when the labels are not
        # exactly 0..K-1 (e.g. {1, 2, 3} or a subset of the original labels).
        preds.append(classes[np.argmax(posteriors)])
    return np.array(preds)

# Score the hand-written classifier on the held-out test split.
y_pred = predict(X_test)
print(
    "Manual Gaussian Naive Bayes Accuracy:",
    accuracy_score(y_true=y_test, y_pred=y_pred),
)


Manual Gaussian Naive Bayes Accuracy: 0.9777777777777777


In [3]:
from sklearn.naive_bayes import GaussianNB
from sklearn.metrics import classification_report

# Reload the data and recreate the 70/30 train/test split with a fixed seed.
iris = load_iris()
X, y = iris.data, iris.target
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.3, random_state=42
)

# fit() returns the estimator itself, so construction and training are chained.
gnb = GaussianNB().fit(X_train, y_train)
y_pred = gnb.predict(X_test)

print("In-built GaussianNB Accuracy:", accuracy_score(y_test, y_pred))
print("\nClassification Report:\n", classification_report(y_test, y_pred))


In-built GaussianNB Accuracy: 0.9777777777777777

Classification Report:
               precision    recall  f1-score   support

           0       1.00      1.00      1.00        19
           1       1.00      0.92      0.96        13
           2       0.93      1.00      0.96        13

    accuracy                           0.98        45
   macro avg       0.98      0.97      0.97        45
weighted avg       0.98      0.98      0.98        45



In [4]:
from sklearn.datasets import load_iris
from sklearn.neighbors import KNeighborsClassifier
from sklearn.model_selection import GridSearchCV, train_test_split

# Reload the data and recreate the 70/30 train/test split with a fixed seed.
iris = load_iris()
X, y = iris.data, iris.target
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.3, random_state=42
)

# Search k = 1..20 with 5-fold cross-validation on the training split only.
knn = KNeighborsClassifier()
param_grid = {'n_neighbors': [k for k in range(1, 21)]}
grid = GridSearchCV(knn, param_grid, cv=5, scoring='accuracy')
grid.fit(X_train, y_train)

# The estimator GridSearchCV refit with the best-scoring parameters.
best_knn = grid.best_estimator_

print("Best K value:", grid.best_params_['n_neighbors'])
print("Best Cross-validation Accuracy:", grid.best_score_)
print("Test Accuracy:", best_knn.score(X_test, y_test))


Best K value: 1
Best Cross-validation Accuracy: 0.9523809523809523
Test Accuracy: 1.0
