In [14]:
import numpy as np
from sklearn import datasets
from sklearn.utils import shuffle

In [15]:
def train_nb(X, y):
    """
    Train the Naive Bayes classifier. For NB this is just
    computing the necessary probabilities to perform classification
    1. The probability P(ci) for every class -> prior (the prior comes from the distribution of labels)
    2. The mean and std -> mean, std (The mean and variance are applied to each feature in the input data X)

    Inputs:
    - X: A numpy array of shape (num_train, D) containing the training data
    consisting of num_train samples each of dimension D.
    - y: A numpy array of shape (N,) containing the training labels, where
        y[i] is the label for X[i].

    Outputs:
    - prior : list with length equal to the number of classes
    - mean : A numpy array of shape (num_classes, num_features)
    - std  : A numpy array of shape (num_classes, num_features)

    **** train() should be run with X as training data
    """
    # use list comprehension

    # Separate training points by class
    unique_y = np.unique (y) # returns a list of all differente values in y -> all possible classes
    points_by_class = [[x for x, t in zip (X, y) if t == c] for c in unique_y]

    #########################################################################
    # TODO:                                                                 #
    # compute class prior                                                   #
    #########################################################################
    
    total = X.shape[0] #total number of data points
    prior = [len(x)/total for x in points_by_class]

    #########################################################################
    # TODO:                                                                 #
    # Estimate mean and std for each class / feature                        #
    #########################################################################
    
    #colMeanC0 = x_iris[y_iris==0].mean(axis = 0)
    mean = [X[y==c].mean(axis = 0) for c in unique_y]
    std = [X[y==c].var(axis = 0) for c in unique_y]
    
    return prior, np.array(mean), np.array(std)


In [16]:
def normal_distribution(x, mean, std):
    """
    Compute normal distribution
    output size: (num_input_data, num_features)

    """
    #########################################################################
    # TODO : Compute normal distribution                                    #
    #########################################################################

    #normal =

    return normal

In [92]:
def predict(X, prior, mean, std):
    """
    Using the dustributions from before, predict labels for test data (or train data) using this classifier.
    We predict the class of the data maximizing the likelihood or you can
     maximize the log likelihood to make it numericaly more stable.
     (This is possible since f(x)=log(x) is a monotone function)

    You have to compute:
    - Compute the conditional probabilities  P(x|c) (or log P(x|c) )
    - The posterior (if you compute the log likelihood the product  becomes sum)
    - Make the prediction

    Inputs:
    - X: A numpy array of shape (num_test, D) containing test data consisting
        of num_test samples each of dimension D.
    - prior, mean, std: output of train() function

    Returns:
    - y_pred : A numpy array of shape (num_test,) containing predicted labels for the
    test data, where y[i] is the predicted label for the test point X[i].

    *** predict() should be run with X as test data, based on mean and variance and prior from the training data
        (to compute the training accuracy run with X as train data)

    """
    # use list comprehension

    #################################################################################
    #        # Compute the conditional probabilities  P(x|c)                        #
    #             # There are three loops in the code.                              #
    #             # 1. through each sample.                                         #
    #             # 2. through each class.                                          #
    #             # 3. through each attribute and apply the Normal/ logNormal distribution. #
    #        # Compute the posterior                                                #
    #                                                                               #
    #################################################################################


    #########################################################################
    #                           TODO
    #             compute the posterior and predict                         #
    # - hint for prediction: class having the biggest probability[argmax()] #
    #########################################################################
    y_predd = []
    #pre = la proba prior pour chaque classe
    for x in X:
        eachClass = []
        for c in range(0,len(prior)):
            eachClass.append(prior[c] * np.prod([np.exp(-1*np.square((x[attrN]-mean[c][attrN])/(2*std[c][attrN]))) for attrN in range(0,len(x))]))
        y_predd.append(np.argmax(eachClass))
        
    return y_predd


In [93]:
def load_IRIS(test=True):
    iris = datasets.load_iris()
    X, y = shuffle(iris.data, iris.target, random_state= 400)
    if test:
        X_train = X[:100, :]
        y_train = y[:100]
        X_test = X[100:, :]
        y_test = y[100:]
        return X_train, y_train, X_test, y_test
    else:
        X = iris.data
        y = iris.target
        return X, y

In [94]:
# load the iris data set
x_iris, y_iris = load_IRIS(test=False)
X_train, y_train, X_test, y_test = load_IRIS(test=True)
# chech the shape of the data anf target
print('Data shape:', x_iris.shape)
print('Target shape:', y_iris.shape)

Data shape: (150, 4)
Target shape: (150,)


In [95]:
prior, mean, var = train_nb(x_iris, y_iris)
print(prior)
print(mean.shape)
y_predict = predict(X_test, prior, mean, var)

for i in range(0,len(y_predict)):
    rep = y_test[i] == y_predict[i]
    print("vrai : ",y_test[i], " __ predict : ", y_predict[i], " __ rep : ", rep)

[0.3333333333333333, 0.3333333333333333, 0.3333333333333333]
(3, 4)
vrai :  1  __ predict :  1  __ rep :  True
vrai :  2  __ predict :  2  __ rep :  True
vrai :  1  __ predict :  1  __ rep :  True
vrai :  1  __ predict :  1  __ rep :  True
vrai :  2  __ predict :  2  __ rep :  True
vrai :  0  __ predict :  1  __ rep :  False
vrai :  2  __ predict :  2  __ rep :  True
vrai :  1  __ predict :  1  __ rep :  True
vrai :  2  __ predict :  2  __ rep :  True
vrai :  1  __ predict :  1  __ rep :  True
vrai :  0  __ predict :  0  __ rep :  True
vrai :  1  __ predict :  1  __ rep :  True
vrai :  0  __ predict :  0  __ rep :  True
vrai :  1  __ predict :  1  __ rep :  True
vrai :  1  __ predict :  1  __ rep :  True
vrai :  1  __ predict :  1  __ rep :  True
vrai :  0  __ predict :  0  __ rep :  True
vrai :  2  __ predict :  2  __ rep :  True
vrai :  0  __ predict :  0  __ rep :  True
vrai :  2  __ predict :  2  __ rep :  True
vrai :  2  __ predict :  2  __ rep :  True
vrai :  2  __ predict :  2  