In [1]:
import numpy as np
from sklearn import datasets
from numpy.random import MT19937
from numpy.random import RandomState, SeedSequence

In [2]:
#                    Description of the dataset
#  data : {ndarray, dataframe} of shape (150, 4)
#             The data matrix. If `as_frame=True`, `data` will be a pandas
#             DataFrame.
#         target: {ndarray, Series} of shape (150,)
#             The classification target. If `as_frame=True`, `target` will be
#             a pandas Series.
#         feature_names: list
#             The names of the dataset columns.
#         target_names: list
#             The names of target classes.
#         frame: DataFrame of shape (150, 5)
#             Only present when `as_frame=True`. DataFrame with `data` and
#             `target`.

In [3]:
# Creating an output array
def target_array(raw_target):
    target = []
    for i in range(len(raw_target)):
        if raw_target[i] == 0:
            target.append([1, 0, 0])
        elif raw_target[i] == 1:
            target.append([0, 1, 0])
        else:
            target.append([0, 0, 1])
    return np.array(target, dtype="uint8")
    

In [4]:
# Loading the Iris dataset
iris = datasets.load_iris()

data = iris.data
target = target_array(iris.target)

# Mixing data
rs1 = RandomState(MT19937(SeedSequence(0)))
rs1.shuffle(data)
rs2 = RandomState(MT19937(SeedSequence(0)))
rs2.shuffle(target)

In [5]:

# Sigmoid 
# Activation function
def activation_func(x):
    z = 1 / (1 + (np.e ** -x))
    return z


# Derivative of the activation function
def deriv_activation_func(x):
    z = activation_func(x)
    return z * (1 - z)
    

0 - input layer  
1 - hidden layer  
2 - output layer  
weights_1_to_2 - Weights linking the hidden layer and the output layer

In [6]:
# Neural network learning function
def neural_network_training(weights_0_to_1,
                            weights_1_to_2,
                            data,
                            target,
                            number_training_data,
                            epochs=5,
                            alpha=0.5):
    epoch_print_step = 100
    for epoch in range(epochs):
        if epoch % epoch_print_step == 0:
            print(f"\nepoch: {epoch + 1}")
        for i in range(number_training_data):
            # Forward propagation
            layer_0 = data[i:i + 1]
            layer_1 = activation_func(np.dot(layer_0, weights_0_to_1))
            layer_2 = np.dot(layer_1, weights_1_to_2)

            # Error calculation
            layer_2_delta = layer_2 - target[i:i + 1]
            layer_1_delta = layer_2_delta.dot(weights_1_to_2.T) * deriv_activation_func(layer_1)
            
            # Backpropagation
            weights_1_to_2 -= alpha * layer_1.T.dot(layer_2_delta)
            weights_0_to_1 -= alpha * layer_0.T.dot(layer_1_delta)
            
            # Output of a part of the data
            if epoch % epoch_print_step == 0 and i >= 10 and i <= 13:
                print(f"{np.argmax(layer_2) == np.argmax(target[i])} Error: {np.sum((layer_2 - target[i]) ** 2):.5f}, out = {layer_2}, target = {target[i]}")
  
    return weights_0_to_1, weights_1_to_2

In [7]:
# Declaring parameters for a neural network
# epochs = 1000
epochs = 401
alpha = 0.002

number_test_data = 30
len_data = len(data)
number_training_data = len_data - number_test_data
layer_1_size = 7

np.random.seed(1)
weights_0_to_1 = np.random.rand(len(data[0]), layer_1_size)
weights_1_to_2 = np.random.rand(layer_1_size, len(target[0]))

In [8]:
# Neural network training
weights_0_to_1, weights_1_to_2 = neural_network_training(weights_0_to_1,
                                                         weights_1_to_2,
                                                         data,
                                                         target,
                                                         number_training_data,
                                                         epochs,
                                                         alpha)


epoch: 1
False Error: 25.54148, out = [[3.94733738 2.84074416 2.56352651]], target = [0 1 0]
False Error: 25.18416, out = [[3.91645734 2.83583354 2.54464839]], target = [0 1 0]
False Error: 24.52973, out = [[3.86569491 2.81239944 2.51024651]], target = [0 1 0]
True Error: 19.38313, out = [[3.59542583 2.69429709 2.32113275]], target = [1 0 0]

epoch: 101
False Error: 0.66315, out = [[0.11318183 0.35784689 0.48782673]], target = [0 1 0]
False Error: 0.63308, out = [[-0.04612703  0.43093368  0.55417976]], target = [0 1 0]
False Error: 0.66040, out = [[0.17506613 0.36160125 0.47137845]], target = [0 1 0]
True Error: 0.01403, out = [[ 0.96828721  0.09436308 -0.06421402]], target = [1 0 0]

epoch: 201
False Error: 0.56846, out = [[0.0447029  0.40405496 0.45968266]], target = [0 1 0]
False Error: 0.53804, out = [[-0.03050791  0.45932017  0.49474313]], target = [0 1 0]
False Error: 0.62178, out = [[0.08159361 0.3885914  0.49122522]], target = [0 1 0]
True Error: 0.01440, out = [[ 0.95024803  

In [9]:
def сhecking_accuracy(data, target):    
    if np.argmax(data) == np.argmax(target):
        print("True")
        return
    print(f"False: {data}, {target}")

In [10]:
def neural_network_test(weights_0_to_1,
                        weights_1_to_2,
                        data,
                        target,
                        number_test_data,
                        len_data):
    # print(len_data - number_test_data, len_data)
    for i in range(len_data - number_test_data, len_data):
        layer_0 = data[i:i + 1]
        layer_1 = activation_func(np.dot(layer_0, weights_0_to_1))
        layer_2 = np.dot(layer_1, weights_1_to_2)
        # error = np.sum((layer_2 - target[i]) ** 2)
        
        сhecking_accuracy(layer_2, target[i])
        # print(f"target = out: {np.argmax(target[i]) == np.argmax(layer_2)}\terror = {error:.4f}")
        # print(f"target = {target[i]}, out = {layer_2},\terror = {error:.4f}")

In [11]:
neural_network_test(weights_0_to_1,
                    weights_1_to_2,
                    data,
                    target,
                    number_test_data,
                    len_data)

False: [[0.0007769  0.37166118 0.6624042 ]], [0 1 0]
True
False: [[0.05885595 0.28284957 0.73122963]], [0 1 0]
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
False: [[0.0715963  0.29858262 0.68679694]], [0 1 0]
True
True
True


In [12]:
def neural_network(weights_0_to_1,
                   weights_1_to_2,
                   data):
    layer_0 = data
    layer_1 = activation_func(np.dot(layer_0, weights_0_to_1))
    layer_2 = np.dot(layer_1, weights_1_to_2)    
    return layer_2

In [13]:
for i in range(20):
    number = np.random.randint(0, 150)
    prediction = neural_network(weights_0_to_1,
                                weights_1_to_2,
                                data[number])
    сhecking_accuracy(prediction, target[number])

True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
True
False: [0.05669564 0.34435836 0.62726512], [0 1 0]
