In [55]:
import gzip
import pickle
import torch

from tqdm import tqdm

In [56]:
class Model:
    LEARNING_RATE = 0.01

    def __init__(self, input_dimensions, output_dimensions):
        self.input_dimensions = input_dimensions
        self.output_dimensions = output_dimensions
        self.biases = None  # shape: (1, 10)
        self.weights = None  # shape: (784, 10)
        self.training_set = None
        self.validation_set = None
        self.testing_set = None

    @staticmethod
    def sigmoid(z):
        return 1.0 / (1.0 + torch.exp(-z))

    def load_input(self):
        def _map_data(given_set):
            data = given_set[0]
            tags = given_set[1]
            output = []

            for index in range(len(tags)):
                output += [(torch.from_numpy(data[index]).view(1, self.input_dimensions), tags[index])]

            return output

        with gzip.open("mnist.pkl.gz", "rb") as fd:
            training_set, validation_set, testing_set = pickle.load(fd, encoding='latin')

        self.training_set = _map_data(training_set)
        self.validation_set = _map_data(validation_set)
        self.testing_set = _map_data(testing_set)

    def load_params(self):
        self.biases = torch.rand(1, self.output_dimensions, dtype=torch.float32)  # 1, 784
        self.weights = torch.rand(self.input_dimensions, self.output_dimensions, dtype=torch.float32)  # 784, 10

    def train_online(self, data_set, max_iterations, learning_rate):
        iterations = max_iterations
        all_classified = False

        while not all_classified and iterations > 0:
            iterations -= 1
            all_classified = True
            for input_values, correct_tag in tqdm(data_set, unit=" entries",
                                                  desc=f"Epoch {max_iterations - iterations}/{max_iterations}"):
                expected_result = torch.tensor([1 if i == correct_tag else 0 for i in range(self.output_dimensions)],
                                               dtype=torch.float32)
                output = torch.matmul(input_values, self.weights) + self.biases
                activated_output = Model.sigmoid(output)

                self.weights = self.weights + torch.matmul(input_values.view(self.input_dimensions, 1),
                                                           (expected_result - activated_output).view(1,
                                                                                                     self.output_dimensions)) * learning_rate
                self.biases = self.biases + (expected_result - activated_output) * learning_rate

                if not torch.equal(activated_output, expected_result):
                    all_classified = False

    def train_mini_batch(self, data_set, max_iterations, nr_batches, learning_rate):
        iterations = max_iterations
        all_classified = False
        while not all_classified and iterations > 0:
            iterations -= 1
            all_classified = True
            batch_size = len(data_set) // nr_batches

            for batch_index in tqdm(range(nr_batches), unit=" mini batches",
                                    desc=f"Epoch {max_iterations - iterations}/{max_iterations}"):
                delta_weights = torch.zeros(self.input_dimensions, self.output_dimensions, dtype=torch.float32)
                delta_biases = torch.zeros(self.output_dimensions, dtype=torch.float32)
                batch = data_set[batch_index * batch_size: (batch_index + 1) * batch_size]

                for input_values, correct_tag in batch:
                    expected_result = torch.tensor(
                        [1 if i == correct_tag else 0 for i in range(self.output_dimensions)], dtype=torch.float32)
                    output = torch.matmul(input_values, self.weights) + self.biases
                    activated_output = Model.sigmoid(output)

                    delta_weights = delta_weights + torch.matmul(input_values.view(self.input_dimensions, 1),
                                                                 (expected_result - activated_output).view(1,
                                                                                                           self.output_dimensions)) * learning_rate
                    delta_biases = delta_biases + (expected_result - activated_output) * learning_rate

                    if not torch.equal(activated_output, expected_result):
                        all_classified = False

                self.weights += delta_weights
                self.biases += delta_biases

    def predict(self, input_values):
        output = torch.matmul(input_values, self.weights) + self.biases
        activated_output = Model.sigmoid(output)
        return torch.argmax(activated_output).item()

    def test_model(self, data_set):
        wrong_predictions = 0
        correct_predictions = 0

        for input_values, correct_tag in data_set:
            predicted_value = self.predict(input_values)
            if predicted_value == correct_tag:
                correct_predictions += 1
            else:
                wrong_predictions += 1

        print(f"Correct: {correct_predictions}, "
              f"Wrong: {wrong_predictions},"
              f" Total: {correct_predictions + wrong_predictions}, "
              f"Accuracy: {int(correct_predictions / (correct_predictions + wrong_predictions) * 10000.) / 100}%\n")

In [57]:
model = Model(784, 10)
model.load_input()
model.load_params()
print('Results BEFORE training:')
model.test_model(model.testing_set)

model.train_online(model.training_set, 10, 0.05)

print('Results on testing set AFTER online training:')
model.test_model(model.testing_set)

print('Results on validation set AFTER online training:')
model.test_model(model.validation_set)

Results BEFORE training:
Correct: 1002, Wrong: 8998, Total: 10000, Accuracy: 10.02%


Epoch 1/10: 100%|██████████| 50000/50000 [00:01<00:00, 34287.25 entries/s]
Epoch 2/10: 100%|██████████| 50000/50000 [00:01<00:00, 34328.02 entries/s]
Epoch 3/10: 100%|██████████| 50000/50000 [00:01<00:00, 34298.89 entries/s]
Epoch 4/10: 100%|██████████| 50000/50000 [00:01<00:00, 32856.00 entries/s]
Epoch 5/10: 100%|██████████| 50000/50000 [00:01<00:00, 32802.79 entries/s]
Epoch 6/10: 100%|██████████| 50000/50000 [00:01<00:00, 32802.31 entries/s]
Epoch 7/10: 100%|██████████| 50000/50000 [00:01<00:00, 33858.63 entries/s]
Epoch 8/10: 100%|██████████| 50000/50000 [00:01<00:00, 34527.43 entries/s]
Epoch 9/10: 100%|██████████| 50000/50000 [00:01<00:00, 34495.96 entries/s]
Epoch 10/10: 100%|██████████| 50000/50000 [00:01<00:00, 34504.30 entries/s]


Results on testing set AFTER online training:
Correct: 8950, Wrong: 1050, Total: 10000, Accuracy: 89.5%

Results on validation set AFTER online training:
Correct: 8986, Wrong: 1014, Total: 10000, Accuracy: 89.86%


In [58]:
model = Model(784, 10)
model.load_input()
model.load_params()

print('Results BEFORE training:')
model.test_model(model.testing_set)

model.train_mini_batch(model.training_set, 10, 256, Model.LEARNING_RATE)

print('Results on testing set AFTER mini-batch training:')
model.test_model(model.testing_set)

print('Results on validation set AFTER mini-batch training:')
model.test_model(model.validation_set)

Results BEFORE training:
Correct: 980, Wrong: 9020, Total: 10000, Accuracy: 9.8%


Epoch 1/10: 100%|██████████| 256/256 [00:01<00:00, 176.57 mini batches/s]
Epoch 2/10: 100%|██████████| 256/256 [00:01<00:00, 175.84 mini batches/s]
Epoch 3/10: 100%|██████████| 256/256 [00:01<00:00, 175.98 mini batches/s]
Epoch 4/10: 100%|██████████| 256/256 [00:01<00:00, 177.24 mini batches/s]
Epoch 5/10: 100%|██████████| 256/256 [00:01<00:00, 176.97 mini batches/s]
Epoch 6/10: 100%|██████████| 256/256 [00:01<00:00, 177.05 mini batches/s]
Epoch 7/10: 100%|██████████| 256/256 [00:01<00:00, 177.23 mini batches/s]
Epoch 8/10: 100%|██████████| 256/256 [00:01<00:00, 176.91 mini batches/s]
Epoch 9/10: 100%|██████████| 256/256 [00:01<00:00, 177.17 mini batches/s]
Epoch 10/10: 100%|██████████| 256/256 [00:01<00:00, 177.12 mini batches/s]


Results on testing set AFTER mini-batch training:
Correct: 9043, Wrong: 957, Total: 10000, Accuracy: 90.43%

Results on validation set AFTER mini-batch training:
Correct: 9130, Wrong: 870, Total: 10000, Accuracy: 91.3%
