**Importăm datele din Keras**

In [1]:
import numpy as np
from tensorflow.keras.datasets import mnist


# Load MNIST through Keras; load_data() yields a (train, test) pair of (images, labels) tuples.
train_split, test_split = mnist.load_data()
train_images, train_labels = train_split
test_images, test_labels = test_split
# Sanity check: show the shapes of the training images and training labels.
train_images.shape, train_labels.shape

((60000, 28, 28), (60000,))

**Facem reshape la date și le scalăm**

In [2]:
from tensorflow.keras.utils import to_categorical


# Flatten every 28x28 image into a 784-element vector and scale the pixel values
# to the [0, 1] range. The -1 lets NumPy infer the number of samples instead of
# hard-coding 60000 / 10000, so the cell also works on a subset of the data.
# NOTE: this cell overwrites its own inputs; re-running it without re-running the
# loading cell first would rescale the images and re-encode the labels a second time.
train_images = train_images.reshape((-1, 28*28)).astype('float32') / 255
test_images = test_images.reshape((-1, 28*28)).astype('float32') / 255

# One-hot encode the digit labels. The class count is given explicitly so both
# label matrices always get 10 columns, rather than a width inferred from the
# largest label that happens to be present in each split.
train_labels = to_categorical(train_labels, num_classes=10)
test_labels = to_categorical(test_labels, num_classes=10)

**Definim modelul și îl compilăm**

In [3]:
from keras import models
from keras import layers
from keras import losses
from keras import optimizers
from keras import regularizers


# Fully connected classifier: 784 inputs -> 512 -> 100 -> 10 class probabilities.
model = models.Sequential()

# Layer 1: 512 ReLU units with an L2 penalty on the weights, followed by 20% dropout.
model.add(layers.Dense(512,
                       activation='relu',
                       input_shape=(28*28,),
                       kernel_regularizer=regularizers.l2(0.001)))
model.add(layers.Dropout(0.2))

# Layer 2: linear projection to 100 units, with ReLU applied as a separate layer.
model.add(layers.Dense(100, activation='linear'))
model.add(layers.ReLU())

# Layer 3: softmax over the 10 digit classes.
model.add(layers.Dense(10, activation='softmax'))

# Compile the model.
# `learning_rate` is the supported argument name; `lr` is a deprecated alias
# that newer Keras releases reject.
optimizer = optimizers.Adam(learning_rate=0.0001)
loss_function = losses.categorical_crossentropy
model.compile(optimizer=optimizer, loss=loss_function, metrics=['accuracy'])

Using TensorFlow backend.


In [4]:
# Print the layer-by-layer summary (output shapes and parameter counts) of the model.
model.summary()

Model: "sequential_1"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense_1 (Dense)              (None, 512)               401920    
_________________________________________________________________
dropout_1 (Dropout)          (None, 512)               0         
_________________________________________________________________
dense_2 (Dense)              (None, 100)               51300     
_________________________________________________________________
re_lu_1 (ReLU)               (None, 100)               0         
_________________________________________________________________
dense_3 (Dense)              (None, 10)                1010      
Total params: 454,230
Trainable params: 454,230
Non-trainable params: 0
_________________________________________________________________


**Antrenăm modelul**

In [5]:
from keras import callbacks


# Checkpoint callback: writes the model to disk whenever validation accuracy
# improves; the epoch number and validation metrics are embedded in the file name.
my_callbacks = [
    callbacks.ModelCheckpoint(
        filepath='model.{epoch:02d}-{val_loss:.2f}-{val_accuracy:.2f}.h5',
        monitor='val_accuracy',
        save_best_only=True,
    )
]

# NOTE(review): the test split is also used as validation data here, so the
# checkpoint selection is driven by the same data that is later used for evaluation.
model.fit(train_images, train_labels,
          validation_data=(test_images, test_labels),
          epochs=10, batch_size=128, callbacks=my_callbacks)

Train on 60000 samples, validate on 10000 samples
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


<keras.callbacks.callbacks.History at 0x22d00803b08>

**Salvăm și încărcăm modelul**

In [6]:
from keras.models import load_model


# Round-trip the network through an HDF5 file, then run the reloaded copy on the
# first test image as a quick smoke test.
model_path = 'mynetwork.h5'
model.save(model_path)
trained_model = load_model(model_path)

# The [:1] slice keeps the leading batch axis, like wrapping the single image
# in a one-element array.
test_pred = trained_model.predict(test_images[:1])

In [7]:
from keras import callbacks

# Reload from disk so that every run of this cell resumes from the saved file
# rather than from whatever a previous run of this cell left in memory.
trained_model = load_model('mynetwork.h5')

# Build the checkpoint callback in this cell so it runs without relying on a
# variable left over from an earlier cell. A checkpoint is written whenever
# validation accuracy improves.
my_callbacks = [
    callbacks.ModelCheckpoint(
        filepath='model.{epoch:02d}-{val_loss:.2f}-{val_accuracy:.2f}.h5',
        monitor='val_accuracy',
        save_best_only=True,
    )
]

# Continue training the reloaded model for 5 more epochs.
trained_model.fit(train_images, train_labels,
                  validation_data=(test_images, test_labels),
                  epochs=5, batch_size=128, callbacks=my_callbacks)

Train on 60000 samples, validate on 10000 samples
Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


<keras.callbacks.callbacks.History at 0x22d01323848>

**Evaluăm modelul**

In [8]:
# Score the network on the test split; the model was compiled with
# metrics=['accuracy'], so the result is [loss, accuracy].
# NOTE(review): this evaluates `model`, not `trained_model`, which received
# 5 additional epochs in the cell above - confirm which one is intended.
results = model.evaluate(
    x=test_images,
    y=test_labels,
    batch_size=128,
)
print("test loss, test acc:", results)

test loss, test acc: [0.19568800922632218, 0.9733999967575073]


**(Opțional) O rețea neuronală convoluțională**

Utilă pentru proiectele în care trebuie să antrenați pe pixeli.

In [9]:
import numpy as np
from tensorflow import keras
from tensorflow.keras import layers

# Model / data parameters
# Data geometry and training hyper-parameters for the convolutional model.
num_classes, input_shape = 10, (28, 28, 1)
batch_size, epochs = 128, 15

# Fetch MNIST, already split between train and test sets.
(x_train, y_train), (x_test, y_test) = keras.datasets.mnist.load_data()

# Cast to float32, scale to the [0, 1] range and append a trailing channel
# axis so that every image has shape (28, 28, 1).
x_train, x_test = (
    np.expand_dims(images.astype("float32") / 255, axis=-1)
    for images in (x_train, x_test)
)
print("x_train shape:", x_train.shape)
print(x_train.shape[0], "train samples")
print(x_test.shape[0], "test samples")

# Turn the integer class vectors into one-hot (binary) class matrices.
y_train, y_test = (
    keras.utils.to_categorical(labels, num_classes) for labels in (y_train, y_test)
)

# Two convolution + max-pooling stages, then flatten, dropout and a softmax classifier.
cnn_layers = [
    keras.Input(shape=input_shape),
    layers.Conv2D(32, kernel_size=(3, 3), activation="relu"),
    layers.MaxPooling2D(pool_size=(2, 2)),
    layers.Conv2D(64, kernel_size=(3, 3), activation="relu"),
    layers.MaxPooling2D(pool_size=(2, 2)),
    layers.Flatten(),
    layers.Dropout(0.5),
    layers.Dense(num_classes, activation="softmax"),
]
# NOTE: this rebinds `model`, replacing the dense network defined earlier in the notebook.
model = keras.Sequential(cnn_layers)

model.summary()

model.compile(
    optimizer="adam",
    loss="categorical_crossentropy",
    metrics=["accuracy"],
)

# Train with 10% of the training data reserved for validation.
model.fit(
    x_train,
    y_train,
    epochs=epochs,
    batch_size=batch_size,
    validation_split=0.1,
)

x_train shape: (60000, 28, 28, 1)
60000 train samples
10000 test samples
Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d (Conv2D)              (None, 26, 26, 32)        320       
_________________________________________________________________
max_pooling2d (MaxPooling2D) (None, 13, 13, 32)        0         
_________________________________________________________________
conv2d_1 (Conv2D)            (None, 11, 11, 64)        18496     
_________________________________________________________________
max_pooling2d_1 (MaxPooling2 (None, 5, 5, 64)          0         
_________________________________________________________________
flatten (Flatten)            (None, 1600)              0         
_________________________________________________________________
dropout (Dropout)            (None, 1600)              0         
_________________________________________________

<tensorflow.python.keras.callbacks.History at 0x22d066dddc8>