In [1]:
# mlflow tracking
import mlflow
mlflow.tensorflow.autolog()

In [2]:
# ml libraries
from tensorflow.keras.datasets import mnist
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Flatten, Dense
from tensorflow.keras.optimizers import SGD
from tensorflow.keras.callbacks import ModelCheckpoint
from tensorflow.keras import regularizers
from tensorflow.keras.saving import load_model

In [3]:
# parameters
parameters = {
    'learning_rate':0.01,
    'momentum':0.1,
    'beta1':0.5,
    'beta2':0.5,
    'epochs':20,
    'batch_size':10,
    'loss':'sparse_categorical_crossentropy'
             }

In [4]:
# defining train and test data from mnist dataset
(x_train, y_train), (x_test, y_test) = mnist.load_data()
x_train = x_train.reshape(60000, 28, 28)
x_test = x_test.reshape(10000, 28, 28)

x_train, x_test = x_train/225, x_test/225

In [5]:
# model body
model = Sequential()
model.add(Flatten(input_shape=(28, 28)))
model.add(Dense(100, activation='relu'))
model.add(Dense(50, activation='relu'))
model.add(Dense(10, activation='tanh'))
model.add(Dense(10, activation='softmax'))

model.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 flatten (Flatten)           (None, 784)               0         
                                                                 
 dense (Dense)               (None, 100)               78500     
                                                                 
 dense_1 (Dense)             (None, 50)                5050      
                                                                 
 dense_2 (Dense)             (None, 10)                510       
                                                                 
 dense_3 (Dense)             (None, 10)                110       
                                                                 
Total params: 84170 (328.79 KB)
Trainable params: 84170 (328.79 KB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [5]:
# loading best modell of the 3 experiments done before
model3 = load_model('sequentialBEST3.keras')

In [6]:
# configuration of loss, metrics, optimizer, etc
SGDM = SGD(learning_rate=parameters['learning_rate'], momentum=parameters['momentum'])

# configuring the checkpoints to obtain the best model after resuming training on loaded model 'model3'
checkpoint = ModelCheckpoint('best', save_best_only=True, monitor='val_loss', mode='min', verbose=1)

In [None]:
#compile model
model.compile(optimizer=SGDM, loss=parameters['loss'], metrics=['accuracy'])

In [9]:
# training loaded model 'model3'
model3.fit(x=x_train, y=y_train, validation_data=(x_test, y_test), batch_size=parameters['batch_size'], 
          epochs=parameters['epochs'], callbacks=[checkpoint], verbose=1)

2023/09/25 20:55:09 INFO mlflow.utils.autologging_utils: Created MLflow autologging run with ID '317780c28fc844e3b049de6c08d267e3', which will track hyperparameters, performance metrics, model artifacts, and lineage information for the current tensorflow workflow


Epoch 1/20
Epoch 1: val_loss improved from inf to 0.08685, saving model to best
INFO:tensorflow:Assets written to: best\assets


INFO:tensorflow:Assets written to: best\assets


Epoch 2/20
Epoch 2: val_loss improved from 0.08685 to 0.08553, saving model to best
INFO:tensorflow:Assets written to: best\assets


INFO:tensorflow:Assets written to: best\assets


Epoch 3/20
Epoch 3: val_loss improved from 0.08553 to 0.08358, saving model to best
INFO:tensorflow:Assets written to: best\assets


INFO:tensorflow:Assets written to: best\assets


Epoch 4/20
Epoch 4: val_loss did not improve from 0.08358
Epoch 5/20
Epoch 5: val_loss did not improve from 0.08358
Epoch 6/20
Epoch 6: val_loss did not improve from 0.08358
Epoch 7/20
Epoch 7: val_loss did not improve from 0.08358
Epoch 8/20
Epoch 8: val_loss did not improve from 0.08358
Epoch 9/20
Epoch 9: val_loss did not improve from 0.08358
Epoch 10/20
Epoch 10: val_loss did not improve from 0.08358
Epoch 11/20
Epoch 11: val_loss did not improve from 0.08358
Epoch 12/20
Epoch 12: val_loss did not improve from 0.08358
Epoch 13/20
Epoch 13: val_loss did not improve from 0.08358
Epoch 14/20
Epoch 14: val_loss did not improve from 0.08358
Epoch 15/20
Epoch 15: val_loss did not improve from 0.08358
Epoch 16/20
Epoch 16: val_loss did not improve from 0.08358
Epoch 17/20
Epoch 17: val_loss did not improve from 0.08358
Epoch 18/20
Epoch 18: val_loss did not improve from 0.08358
Epoch 19/20
Epoch 19: val_loss did not improve from 0.08358
Epoch 20/20
Epoch 20: val_loss did not improve from 



INFO:tensorflow:Assets written to: C:\Users\jtole\AppData\Local\Temp\tmpka3m4ia0\model\data\model\assets


INFO:tensorflow:Assets written to: C:\Users\jtole\AppData\Local\Temp\tmpka3m4ia0\model\data\model\assets


<keras.src.callbacks.History at 0x25102166050>

In [10]:
# evaluation of loaded model
model3.evaluate(x_test, y_test, verbose=1)



[0.08994003385305405, 0.9787999987602234]

In [7]:
model3.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 flatten (Flatten)           (None, 784)               0         
                                                                 
 dense (Dense)               (None, 100)               78500     
                                                                 
 dense_1 (Dense)             (None, 50)                5050      
                                                                 
 dense_2 (Dense)             (None, 10)                510       
                                                                 
 dense_3 (Dense)             (None, 10)                110       
                                                                 
Total params: 84170 (328.79 KB)
Trainable params: 84170 (328.79 KB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [10]:
model3.pop()
model3.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 flatten (Flatten)           (None, 784)               0         
                                                                 
 dense (Dense)               (None, 100)               78500     
                                                                 
Total params: 78500 (306.64 KB)
Trainable params: 78500 (306.64 KB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [12]:
model3.add(Dense(50, activation='relu', kernel_regularizer='l2'))
model3.add(Dense(10, activation='tanh'))
model3.add(Dense(10, activation='softmax'))
model3.summary()

# loading to the model state where weights were the best, it is before detecting overfitting
model3.load_weights('best')

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 flatten (Flatten)           (None, 784)               0         
                                                                 
 dense (Dense)               (None, 100)               78500     
                                                                 
 dense_1 (Dense)             (None, 50)                5050      
                                                                 
 dense_2 (Dense)             (None, 10)                510       
                                                                 
 dense_3 (Dense)             (None, 10)                110       
                                                                 
Total params: 84170 (328.79 KB)
Trainable params: 84170 (328.79 KB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


<tensorflow.python.checkpoint.checkpoint.CheckpointLoadStatus at 0x27136efd750>

In [13]:
checkpoint_L2 = ModelCheckpoint('best_L2', save_best_only=True, monitor='val_loss', mode='min', verbose=1)

model3.compile(optimizer=SGDM, loss=parameters['loss'], metrics=['accuracy'])

model3.fit(x=x_train, y=y_train, validation_data=(x_test, y_test), batch_size=parameters['batch_size'], 
          epochs=parameters['epochs'], callbacks=[checkpoint_L2], verbose=1)

2023/09/25 21:53:50 INFO mlflow.utils.autologging_utils: Created MLflow autologging run with ID 'd63de22b82cd4d76b5213e046e411178', which will track hyperparameters, performance metrics, model artifacts, and lineage information for the current tensorflow workflow


Epoch 1/20
Epoch 1: val_loss improved from inf to 0.18390, saving model to best_L2
INFO:tensorflow:Assets written to: best_L2\assets


INFO:tensorflow:Assets written to: best_L2\assets


Epoch 2/20
Epoch 2: val_loss improved from 0.18390 to 0.13059, saving model to best_L2
INFO:tensorflow:Assets written to: best_L2\assets


INFO:tensorflow:Assets written to: best_L2\assets


Epoch 3/20
Epoch 3: val_loss did not improve from 0.13059
Epoch 4/20
Epoch 4: val_loss did not improve from 0.13059
Epoch 5/20
Epoch 5: val_loss improved from 0.13059 to 0.12035, saving model to best_L2
INFO:tensorflow:Assets written to: best_L2\assets


INFO:tensorflow:Assets written to: best_L2\assets


Epoch 6/20
Epoch 6: val_loss did not improve from 0.12035
Epoch 7/20
Epoch 7: val_loss improved from 0.12035 to 0.11848, saving model to best_L2
INFO:tensorflow:Assets written to: best_L2\assets


INFO:tensorflow:Assets written to: best_L2\assets


Epoch 8/20
Epoch 8: val_loss did not improve from 0.11848
Epoch 9/20
Epoch 9: val_loss improved from 0.11848 to 0.11481, saving model to best_L2
INFO:tensorflow:Assets written to: best_L2\assets


INFO:tensorflow:Assets written to: best_L2\assets


Epoch 10/20
Epoch 10: val_loss did not improve from 0.11481
Epoch 11/20
Epoch 11: val_loss did not improve from 0.11481
Epoch 12/20
Epoch 12: val_loss did not improve from 0.11481
Epoch 13/20
Epoch 13: val_loss did not improve from 0.11481
Epoch 14/20
Epoch 14: val_loss improved from 0.11481 to 0.11104, saving model to best_L2
INFO:tensorflow:Assets written to: best_L2\assets


INFO:tensorflow:Assets written to: best_L2\assets


Epoch 15/20
Epoch 15: val_loss did not improve from 0.11104
Epoch 16/20
Epoch 16: val_loss improved from 0.11104 to 0.10334, saving model to best_L2
INFO:tensorflow:Assets written to: best_L2\assets


INFO:tensorflow:Assets written to: best_L2\assets


Epoch 17/20
Epoch 17: val_loss did not improve from 0.10334
Epoch 18/20
Epoch 18: val_loss did not improve from 0.10334
Epoch 19/20
Epoch 19: val_loss did not improve from 0.10334
Epoch 20/20
Epoch 20: val_loss did not improve from 0.10334




INFO:tensorflow:Assets written to: C:\Users\jtole\AppData\Local\Temp\tmpz58i5kqt\model\data\model\assets


INFO:tensorflow:Assets written to: C:\Users\jtole\AppData\Local\Temp\tmpz58i5kqt\model\data\model\assets


<keras.src.callbacks.History at 0x27137df3bb0>

In [14]:
# evaluation of loaded model
model3.evaluate(x_test, y_test, verbose=1)



[0.113724485039711, 0.9769999980926514]