In [3]:
import os 
import tensorflow as tf
os.environ["TF_CPP_MIN_LOG_LEVEL"] = "2"

from tensorflow import keras

There are two basics API of keras:
- Sequential API 
- Functional API

# Load dataset

In [19]:
from keras import layers
from keras.datasets import mnist

In [20]:
(x_train, y_train), (x_test, y_test) = mnist.load_data()
print(x_train.shape)
print(y_train.shape)

(60000, 28, 28)
(60000,)


In [21]:
x_train = x_train.reshape(-1, 28*28).astype("float32") / 255.0 # normilize values to [-1, 1]
print(type(x_train))
x_test = x_test.reshape(-1, 28*28).astype("float32") / 255.0


<class 'numpy.ndarray'>


In [22]:
x_train =tf.convert_to_tensor(x_train) 
# but it's not nessesary it's going to be done internally by tensorflow itself 

2023-07-18 18:20:05.417870: W tensorflow/tsl/framework/cpu_allocator_impl.cc:83] Allocation of 188160000 exceeds 10% of free system memory.


# SQ API

## Very convenient but not very flexible

In [23]:
model = keras.Sequential(
    layers=[
        layers.Dense(512, activation="relu"),
        layers.Dense(256, activation="relu"),
        layers.Dense(10),
    ]
)

model.compile(
    loss=keras.losses.SparseCategoricalCrossentropy(from_logits=True),
    optimizer=keras.optimizers.Adam(learning_rate=0.001),
    metrics=["accuracy"]    
)

model.fit(x_train, y_train, batch_size=32, epochs=5, verbose=2)

model.evaluate(x_test, y_test, batch_size=32, verbose=2)

Epoch 1/5
1875/1875 - 10s - loss: 0.1869 - accuracy: 0.9424 - 10s/epoch - 5ms/step
Epoch 2/5
1875/1875 - 22s - loss: 0.0807 - accuracy: 0.9750 - 22s/epoch - 12ms/step
Epoch 3/5
1875/1875 - 24s - loss: 0.0547 - accuracy: 0.9829 - 24s/epoch - 13ms/step
Epoch 4/5
1875/1875 - 21s - loss: 0.0413 - accuracy: 0.9865 - 21s/epoch - 11ms/step
Epoch 5/5
1875/1875 - 21s - loss: 0.0331 - accuracy: 0.9897 - 21s/epoch - 11ms/step


2023-07-18 18:28:03.227141: W tensorflow/tsl/framework/cpu_allocator_impl.cc:83] Allocation of 31360000 exceeds 10% of free system memory.


313/313 - 2s - loss: 0.0702 - accuracy: 0.9804 - 2s/epoch - 6ms/step


[0.07024834305047989, 0.980400025844574]

In [27]:
model = keras.Sequential(
    layers=[
        keras.Input(shape=(28*28)),
        layers.Dense(512, activation="relu"),
        layers.Dense(256, activation="relu"),
        layers.Dense(10),
    ]
)
print(model.summary())

Model: "sequential_2"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_6 (Dense)             (None, 512)               401920    
                                                                 
 dense_7 (Dense)             (None, 256)               131328    
                                                                 
 dense_8 (Dense)             (None, 10)                2570      
                                                                 
Total params: 535818 (2.04 MB)
Trainable params: 535818 (2.04 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________
None


In [29]:
model = keras.Sequential(
    layers=[
        layers.Dense(512, activation="relu"),
        layers.Dense(256, activation="relu"),
        layers.Dense(10),
    ]
)
print(model.summary())

ValueError: This model has not yet been built. Build the model first by calling `build()` or by calling the model on a batch of data.

In [31]:
model1 = keras.Sequential()

model1.add(keras.Input(shape=(28*28)))
model1.add(keras.layers.Dense(512, activation="relu"))
model1.add(keras.layers.Dense(256, activation="relu"))
model1.add(keras.layers.Dense(10))

model1.summary()

Model: "sequential_6"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_18 (Dense)            (None, 512)               401920    
                                                                 
 dense_19 (Dense)            (None, 256)               131328    
                                                                 
 dense_20 (Dense)            (None, 10)                2570      
                                                                 
Total params: 535818 (2.04 MB)
Trainable params: 535818 (2.04 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


# FUN API

## A bit more flexible 

In [33]:
inputs = keras.Input(shape=(28*28))
x = layers.Dense(512, activation="relu", name="Fucking layer")(inputs)
x = layers.Dense(256, activation="relu")(x)
outputs = layers.Dense(10, activation="softmax")(x)

model2 = keras.Model(inputs=inputs, outputs=outputs)

model2.compile(
    loss=keras.losses.SparseCategoricalCrossentropy(from_logits=True),
    optimizer=keras.optimizers.Adam(learning_rate=0.001),
    metrics=["accuracy"]    
)

model2.fit(x_train, y_train, batch_size=32, epochs=5, verbose=2)

model2.evaluate(x_test, y_test, batch_size=32, verbose=2)

Epoch 1/5


  output, from_logits = _get_logits(


1875/1875 - 31s - loss: 0.1866 - accuracy: 0.9433 - 31s/epoch - 17ms/step
Epoch 2/5
1875/1875 - 26s - loss: 0.0805 - accuracy: 0.9743 - 26s/epoch - 14ms/step
Epoch 3/5
1875/1875 - 22s - loss: 0.0541 - accuracy: 0.9827 - 22s/epoch - 12ms/step
Epoch 4/5
1875/1875 - 27s - loss: 0.0402 - accuracy: 0.9865 - 27s/epoch - 14ms/step
Epoch 5/5
1875/1875 - 10s - loss: 0.0342 - accuracy: 0.9893 - 10s/epoch - 5ms/step


2023-07-18 18:37:30.403970: W tensorflow/tsl/framework/cpu_allocator_impl.cc:83] Allocation of 31360000 exceeds 10% of free system memory.


313/313 - 0s - loss: 0.0727 - accuracy: 0.9804 - 420ms/epoch - 1ms/step


[0.07273514568805695, 0.980400025844574]

In [34]:
model2.summary()

Model: "model_1"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_6 (InputLayer)        [(None, 784)]             0         
                                                                 
 dense_24 (Dense)            (None, 512)               401920    
                                                                 
 dense_25 (Dense)            (None, 256)               131328    
                                                                 
 dense_26 (Dense)            (None, 10)                2570      
                                                                 
Total params: 535818 (2.04 MB)
Trainable params: 535818 (2.04 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [None]:
# model2.predict(x_test)