# Import required libraries

In [1]:
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import LabelBinarizer
from tensorflow.keras import Input
from tensorflow.keras.datasets import mnist
from tensorflow.keras.layers import Dense
from tensorflow.keras.models import Model
from tensorflow.keras.models import Sequential

# Create model using Sequential API

In [2]:
# Describe the full stack as a list first, then hand it to Sequential in a
# single call. The first layer declares the input size: 784 = 28*28*1 features.
layers = [
    Dense(256, activation='sigmoid', input_shape=(784,)),
    Dense(128, activation='sigmoid'),
    Dense(10, activation='softmax'),  # 10-way softmax output
]
sequential_model_list = Sequential(layers)

# Create model using add() method

In [3]:
# Start from an empty Sequential container and append the layers one by one.
sm = Sequential()
# Only the first layer needs the input size (784 = 28*28*1 features).
sm.add(Dense(units=256, activation='sigmoid', input_shape=(784,)))
sm.add(Dense(units=128, activation='sigmoid'))
sm.add(Dense(units=10, activation='softmax'))

# Create model using the Functional API

In [4]:
# Functional API: each layer is called on the tensor produced by the previous
# one, and Model ties the input tensor to the output tensor.
input_layer = Input(shape=(28*28*1,))
dense1 = Dense(256, activation='sigmoid')(input_layer)
# 128 units (was mistyped as 126), matching the second hidden layer of the
# Sequential models defined earlier in this notebook.
dense2 = Dense(128, activation='sigmoid')(dense1)
predictions = Dense(10, activation='softmax')(dense2)
functional_model = Model(inputs=input_layer, outputs=predictions)

# Create a model using an object-oriented approach (subclassing Model)

In [5]:
class ClassModel(Model):
    """Fully connected classifier defined by subclassing ``Model``.

    The layers are created in ``__init__`` and wired together in ``call``:
    two sigmoid hidden layers (256 and 128 units) followed by a 10-unit
    softmax output layer.
    """

    def __init__(self):
        """Create the three Dense layers used by ``call``."""
        super().__init__()

        self.dense_1 = Dense(256, activation='sigmoid')
        # 128 units so this model has the same architecture as the
        # Sequential models defined earlier in this notebook.
        self.dense_2 = Dense(128, activation='sigmoid')
        self.predictions = Dense(10, activation='softmax')

    def call(self, inputs, **kwargs):
        """Run the forward pass.

        Args:
            inputs: Input tensor fed to the first hidden layer.
            **kwargs: Accepted for compatibility with ``Model.call``; unused.

        Returns:
            The output of the softmax ``predictions`` layer.
        """
        x = self.dense_1(inputs)
        x = self.dense_2(x)

        return self.predictions(x)


class_model = ClassModel()

# Prepare the data

In [6]:
# Load the MNIST train/test splits, then flatten every image into a single
# row of 784 (= 28*28*1) values so it matches the models' input shape.
(X_train, y_train), (X_test, y_test) = mnist.load_data()
X_train = X_train.reshape(len(X_train), 784)
X_test = X_test.reshape(len(X_test), 784)

# One-hot encode the labels

In [7]:
label_binarizer = LabelBinarizer()
# Fit the encoder on the training labels only...
y_train = label_binarizer.fit_transform(y_train)
# ...and reuse that fitted encoder for the test labels. Re-fitting on the test
# set could produce a different class-to-column mapping (or a different number
# of columns) if the test labels did not contain exactly the same classes.
y_test = label_binarizer.transform(y_test)

# Hold out 20% of the training data for validation

In [8]:
# Keep 80% of the samples for training and hold out the remaining 20% for
# validation. A fixed random_state makes the shuffle, and therefore the split,
# reproducible across kernel restarts.
X_train, X_valid, y_train, y_valid = train_test_split(
    X_train, y_train, train_size=0.8, random_state=42
)