<a href="https://colab.research.google.com/github/tjwei/NCTU_DeepLearning/blob/master/tf2_tutorial/02_tf2_Basics.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [0]:
#!pip install tensorflow-gpu==2.0.0-rc1

In [2]:
import tensorflow as tf
tf.__version__

'2.0.0-rc1'

In [3]:
matrix1 = tf.constant([[3., 3.]])

matrix2 = tf.constant([[2.],[2.]])

matrix1, matrix2

(<tf.Tensor: id=0, shape=(1, 2), dtype=float32, numpy=array([[3., 3.]], dtype=float32)>,
 <tf.Tensor: id=1, shape=(2, 1), dtype=float32, numpy=
 array([[2.],
        [2.]], dtype=float32)>)

In [4]:
product = tf.matmul(matrix1, matrix2)
product

<tf.Tensor: id=2, shape=(1, 1), dtype=float32, numpy=array([[12.]], dtype=float32)>

In [5]:
matrix1 @ matrix2

<tf.Tensor: id=3, shape=(1, 1), dtype=float32, numpy=array([[12.]], dtype=float32)>

In [6]:
product + 3

<tf.Tensor: id=5, shape=(1, 1), dtype=float32, numpy=array([[15.]], dtype=float32)>

In [7]:
w = tf.Variable(shape=(1, 2), initial_value=[[2., 1.]])
w

<tf.Variable 'Variable:0' shape=(1, 2) dtype=float32, numpy=array([[2., 1.]], dtype=float32)>

In [8]:
y = w @ [[1], [2]]
y

<tf.Tensor: id=18, shape=(1, 1), dtype=float32, numpy=array([[4.]], dtype=float32)>

In [9]:
with tf.GradientTape() as tape:
    y = w@[[1], [2]]
    loss = (y - 3)**2
gradients = tape.gradient(loss, [w])
gradients

[<tf.Tensor: id=34, shape=(1, 2), dtype=float32, numpy=array([[2., 4.]], dtype=float32)>]

## MNIST Again

In [10]:
(x_train, y_train), (x_test, y_test) = tf.keras.datasets.mnist.load_data()

x_train = (x_train-127.5)/127.5
x_test = (x_test-127.5)/127.5


In [11]:
train_ds = tf.data.Dataset.from_tensor_slices((x_train, y_train))
train_ds = train_ds.shuffle(10000).batch(64)


In [12]:
train_ds

<BatchDataset shapes: ((None, 28, 28), (None,)), types: (tf.float64, tf.uint8)>

In [13]:
test_ds = tf.data.Dataset.from_tensor_slices((x_test, y_test))
test_ds = test_ds.shuffle(10000).batch(64)



In [14]:
from tensorflow.keras.layers import Dense, Flatten, Reshape
from tensorflow.keras.models import Model

class MyModel(Model):
    def __init__(self):
        super(MyModel, self).__init__()
        self.flatten = Flatten()
        self.d1 = Dense(128, activation='relu')    
        self.d2 = Dense(10, activation='softmax')

    def call(self, x): 
        x = self.flatten(x)
        x = self.d1(x)
        return self.d2(x)

# Create an instance of the model
model = MyModel()

#model.summary()


In [15]:
loss_object = tf.keras.losses.SparseCategoricalCrossentropy()

# info of SparseCategoricalCrossentropy
# https://www.tensorflow.org/api_docs/python/tf/keras/losses/SparseCategoricalCrossentropy#used_in_the_tutorials


optimizer = tf.keras.optimizers.Adam()


train_loss = tf.keras.metrics.Mean(name='train_loss')
train_accuracy = tf.keras.metrics.SparseCategoricalAccuracy(name='train_accuracy')

test_loss = tf.keras.metrics.Mean(name='test_loss')
test_accuracy = tf.keras.metrics.SparseCategoricalAccuracy(name='test_accuracy')


In [41]:
#@tf.function
def train_step(images, labels):
    with tf.GradientTape() as tape:
        predictions = model(images)
        loss = loss_object(labels, predictions)
    gradients = tape.gradient(loss, model.trainable_variables)
    optimizer.apply_gradients(zip(gradients, model.trainable_variables))

    train_loss(loss)
    train_accuracy(labels, predictions)


In [42]:
#@tf.function
def test_step(images, labels):
    predictions = model(images)
    t_loss = loss_object(labels, predictions)
    test_loss(t_loss)
    test_accuracy(labels, predictions)


In [43]:
EPOCHS = 10

for epoch in range(EPOCHS):
    for images, labels in train_ds:
        train_step(images, labels)

    for test_images, test_labels in test_ds:
        test_step(test_images, test_labels)

    template = 'Epoch {}, Loss: {}, Accuracy: {}, Test Loss: {}, Test Accuracy: {}'
    print(template.format(epoch+1,
                        train_loss.result(),
                        train_accuracy.result()*100,
                        test_loss.result(),
                        test_accuracy.result()*100))

    # Reset the metrics for the next epoch
    train_loss.reset_states()
    train_accuracy.reset_states()
    test_loss.reset_states()
    test_accuracy.reset_states()




To change all layers to have dtype float64 by default, call `tf.keras.backend.set_floatx('float64')`. To change just this layer, pass dtype='float64' to the layer constructor. If you are the author of this layer, you can disable autocasting by passing autocast=False to the base Layer constructor.

Epoch 1, Loss: 0.3116243779659271, Accuracy: 90.58332824707031, Test Loss: 0.19100171327590942, Test Accuracy: 94.04000091552734
Epoch 2, Loss: 0.16007903218269348, Accuracy: 95.1116714477539, Test Loss: 0.12927085161209106, Test Accuracy: 95.91000366210938
Epoch 3, Loss: 0.1260104924440384, Accuracy: 96.13666534423828, Test Loss: 0.1450505256652832, Test Accuracy: 95.66000366210938
Epoch 4, Loss: 0.10551745444536209, Accuracy: 96.7066650390625, Test Loss: 0.12310515344142914, Test Accuracy: 96.30000305175781
Epoch 5, Loss: 0.09324519336223602, Accuracy: 97.17500305175781, Test Loss: 0.10607748478651047, Test Accuracy: 96.91999816894531
Epoch 6, Loss: 0.08101099729537964, Accuracy: 97.42166