In [1]:
# A logistic regression learning algorithm example using TensorFlow library.
# This example is using the MNIST database of handwritten digits 
# (http://yann.lecun.com/exdb/mnist/)

# Author: Aymeric Damien
# Project: https://github.com/aymericdamien/TensorFlow-Examples/

이 예시는 실제 분류예시인 MNIST 데이터에 대해 분류하는 과정을 보여줍니다.
MNIST는 tensorflow 자체에 기본예시로 간단한 명령어를 통해 인터넷에서 다운받을 수 있게 되어 있습니다.

In [2]:
import tensorflow as tf

# Import MNIST data
from tensorflow.examples.tutorials.mnist import input_data
# Read the data set from the local "MNIST_data/" directory with one-hot labels
# (one_hot=True); the cell output below shows the archives being downloaded
# and extracted into that directory.
mnist = input_data.read_data_sets("MNIST_data/", one_hot=True)

Successfully downloaded train-images-idx3-ubyte.gz 9912422 bytes.
Extracting MNIST_data/train-images-idx3-ubyte.gz
Successfully downloaded train-labels-idx1-ubyte.gz 28881 bytes.
Extracting MNIST_data/train-labels-idx1-ubyte.gz
Successfully downloaded t10k-images-idx3-ubyte.gz 1648877 bytes.
Extracting MNIST_data/t10k-images-idx3-ubyte.gz
Successfully downloaded t10k-labels-idx1-ubyte.gz 4542 bytes.
Extracting MNIST_data/t10k-labels-idx1-ubyte.gz


학습에 필요한 파라미터들을 설정합니다. linear regression 예시와 다른 점은 batch_size가 설정된다는 점이며, 이 값은 한 번의 batch에 몇 개의 데이터를 입력받을지를 정합니다.

In [3]:
# Parameters
# Step size handed to tf.train.GradientDescentOptimizer.
learning_rate = 0.01
# Number of passes of the outer training loop.
training_epochs = 25
# Number of examples requested from mnist.train.next_batch() per step.
batch_size = 100
# The average cost is printed every `display_step` epochs.
display_step = 1

$$ 
\large{ P(y=1|x;w) = \frac{e^{w^{(1)\top} x + b^{(1)}}}{\sum_{j=1}^{k} e^{w^{(j)\top} x + b^{(j)}}} }
$$

$$ h(x) = 
\left [ \begin{array}{c} 
P(y=1|x;w)  \\
P(y=2|x;w)  \\
\vdots \\
P(y=k|x;w)  \\
\end{array} \right ]
$$

* x는 28x28 크기의 이미지 인풋으로 784차원의 인풋을 받도록 설정
* y는 10 클래스로 출력이 되도록 설정. 위의 수식 기준으로는 k=10으로 설정된 경우임.
* W와 b는 matrix 차원에 맞추어 변수 공간의 크기가 할당됩니다.
* pred는 위의 수식에서 $h(x)$ 부분을 의미합니다. `tf.nn.softmax()` 함수를 통해 softmax를 구성할 수 있고, exponential 안에 들어가는 부분을 인자로 받을 수 있으며 여기서는 Wx+b가 들어가게 됩니다.

In [4]:
# tf Graph Input
# x holds flattened MNIST images (28*28 = 784 values per row);
# y holds the matching labels over the 10 digit classes (0-9).
# The leading None leaves the number of rows per feed open.
x = tf.placeholder(dtype=tf.float32, shape=[None, 784])
y = tf.placeholder(dtype=tf.float32, shape=[None, 10])

# Set model weights: a 784x10 weight matrix and a 10-element bias, all zeros.
W = tf.Variable(tf.zeros(shape=[784, 10]))
b = tf.Variable(tf.zeros(shape=[10]))

# Construct model: softmax applied to the affine scores x.W + b
pred = tf.nn.softmax(tf.add(tf.matmul(x, W), b))

$$ cost = \frac{1}{N} \sum_{n=1}^{N} \left( - \sum_{k} y_{k}^{(n)} \log{\hat{y}_{k}^{(n)}} \right) $$

In [6]:
# Minimize error using cross entropy
# pred is a softmax output, so an entry can underflow to exactly 0. tf.log(0)
# is -inf and 0 * -inf is NaN, which would poison the cost and every gradient.
# Clipping to [1e-10, 1] keeps the log finite and leaves the cost unchanged
# for any probability that is not vanishingly small.
safe_pred = tf.clip_by_value(pred, 1e-10, 1.0)
# Sum over the class axis per example, then average over the batch.
cost = tf.reduce_mean(-tf.reduce_sum(y*tf.log(safe_pred), reduction_indices=1))
# Gradient Descent
optimizer = tf.train.GradientDescentOptimizer(learning_rate).minimize(cost)

In [7]:
# Initializing the variables
# This only builds the initializer op for the graph's variables (W and b);
# nothing is initialized until the op is executed with sess.run(init).
init = tf.global_variables_initializer()

In [8]:
# Launch the graph
# Trains the softmax model with mini-batch gradient descent, printing the
# average per-batch cost of each displayed epoch, then reports accuracy on a
# slice of the test set. print() is always called with a single pre-formatted
# string so the output is identical under Python 2 and Python 3.
with tf.Session() as sess:
    sess.run(init)

    # Number of mini-batches per epoch; loop-invariant, so computed once.
    total_batch = mnist.train.num_examples // batch_size

    # Training cycle
    for epoch in range(training_epochs):
        avg_cost = 0.
        # Loop over all batches
        for i in range(total_batch):
            batch_xs, batch_ys = mnist.train.next_batch(batch_size)
            # Fit training using batch data: one optimizer step, fetching the
            # cost of this batch in the same run call.
            _, c = sess.run([optimizer, cost], feed_dict={x: batch_xs,
                                                          y: batch_ys})
            # Compute average loss
            avg_cost += c / total_batch
        # Display logs per epoch step
        if (epoch+1) % display_step == 0:
            print("Epoch: %04d cost= %.9f" % (epoch+1, avg_cost))

    print("Optimization Finished!")

    # Test model: a prediction is correct when the most probable class
    # matches the position of the 1 in the label row.
    correct_prediction = tf.equal(tf.argmax(pred, 1), tf.argmax(y, 1))
    # Calculate accuracy for 3000 examples
    accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))
    # eval() uses the session opened by the enclosing `with` block.
    test_accuracy = accuracy.eval({x: mnist.test.images[:3000], y: mnist.test.labels[:3000]})
    # %s goes through str(), matching what the Python 2 print statement showed.
    print("Accuracy: %s" % test_accuracy)

Epoch: 0001 cost= 1.183671701
Epoch: 0002 cost= 0.665093600
Epoch: 0003 cost= 0.552661167
Epoch: 0004 cost= 0.498580916
Epoch: 0005 cost= 0.465463370
Epoch: 0006 cost= 0.442502252
Epoch: 0007 cost= 0.425388629
Epoch: 0008 cost= 0.412178434
Epoch: 0009 cost= 0.401353353
Epoch: 0010 cost= 0.392370607
Epoch: 0011 cost= 0.384772295
Epoch: 0012 cost= 0.378171922
Epoch: 0013 cost= 0.372400357
Epoch: 0014 cost= 0.367258130
Epoch: 0015 cost= 0.362751649
Epoch: 0016 cost= 0.358631221
Epoch: 0017 cost= 0.354872593
Epoch: 0018 cost= 0.351479804
Epoch: 0019 cost= 0.348328970
Epoch: 0020 cost= 0.345445272
Epoch: 0021 cost= 0.342732085
Epoch: 0022 cost= 0.340273067
Epoch: 0023 cost= 0.337933549
Epoch: 0024 cost= 0.335755487
Epoch: 0025 cost= 0.333669784
Optimization Finished!
Accuracy: 0.888667
