# 심층 신경망

<table align="left">
  <td>
    <a target="_blank" href="https://colab.research.google.com/github/rickiepark/hg-mldl/blob/master/7-2.ipynb"><img src="https://www.tensorflow.org/images/colab_logo_32px.png" />구글 코랩에서 실행하기</a>
  </td>
</table>

## 2개의 층

In [5]:
# Import Keras from TensorFlow
from tensorflow import keras

# Download the Fashion MNIST dataset as (inputs, targets) pairs for the training and test sets
(train_input, train_target), (test_input, test_target) = keras.datasets.fashion_mnist.load_data()

In [6]:
# Prepare the inputs for the dense network: rescale the pixel values, flatten
# each 28x28 image into a 784-element vector, then hold out a validation set.
from sklearn.model_selection import train_test_split

# Divide by 255.0 and flatten in a single expression.
train_scaled = (train_input / 255.0).reshape(-1, 28 * 28)

# Keep 20% of the training data for validation; random_state pins the split.
# NOTE(review): train_target is overwritten with its training portion here, so
# reload the data before re-running this cell.
train_scaled, val_scaled, train_target, val_target = train_test_split(
    train_scaled,
    train_target,
    test_size=0.2,
    random_state=42,
)

In [7]:
# Build the two dense layers separately: a hidden layer and an output layer.
# Hidden layer: 100 units, sigmoid activation, fed by 784-element input vectors.
dense1 = keras.layers.Dense(
    units=100,
    activation='sigmoid',
    input_shape=(784,),
)
# Output layer: 10 units with softmax activation.
dense2 = keras.layers.Dense(units=10, activation='softmax')

## 심층 신경망 만들기

In [8]:
# Create the neural network model by passing the hidden and output layers, in order, as a list
model = keras.Sequential([dense1, dense2])

In [5]:
# Print the model summary: each layer with its output shape and parameter count
model.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense (Dense)               (None, 100)               78500     
                                                                 
 dense_1 (Dense)             (None, 10)                1010      
                                                                 
Total params: 79,510
Trainable params: 79,510
Non-trainable params: 0
_________________________________________________________________


## 층을 추가하는 다른 방법

In [9]:
# Create the layers inline while constructing the model, giving each layer and
# the model itself an explicit name (the names appear in model.summary()).
model = keras.Sequential(
    [
        keras.layers.Dense(100, activation='sigmoid', input_shape=(784,), name='hidden'),
        keras.layers.Dense(10, activation='softmax', name='output'),
    ],
    name='패션 MNIST 모델',
)

In [10]:
# Print the model summary; the layer and model names set above show up here
model.summary()

Model: "패션 MNIST 모델"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
hidden (Dense)               (None, 100)               78500     
_________________________________________________________________
output (Dense)               (None, 10)                1010      
Total params: 79,510
Trainable params: 79,510
Non-trainable params: 0
_________________________________________________________________


In [11]:
# Alternative construction: start from an empty Sequential model and append
# the hidden and output layers one at a time with add().
model = keras.Sequential()
model.add(
    keras.layers.Dense(units=100, activation='sigmoid', input_shape=(784,))
)
model.add(keras.layers.Dense(units=10, activation='softmax'))

In [12]:
# Print the model summary: each layer with its output shape and parameter count
model.summary()

Model: "sequential_1"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense_2 (Dense)              (None, 100)               78500     
_________________________________________________________________
dense_3 (Dense)              (None, 10)                1010      
Total params: 79,510
Trainable params: 79,510
Non-trainable params: 0
_________________________________________________________________


In [13]:
# Configure training: sparse categorical cross-entropy as the loss and accuracy
# as the reported metric. No optimizer is passed, so Keras uses its default.
# `metrics` is given as a list, which is the form documented for compile();
# newer Keras releases reject a bare string here.
model.compile(loss='sparse_categorical_crossentropy', metrics=['accuracy'])

# Train the model for 5 epochs on the training split.
model.fit(train_scaled, train_target, epochs=5)

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


<tensorflow.python.keras.callbacks.History at 0x19c8beacd90>

## 렐루 활성화 함수

In [15]:
# Build a new model that takes 28x28 inputs directly: a Flatten layer comes
# first, followed by a ReLU hidden layer and a softmax output layer.
model = keras.Sequential()
model.add(keras.layers.Flatten(input_shape=(28, 28)))
model.add(keras.layers.Dense(units=100, activation='relu'))
model.add(keras.layers.Dense(units=10, activation='softmax'))

In [16]:
# Print the model summary: each layer with its output shape and parameter count
model.summary()

Model: "sequential_3"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
flatten (Flatten)            (None, 784)               0         
_________________________________________________________________
dense_4 (Dense)              (None, 100)               78500     
_________________________________________________________________
dense_5 (Dense)              (None, 10)                1010      
Total params: 79,510
Trainable params: 79,510
Non-trainable params: 0
_________________________________________________________________


In [17]:
# Reload Fashion MNIST so the inputs and targets start from the full training set again.
(train_input, train_target), (test_input, test_target) = keras.datasets.fashion_mnist.load_data()

# Divide the pixel values by 255.0 and hold out 20% of the data for validation.
# The images are not reshaped here; they stay in the layout returned by
# load_data(), for use with the Flatten(input_shape=(28, 28)) model.
train_scaled, val_scaled, train_target, val_target = train_test_split(
    train_input / 255.0,
    train_target,
    test_size=0.2,
    random_state=42,
)

In [18]:
# Configure training: sparse categorical cross-entropy as the loss and accuracy
# as the reported metric. No optimizer is passed, so Keras uses its default.
# `metrics` is given as a list, which is the form documented for compile();
# newer Keras releases reject a bare string here.
model.compile(loss='sparse_categorical_crossentropy', metrics=['accuracy'])

# Train the model for 5 epochs on the training split.
model.fit(train_scaled, train_target, epochs=5)

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


<tensorflow.python.keras.callbacks.History at 0x19c8c269880>

In [19]:
# Evaluate the trained model on the validation split (reports the loss and the accuracy metric)
model.evaluate(val_scaled, val_target)



[0.3729154169559479, 0.874916672706604]

## 옵티마이저

In [20]:
# Recompile with the SGD optimizer selected by its string name, keeping the
# same loss and metric. `metrics` is passed as a list, the documented form
# for compile(); newer Keras releases reject a bare string.
model.compile(optimizer='sgd', loss='sparse_categorical_crossentropy', metrics=['accuracy'])

In [22]:
# Same configuration as using the 'sgd' string, but with an explicit SGD
# optimizer object created with its default arguments.
sgd = keras.optimizers.SGD()
# `metrics` is passed as a list, the documented form for compile(); newer
# Keras releases reject a bare string.
model.compile(optimizer=sgd, loss='sparse_categorical_crossentropy', metrics=['accuracy'])

In [23]:
# Create an SGD optimizer with the learning rate set to 0.1 (this cell only builds the optimizer; it does not compile the model)
sgd = keras.optimizers.SGD(learning_rate=0.1)

In [24]:
# Create an SGD optimizer with momentum 0.9 and Nesterov momentum enabled (this cell only builds the optimizer; it does not compile the model)
sgd = keras.optimizers.SGD(momentum=0.9, nesterov=True)

In [26]:
# Recompile the model with an Adagrad optimizer created with its default arguments.
adagrad = keras.optimizers.Adagrad()
# `metrics` is passed as a list, the documented form for compile(); newer
# Keras releases reject a bare string.
model.compile(optimizer=adagrad, loss='sparse_categorical_crossentropy', metrics=['accuracy'])

In [27]:
# Recompile the model with an RMSprop optimizer created with its default arguments.
rmsprop = keras.optimizers.RMSprop()
# `metrics` is passed as a list, the documented form for compile(); newer
# Keras releases reject a bare string.
model.compile(optimizer=rmsprop, loss='sparse_categorical_crossentropy', metrics=['accuracy'])

In [28]:
# Start over with a freshly created model of the same architecture:
# Flatten for 28x28 inputs, a ReLU hidden layer and a softmax output layer.
model = keras.Sequential()
model.add(keras.layers.Flatten(input_shape=(28, 28)))
model.add(keras.layers.Dense(units=100, activation='relu'))
model.add(keras.layers.Dense(units=10, activation='softmax'))

In [30]:
# Configure training with the Adam optimizer (selected by its string name),
# sparse categorical cross-entropy as the loss and accuracy as the metric.
# `metrics` is passed as a list, the documented form for compile(); newer
# Keras releases reject a bare string.
model.compile(optimizer='adam', loss='sparse_categorical_crossentropy', metrics=['accuracy'])

# Train the model for 5 epochs on the training split.
model.fit(train_scaled, train_target, epochs=5)

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


<tensorflow.python.keras.callbacks.History at 0x19c824f5400>

In [31]:
# Evaluate the Adam-trained model on the validation split (reports the loss and the accuracy metric)
model.evaluate(val_scaled, val_target)



[0.34273791313171387, 0.8787500262260437]