<a href="https://colab.research.google.com/github/jehoon5940/2024-Final-machine-learning-task/blob/main/Vector_Machine%2C_MNIST_dataset.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [2]:
import tensorflow as tf
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Conv2D, MaxPooling2D, Flatten, Dense, Dropout, BatchNormalization
from tensorflow.keras.datasets import mnist
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.preprocessing.image import ImageDataGenerator
from tensorflow.keras.callbacks import ReduceLROnPlateau, EarlyStopping

# 자동 혼합 정밀도 (최신 GPU에서만 가능)
from tensorflow.keras import mixed_precision
mixed_precision.set_global_policy('mixed_float16')

# 데이터 로드 및 전처리
(x_train, y_train), (x_test, y_test) = mnist.load_data()
x_train = x_train.reshape(-1, 28, 28, 1).astype('float32') / 255
x_test = x_test.reshape(-1, 28, 28, 1).astype('float32') / 255
y_train = to_categorical(y_train, 10)
y_test = to_categorical(y_test, 10)

# 데이터 증강 적용
datagen = ImageDataGenerator(
    rotation_range=10,
    width_shift_range=0.1,
    height_shift_range=0.1,
    zoom_range=0.1
)
datagen.fit(x_train)

# CNN 모델 (최적화)
model = Sequential([
    Conv2D(128, (3, 3), activation='relu', input_shape=(28, 28, 1), kernel_initializer='he_uniform'),
    BatchNormalization(),
    Conv2D(128, (3, 3), activation='relu', kernel_initializer='he_uniform', padding='same'),
    BatchNormalization(),
    MaxPooling2D((2, 2)),
    Dropout(0.3),

    Conv2D(256, (3, 3), activation='relu', kernel_initializer='he_uniform', padding='same'),
    BatchNormalization(),
    Conv2D(256, (3, 3), activation='relu', kernel_initializer='he_uniform', padding='same'),
    BatchNormalization(),
    MaxPooling2D((2, 2)),
    Dropout(0.4),

    Flatten(),
    Dense(512, activation='relu', kernel_initializer='he_uniform'),
    BatchNormalization(),
    Dropout(0.5),

    Dense(256, activation='relu', kernel_initializer='he_uniform'),
    Dropout(0.3),

    Dense(10, activation='softmax', dtype='float32')  # mixed precision 적용
])

# 콜백 설정 (빠른 종료)
lr_reduction = ReduceLROnPlateau(monitor='val_loss', patience=2, factor=0.5, min_lr=1e-6)
early_stopping = EarlyStopping(monitor='val_loss', patience=5, restore_best_weights=True)  # patience 줄이기

# 모델 컴파일
model.compile(optimizer=tf.keras.optimizers.Adam(learning_rate=0.0001),  # 학습률 조정
              loss='categorical_crossentropy',
              metrics=['accuracy'])

# 모델 훈련 (배치 크기 증가 + steps_per_epoch 추가)
history = model.fit(datagen.flow(x_train, y_train, batch_size=128),  # 64 → 128
                    validation_data=(x_test, y_test),
                    epochs=50,  # 100 → 50
                    steps_per_epoch=len(x_train) // 128,  # 추가
                    callbacks=[lr_reduction, early_stopping])

# 모델 평가
loss, accuracy = model.evaluate(x_test, y_test)
print(f'Test Accuracy: {accuracy * 100:.2f}%')


Epoch 1/50


  super().__init__(activity_regularizer=activity_regularizer, **kwargs)


[1m468/468[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m60s[0m 81ms/step - accuracy: 0.5680 - loss: 1.5462 - val_accuracy: 0.9744 - val_loss: 0.0835 - learning_rate: 1.0000e-04
Epoch 2/50
[1m  1/468[0m [37m━━━━━━━━━━━━━━━━━━━━[0m [1m7s[0m 17ms/step - accuracy: 0.9062 - loss: 0.3629



[1m468/468[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1s[0m 3ms/step - accuracy: 0.9062 - loss: 0.3629 - val_accuracy: 0.9749 - val_loss: 0.0828 - learning_rate: 1.0000e-04
Epoch 3/50
[1m468/468[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m21s[0m 45ms/step - accuracy: 0.9066 - loss: 0.3001 - val_accuracy: 0.9874 - val_loss: 0.0410 - learning_rate: 1.0000e-04
Epoch 4/50
[1m468/468[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1s[0m 2ms/step - accuracy: 0.8828 - loss: 0.2956 - val_accuracy: 0.9873 - val_loss: 0.0411 - learning_rate: 1.0000e-04
Epoch 5/50
[1m468/468[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m40s[0m 44ms/step - accuracy: 0.9423 - loss: 0.1920 - val_accuracy: 0.9887 - val_loss: 0.0339 - learning_rate: 1.0000e-04
Epoch 6/50
[1m468/468[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1s[0m 3ms/step - accuracy: 0.9688 - loss: 0.2261 - val_accuracy: 0.9888 - val_loss: 0.0338 - learnin

In [3]:
import tensorflow as tf
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Conv2D, MaxPooling2D, Flatten, Dense, Dropout, BatchNormalization
from tensorflow.keras.datasets import mnist
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.preprocessing.image import ImageDataGenerator
from tensorflow.keras.callbacks import ReduceLROnPlateau, EarlyStopping

# 데이터 로드 및 전처리
(x_train, y_train), (x_test, y_test) = mnist.load_data()
x_train = x_train.reshape(-1, 28, 28, 1).astype('float32') / 255
x_test = x_test.reshape(-1, 28, 28, 1).astype('float32') / 255
y_train = to_categorical(y_train, 10)
y_test = to_categorical(y_test, 10)

# 데이터 증강 적용
datagen = ImageDataGenerator(
    rotation_range=10,
    width_shift_range=0.1,
    height_shift_range=0.1,
    zoom_range=0.1
)
datagen.fit(x_train)

# 개선된 CNN 모델
model = Sequential([
    Conv2D(64, (3, 3), activation='relu', input_shape=(28, 28, 1)),
    BatchNormalization(),
    MaxPooling2D((2, 2)),
    Dropout(0.3),

    Conv2D(128, (3, 3), activation='relu'),
    BatchNormalization(),
    MaxPooling2D((2, 2)),
    Dropout(0.4),

    Flatten(),
    Dense(256, activation='relu'),
    BatchNormalization(),
    Dropout(0.5),

    Dense(128, activation='relu'),
    Dropout(0.3),

    Dense(10, activation='softmax')
])

# 콜백 설정
lr_reduction = ReduceLROnPlateau(monitor='val_loss', patience=2, factor=0.5, min_lr=1e-5)
early_stopping = EarlyStopping(monitor='val_loss', patience=5, restore_best_weights=True)

# 모델 컴파일
model.compile(optimizer=tf.keras.optimizers.Adam(learning_rate=0.0003),
              loss='categorical_crossentropy',
              metrics=['accuracy'])

# 모델 훈련
history = model.fit(datagen.flow(x_train, y_train, batch_size=128),
                    validation_data=(x_test, y_test),
                    epochs=30, callbacks=[lr_reduction, early_stopping])

# 모델 평가
loss, accuracy = model.evaluate(x_test, y_test)
print(f'Test Accuracy: {accuracy * 100:.2f}%')


Epoch 1/30
[1m469/469[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m39s[0m 61ms/step - accuracy: 0.5144 - loss: 1.6067 - val_accuracy: 0.2493 - val_loss: 2.3925 - learning_rate: 3.0000e-04
Epoch 2/30
[1m469/469[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m19s[0m 40ms/step - accuracy: 0.8848 - loss: 0.3666 - val_accuracy: 0.9853 - val_loss: 0.0457 - learning_rate: 3.0000e-04
Epoch 3/30
[1m469/469[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m20s[0m 42ms/step - accuracy: 0.9256 - loss: 0.2412 - val_accuracy: 0.9863 - val_loss: 0.0420 - learning_rate: 3.0000e-04
Epoch 4/30
[1m469/469[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m18s[0m 39ms/step - accuracy: 0.9404 - loss: 0.1993 - val_accuracy: 0.9880 - val_loss: 0.0372 - learning_rate: 3.0000e-04
Epoch 5/30
[1m469/469[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m19s[0m 40ms/step - accuracy: 0.9524 - loss: 0.1576 - val_accuracy: 0.9772 - val_loss: 0.0695 - learning_rate: 3.0000e-04
Epoch 6/30
[1m469/469[0m [32m━━━━━━━━