from IPython.display import display, Image
import os, warnings

# Suppress every warning category for the rest of the session so library
# deprecation notices do not clutter the notebook output.
warnings.simplefilter('ignore')


# Render the CNN architecture diagram stored next to the notebook.
display(Image(filename="img/cnn.png"))


import tensorflow as tf
from tensorflow.keras import models
from tensorflow.keras import layers
import matplotlib.pyplot as plt

# Report the installed TensorFlow release so the results can be reproduced.
print(tf.version.VERSION)

2.16.1


from tensorflow.keras.datasets import mnist
from tensorflow.keras.utils import to_categorical

# Fetch MNIST; load_data() yields a (train, test) pair of (images, labels).
train_split, test_split = mnist.load_data()
train_images, train_labels = train_split
test_images, test_labels = test_split

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/mnist.npz
11490434/11490434 ━━━━━━━━━━━━━━━━━━━━ 5s 0us/step


# Build the CNN as a linear stack of layers: two convolution + max-pooling
# stages first, then a small fully connected classifier.
model = models.Sequential()

# Declare the input shape with an explicit Input object instead of passing
# `input_shape=` to the first layer; Keras 3 (shipped with TF 2.16) warns
# against the latter for Sequential models.
model.add(layers.Input(shape=(28, 28, 1)))
model.add(layers.Conv2D(filters=32, kernel_size=(3, 3), activation='relu'))
model.add(layers.MaxPooling2D(pool_size=(2, 2)))

model.add(layers.Conv2D(filters=64, kernel_size=(3, 3), activation='relu'))
model.add(layers.MaxPooling2D(pool_size=(2, 2)))


# Flatten the feature maps into a vector and classify into the 10 digit
# classes; softmax turns the final layer into a probability distribution.
model.add(layers.Flatten())
model.add(layers.Dense(64, activation='relu'))
model.add(layers.Dense(10, activation='softmax'))


# Print the per-layer output shapes and parameter counts.
model.summary()

Model: "sequential"

┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━┓
┃ Layer (type)                         ┃ Output Shape                ┃         Param # ┃
┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━┩
│ conv2d (Conv2D)                      │ (None, 26, 26, 32)          │             320 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ max_pooling2d (MaxPooling2D)         │ (None, 13, 13, 32)          │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ conv2d_1 (Conv2D)                    │ (None, 11, 11, 64)          │          18,496 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ max_pooling2d_1 (MaxPooling2D)       │ (None, 5, 5, 64)            │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ flatten (Flatten)                    │ (None, 1600)                │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ dense (Dense)                        │ (None, 64)                  │         102,464 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ dense_1 (Dense)                      │ (None, 10)                  │             650 │
└──────────────────────────────────────┴─────────────────────────────┴─────────────────┘

 Total params: 121,930 (476.29 KB)

 Trainable params: 121,930 (476.29 KB)

 Non-trainable params: 0 (0.00 B)


# Input data: keep each image as a 28x28 grid, append a single channel axis,
# and divide by 255 to normalise the value range. Using -1 for the sample
# axis lets NumPy infer the number of images, so this also works on a subset
# of the data instead of only the full 60000/10000 split.
train_images = train_images.reshape((-1, 28, 28, 1))
train_images = train_images.astype('float32') / 255

test_images = test_images.reshape((-1, 28, 28, 1))
test_images = test_images.astype('float32') / 255

# Output data: one-hot encode the labels. The class count is passed
# explicitly so the encoded width always matches the 10-unit softmax layer,
# even if some digit is missing from the labels being encoded.
train_labels = to_categorical(train_labels, num_classes=10)
test_labels = to_categorical(test_labels, num_classes=10)


# Show the train/test shapes of the inputs (X) and the one-hot targets (y).
for caption, train_part, test_part in (
    ("입력층 데이터(X) : ", train_images, test_images),
    ("출력층 데이터(y) : ", train_labels, test_labels),
):
    print(caption, train_part.shape, test_part.shape)

입력층 데이터(X) :  (60000, 28, 28, 1) (10000, 28, 28, 1)
출력층 데이터(y) :  (60000, 10) (10000, 10)


%%time

# Configure training: RMSprop optimiser, categorical cross-entropy loss (the
# targets are one-hot encoded), and accuracy as the reported metric.
model.compile(
    loss='categorical_crossentropy',
    optimizer='rmsprop',
    metrics=['accuracy'],
)

# Train for 5 epochs in mini-batches of 64 and keep the returned History
# object for later inspection and plotting.
# NOTE(review): the test split doubles as the validation data here.
hist = model.fit(
    x=train_images,
    y=train_labels,
    batch_size=64,
    epochs=5,
    validation_data=(test_images, test_labels),
)

Epoch 1/5
938/938 ━━━━━━━━━━━━━━━━━━━━ 13s 13ms/step - accuracy: 0.8778 - loss: 0.3841 - val_accuracy: 0.9823 - val_loss: 0.0554
Epoch 2/5
938/938 ━━━━━━━━━━━━━━━━━━━━ 13s 13ms/step - accuracy: 0.9828 - loss: 0.0566 - val_accuracy: 0.9886 - val_loss: 0.0366
Epoch 3/5
938/938 ━━━━━━━━━━━━━━━━━━━━ 13s 14ms/step - accuracy: 0.9896 - loss: 0.0345 - val_accuracy: 0.9903 - val_loss: 0.0298
Epoch 4/5
938/938 ━━━━━━━━━━━━━━━━━━━━ 13s 14ms/step - accuracy: 0.9915 - loss: 0.0251 - val_accuracy: 0.9898 - val_loss: 0.0295
Epoch 5/5
938/938 ━━━━━━━━━━━━━━━━━━━━ 12s 13ms/step - accuracy: 0.9941 - loss: 0.0185 - val_accuracy: 0.9925 - val_loss: 0.0258
CPU times: total: 1min 11s
Wall time: 1min 3s


# Score the trained model on the test split; evaluate() returns the loss
# followed by the compiled metric (accuracy).
test_loss, test_acc = model.evaluate(x=test_images, y=test_labels)
print(test_acc)

313/313 ━━━━━━━━━━━━━━━━━━━━ 1s 3ms/step - accuracy: 0.9901 - loss: 0.0324
0.9925000071525574


# Training loss recorded by fit(), one value per epoch. As the trailing
# expression of the cell, its value is what the notebook displays.
hist.history['loss']

[0.17156606912612915,
 0.050500720739364624,
 0.03471164405345917,
 0.026060106232762337,
 0.020667018368840218]


# Plot the training loss and training accuracy per epoch on one axis.
plt.figure(figsize=(10,8),facecolor='white')
# Derive the epoch axis from the recorded history rather than hard-coding
# range(1, 6): the plot then stays valid when `epochs` in fit() changes,
# instead of failing with an x/y length mismatch.
x_lim = range(1, len(hist.history['loss']) + 1)
plt.plot(x_lim,  hist.history['loss'])
plt.plot(x_lim,  hist.history['accuracy'])
plt.legend(['loss','acc'])

<matplotlib.legend.Legend at 0x1b081d6f450>


import os

# Resolve the output location: <current working directory>/dl_model.
current_dir = os.getcwd()
path = os.path.join(current_dir, "dl_model")
savefile = os.path.join(path, "my_model_mnist.h5")

# Persist the trained model to the HDF5 file.
model.save(filepath=savefile)

# List the directory contents to confirm the file was written.
os.listdir(path)

WARNING:absl:You are saving your model as an HDF5 file via `model.save()` or `keras.saving.save_model(model)`. This file format is considered legacy. We recommend using instead the native Keras format, e.g. `model.save('my_model.keras')` or `keras.saving.save_model(model, 'my_model.keras')`.

['my_model_mnist.h5']


# Load the saved model back from disk and re-evaluate it on the test split
# to confirm that the restored model reproduces the trained model's score.
load_model = models.load_model(savefile)
load_model.evaluate(x=test_images, y=test_labels, verbose=2)

WARNING:absl:Compiled the loaded model, but the compiled metrics have yet to be built. `model.compile_metrics` will be empty until you train or evaluate the model.

313/313 - 1s - 3ms/step - accuracy: 0.9925 - loss: 0.0258

[0.025776531547307968, 0.9925000071525574]

CNN(Convolutional Neural Network) - 합성곱 신경망¶

학습 내용¶

목차

사전 설치¶

01 합성곱 신경망 알아보기

CNN은 무엇인가요?¶

우리가 구성할 모델¶

사용할 함수¶

02 MNIST 데이터 셋 준비

03 모델 만들기

완전 연결층(FCL) 추가¶

CNN 구조 알아보기¶

04. 모델에 맞춰 데이터 전처리

데이터 전처리¶

05 모델 학습 및 평가(CNN모델)

비용함수, 최적화 함수 구성¶

06. 모델 결과 시각화

07 모델 저장 및 불러오기

실습 01¶