rkdls
diff --git a/‎03 - MNIST, CNN/01 - MNIST.py‎
Lines changed: 77 additions & 0 deletions b/‎03 - MNIST, CNN/01 - MNIST.py‎
Lines changed: 77 additions & 0 deletions
diff --git a/‎03 - MNIST, CNN/02 - Dropout.py‎
Lines changed: 63 additions & 0 deletions b/‎03 - MNIST, CNN/02 - Dropout.py‎
Lines changed: 63 additions & 0 deletions
diff --git a/‎03 - MNIST, CNN/03 - CNN.py‎
Lines changed: 90 additions & 0 deletions b/‎03 - MNIST, CNN/03 - CNN.py‎
Lines changed: 90 additions & 0 deletions
diff --git a/‎03 - MNIST, CNN/04 - tf.contrib.layers.py‎
Lines changed: 80 additions & 0 deletions b/‎03 - MNIST, CNN/04 - tf.contrib.layers.py‎
Lines changed: 80 additions & 0 deletions
@@ -0,0 +1,77 @@
+# -*- coding: utf-8 -*-
+# Solves MNIST (handwritten digit recognition), the "Hello World" of machine
+# learning, with a plain fully connected neural network.
+
+import tensorflow as tf
+
+from tensorflow.examples.tutorials.mnist import input_data
+# Load the data through the mnist module that ships with TensorFlow.
+# If the MNIST files are not in the given folder, they are downloaded automatically.
+# The one_hot option turns the labels into the one-hot form seen in the
+# earlier animal classification example.
+mnist = input_data.read_data_sets("./mnist/data/", one_hot=True)
+
+
+#########
+# Build the neural network model
+######
+# The input has shape [batch size, number of features].
+# Each handwritten image is 28x28 pixels, flattened into 784 features.
+X = tf.placeholder(tf.float32, [None, 784])
+# The output is one of 10 classes (digits 0-9).
+Y = tf.placeholder(tf.float32, [None, 10])
+
+# Layer layout:
+# 784 (input features)
+#   -> 256 (hidden units) -> 256 (hidden units)
+#   -> 10 (class scores for digits 0-9)
+W1 = tf.Variable(tf.random_normal([784, 256], stddev=0.01))
+W2 = tf.Variable(tf.random_normal([256, 256], stddev=0.01))
+W3 = tf.Variable(tf.random_normal([256, 10], stddev=0.01))
+
+# Multiply the input by the weights and apply ReLU to form the first layer.
+L1 = tf.nn.relu(tf.matmul(X, W1))
+# Multiply the output of L1 by the weights and apply ReLU to form the second layer.
+L2 = tf.nn.relu(tf.matmul(L1, W2))
+# The final output multiplies L2 by W3 to produce 10 class scores (logits).
+# No activation is applied here; the loss below applies softmax itself.
+model = tf.matmul(L2, W3)
+
+# Pass logits/labels by keyword: TensorFlow 1.0+ rejects positional arguments
+# for this function because the argument order was easy to get wrong.
+cost = tf.reduce_mean(
+    tf.nn.softmax_cross_entropy_with_logits(logits=model, labels=Y))
+optimizer = tf.train.AdamOptimizer(0.001).minimize(cost)
+
+
+#########
+# Train the neural network model
+######
+init = tf.global_variables_initializer()
+sess = tf.Session()
+sess.run(init)
+
+batch_size = 100
+# Number of full mini-batches per epoch.
+total_batch = mnist.train.num_examples // batch_size
+
+for epoch in range(15):
+    total_cost = 0
+
+    for i in range(total_batch):
+        # next_batch from TensorFlow's mnist helper returns the requested
+        # number of training examples.
+        batch_xs, batch_ys = mnist.train.next_batch(batch_size)
+        # Run the update and fetch the cost in a single call so the forward
+        # pass is not computed twice per step.
+        _, cost_val = sess.run([optimizer, cost],
+                               feed_dict={X: batch_xs, Y: batch_ys})
+        total_cost += cost_val
+
+    print 'Epoch:', '%04d' % (epoch + 1),\
+            'Avg. cost =', '{:.3f}'.format(total_cost / total_batch)
+
+print '최적화 완료!'
+
+
+#########
+# Check the result
+######
+# Compare the label predicted by the model with the true label in Y.
+# tf.argmax picks the index of the largest score as the predicted label.
+# e.g. [0.1 0 0 0.7 0 0.2 0 0 0 0] -> 3 (0-based index of the largest value)
+check_prediction = tf.equal(tf.argmax(model, 1), tf.argmax(Y, 1))
+accuracy = tf.reduce_mean(tf.cast(check_prediction, tf.float32))
+print '정확도:', sess.run(accuracy,
+                            feed_dict={X: mnist.test.images,
+                                       Y: mnist.test.labels})
@@ -0,0 +1,63 @@
+# -*- coding: utf-8 -*-
+# Tries out Dropout, one of the techniques for preventing overfitting.
+
+import tensorflow as tf
+
+from tensorflow.examples.tutorials.mnist import input_data
+mnist = input_data.read_data_sets("./mnist/data/", one_hot=True)
+
+
+#########
+# Build the neural network model
+######
+X = tf.placeholder(tf.float32, [None, 784])
+Y = tf.placeholder(tf.float32, [None, 10])
+# Probability of keeping each unit. It is a placeholder rather than a constant
+# so that dropout can be switched off (keep_prob = 1.0) when evaluating;
+# otherwise units would also be dropped at random while measuring accuracy.
+keep_prob = tf.placeholder(tf.float32)
+
+W1 = tf.Variable(tf.random_normal([784, 256], stddev=0.01))
+W2 = tf.Variable(tf.random_normal([256, 256], stddev=0.01))
+W3 = tf.Variable(tf.random_normal([256, 10], stddev=0.01))
+
+L1 = tf.nn.relu(tf.matmul(X, W1))
+# Apply dropout with TensorFlow's built-in function.
+# Just pass the layer and the keep probability. Pure magic!
+L1 = tf.nn.dropout(L1, keep_prob)
+L2 = tf.nn.relu(tf.matmul(L1, W2))
+L2 = tf.nn.dropout(L2, keep_prob)
+model = tf.matmul(L2, W3)
+
+# Pass logits/labels by keyword: TensorFlow 1.0+ rejects positional arguments
+# for this function.
+cost = tf.reduce_mean(
+    tf.nn.softmax_cross_entropy_with_logits(logits=model, labels=Y))
+optimizer = tf.train.AdamOptimizer(0.001).minimize(cost)
+
+
+#########
+# Train the neural network model
+######
+init = tf.global_variables_initializer()
+sess = tf.Session()
+sess.run(init)
+
+batch_size = 100
+# Number of full mini-batches per epoch.
+total_batch = mnist.train.num_examples // batch_size
+
+for epoch in range(15):
+    total_cost = 0
+
+    for i in range(total_batch):
+        batch_xs, batch_ys = mnist.train.next_batch(batch_size)
+        # Keep 80% of the units while training. Fetch the cost in the same
+        # call as the update so it is computed once, with the same dropout mask.
+        _, cost_val = sess.run([optimizer, cost],
+                               feed_dict={X: batch_xs,
+                                          Y: batch_ys,
+                                          keep_prob: 0.8})
+        total_cost += cost_val
+
+    print 'Epoch:', '%04d' % (epoch + 1), \
+        'Avg. cost =', '{:.3f}'.format(total_cost / total_batch)
+
+print '최적화 완료!'
+
+
+#########
+# Check the result
+######
+check_prediction = tf.equal(tf.argmax(model, 1), tf.argmax(Y, 1))
+accuracy = tf.reduce_mean(tf.cast(check_prediction, tf.float32))
+# keep_prob = 1.0 disables dropout so the whole network is used for prediction.
+print '정확도:', sess.run(accuracy,
+                       feed_dict={X: mnist.test.images,
+                                  Y: mnist.test.labels,
+                                  keep_prob: 1.0})
@@ -0,0 +1,90 @@
+# -*- coding: utf-8 -*-
+# Uses a CNN, the best-known neural network model in image processing,
+# to reach a higher recognition rate.
+
+import tensorflow as tf
+
+from tensorflow.examples.tutorials.mnist import input_data
+mnist = input_data.read_data_sets("./mnist/data/", one_hot=True)
+
+
+#########
+# Build the neural network model
+######
+# The earlier models took each 28x28 image as one flat dimension (784 values);
+# for a CNN the input keeps its 2-D plane plus a feature (channel) dimension.
+X = tf.placeholder(tf.float32, [None, 28, 28, 1])
+Y = tf.placeholder(tf.float32, [None, 10])
+# Keep probabilities for dropout. They are placeholders rather than constants
+# so dropout can be switched off (1.0) when evaluating; otherwise units would
+# also be dropped at random while measuring accuracy.
+keep_prob_conv = tf.placeholder(tf.float32)  # after the conv/pool layers
+keep_prob_fc = tf.placeholder(tf.float32)    # after the fully connected layer
+
+# Variables and layers are laid out as follows.
+# W1 [3 3 1 32] -> [3 3]: kernel size, 1: number of input channels of X, 32: number of filters
+# L1 Conv shape=(?, 28, 28, 32)
+#    Pool     ->(?, 14, 14, 32)
+W1 = tf.Variable(tf.random_normal([3, 3, 1, 32], stddev=0.01))
+# tf.nn.conv2d makes it easy to build a convolution layer that slides one step at a time.
+# padding='SAME' pads the border so the kernel can slide one step past the
+# outermost pixels, which keeps the 28x28 spatial size noted above.
+L1 = tf.nn.relu(tf.nn.conv2d(X, W1, strides=[1, 1, 1, 1], padding='SAME'))
+# Pooling is just as easy to set up with tf.nn.max_pool.
+L1 = tf.nn.max_pool(L1, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding='SAME')
+L1 = tf.nn.dropout(L1, keep_prob_conv)
+
+# L2 Conv shape=(?, 14, 14, 64)
+#    Pool     ->(?, 7, 7, 64)
+#    Reshape  ->(?, 7 * 7 * 64)
+# In W2's [3, 3, 32, 64], 32 is the last dimension of W1 (its number of
+# filters), i.e. the number of channels coming out of L1.
+W2 = tf.Variable(tf.random_normal([3, 3, 32, 64], stddev=0.01))
+L2 = tf.nn.relu(tf.nn.conv2d(L1, W2, strides=[1, 1, 1, 1], padding='SAME'))
+L2 = tf.nn.max_pool(L2, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding='SAME')
+# Flatten for the fully connected layer.
+# The size comes from the preceding pool output, (?, 7, 7, 64).
+L2 = tf.reshape(L2, [-1, 7 * 7 * 64])
+L2 = tf.nn.dropout(L2, keep_prob_conv)
+
+# FC layer: 7x7x64 inputs -> 256 outputs
+W3 = tf.Variable(tf.random_normal([7 * 7 * 64, 256], stddev=0.01))
+L3 = tf.nn.relu(tf.matmul(L2, W3))
+L3 = tf.nn.dropout(L3, keep_prob_fc)
+
+# Final output: takes the 256 outputs of L3 and produces 10 values, one per label 0-9.
+W4 = tf.Variable(tf.random_normal([256, 10], stddev=0.01))
+model = tf.matmul(L3, W4)
+
+# Pass logits/labels by keyword: TensorFlow 1.0+ rejects positional arguments
+# for this function.
+cost = tf.reduce_mean(
+    tf.nn.softmax_cross_entropy_with_logits(logits=model, labels=Y))
+optimizer = tf.train.AdamOptimizer(0.001).minimize(cost)
+# Try switching the optimizer to RMSPropOptimizer and compare the results.
+# optimizer = tf.train.RMSPropOptimizer(0.001, 0.9).minimize(cost)
+
+
+#########
+# Train the neural network model
+######
+init = tf.global_variables_initializer()
+sess = tf.Session()
+sess.run(init)
+
+batch_size = 100
+# Number of full mini-batches per epoch.
+total_batch = mnist.train.num_examples // batch_size
+
+for epoch in range(15):
+    total_cost = 0
+
+    for i in range(total_batch):
+        batch_xs, batch_ys = mnist.train.next_batch(batch_size)
+        # Reshape the image data into the [28 28 1] layout the CNN expects.
+        batch_xs = batch_xs.reshape(-1, 28, 28, 1)
+        # Dropout is active only during training: keep 80% after the
+        # conv/pool layers and 50% after the fully connected layer.
+        _, cost_val = sess.run([optimizer, cost],
+                               feed_dict={X: batch_xs,
+                                          Y: batch_ys,
+                                          keep_prob_conv: 0.8,
+                                          keep_prob_fc: 0.5})
+        total_cost += cost_val
+
+    print 'Epoch:', '%04d' % (epoch + 1), \
+        'Avg. cost =', '{:.3f}'.format(total_cost / total_batch)
+
+print '최적화 완료!'
+
+
+#########
+# Check the result
+######
+check_prediction = tf.equal(tf.argmax(model, 1), tf.argmax(Y, 1))
+accuracy = tf.reduce_mean(tf.cast(check_prediction, tf.float32))
+# Keep probabilities of 1.0 disable dropout so the whole network is used.
+print '정확도:', sess.run(accuracy,
+                       feed_dict={X: mnist.test.images.reshape(-1, 28, 28, 1),
+                                  Y: mnist.test.labels,
+                                  keep_prob_conv: 1.0,
+                                  keep_prob_fc: 1.0})
@@ -0,0 +1,80 @@
+# -*- coding: utf-8 -*-
+# Tries out tensorflow.contrib.layers, a collection of utilities that makes
+# building neural networks easier.
+# This is a rewrite of 03 - CNN.py, so compare the two sources.
+# TensorFlow ships a great many functions and utilities like these that are simple to use.
+# Still, it is best to get comfortable with the basic concepts first, so the
+# later examples keep using the basic functions wherever possible.
+
+import tensorflow as tf
+
+from tensorflow.examples.tutorials.mnist import input_data
+mnist = input_data.read_data_sets("./mnist/data/", one_hot=True)
+
+
+#########
+# Options
+######
+n_width = 28  # width of an MNIST image
+n_height = 28  # height of an MNIST image
+n_output = 10
+
+#########
+# Build the neural network model
+######
+# Image tensors are laid out as [batch, height, width, channels].
+X = tf.placeholder(tf.float32, [None, n_height, n_width, 1])
+Y = tf.placeholder(tf.float32, [None, n_output])
+# Training/evaluation switches. Dropout and batch normalization must behave
+# differently when evaluating, so both are fed at run time instead of being
+# fixed in the graph.
+keep_prob = tf.placeholder(tf.float32)
+is_training = tf.placeholder(tf.bool)
+
+# Given just the inputs, the output size and the kernel size, the layer
+# applies the activation function and works out the remaining numbers needed
+# for a convolutional network by itself.
+# In particular it initializes the weights with xavier_initializer, so it
+# generally builds an efficient network without much extra care.
+L1 = tf.contrib.layers.conv2d(X, 32, [3, 3])
+L2 = tf.contrib.layers.max_pool2d(L1, [2, 2])
+# The normalizer_fn argument makes it easy to apply a normalizer technique
+# that guards against overfitting and the like.
+L3 = tf.contrib.layers.conv2d(L2, 64, [3, 3],
+                              normalizer_fn=tf.nn.dropout,
+                              normalizer_params={'keep_prob': keep_prob})
+L4 = tf.contrib.layers.max_pool2d(L3, [2, 2])
+
+L5 = tf.contrib.layers.flatten(L4)
+# updates_collections=None makes batch_norm update its moving averages in
+# place during training; by default the updates are only collected in
+# tf.GraphKeys.UPDATE_OPS and would never run with the plain minimize() below.
+L5 = tf.contrib.layers.fully_connected(L5, 256,
+                                       normalizer_fn=tf.contrib.layers.batch_norm,
+                                       normalizer_params={
+                                           'is_training': is_training,
+                                           'updates_collections': None})
+# fully_connected applies ReLU by default; the output layer must produce raw
+# logits for the softmax loss, so the activation is disabled here.
+model = tf.contrib.layers.fully_connected(L5, n_output, activation_fn=None)
+
+# Pass logits/labels by keyword: TensorFlow 1.0+ rejects positional arguments
+# for this function.
+cost = tf.reduce_mean(
+    tf.nn.softmax_cross_entropy_with_logits(logits=model, labels=Y))
+optimizer = tf.train.AdamOptimizer(0.001).minimize(cost)
+
+
+#########
+# Train the neural network model
+######
+init = tf.global_variables_initializer()
+sess = tf.Session()
+sess.run(init)
+
+batch_size = 100
+# Number of full mini-batches per epoch.
+total_batch = mnist.train.num_examples // batch_size
+
+for epoch in range(15):
+    total_cost = 0
+
+    for i in range(total_batch):
+        batch_xs, batch_ys = mnist.train.next_batch(batch_size)
+        # Reshape the image data into the [28 28 1] layout the CNN expects.
+        batch_xs = batch_xs.reshape(-1, n_height, n_width, 1)
+        # Training mode: dropout keeps 80% of the units and batch
+        # normalization uses (and accumulates) per-batch statistics.
+        _, cost_val = sess.run([optimizer, cost],
+                               feed_dict={X: batch_xs,
+                                          Y: batch_ys,
+                                          keep_prob: 0.8,
+                                          is_training: True})
+        total_cost += cost_val
+
+    print 'Epoch:', '%04d' % (epoch + 1), \
+        'Avg. cost =', '{:.3f}'.format(total_cost / total_batch)
+
+print '최적화 완료!'
+
+
+#########
+# Check the result
+######
+check_prediction = tf.equal(tf.argmax(model, 1), tf.argmax(Y, 1))
+accuracy = tf.reduce_mean(tf.cast(check_prediction, tf.float32))
+# Evaluation mode: dropout is disabled and batch normalization uses the
+# moving averages accumulated during training.
+print '정확도:', sess.run(accuracy,
+                       feed_dict={X: mnist.test.images.reshape(-1, n_height, n_width, 1),
+                                  Y: mnist.test.labels,
+                                  keep_prob: 1.0,
+                                  is_training: False})