solaris33 · June 15, 2018 11:49
diff --git a/mnist_classification_using_cnn_with_tfsaver.py b/mnist_classification_using_cnn_with_tfsaver.py
 # -*- coding: utf-8 -*-
 # Convolutional Neural Networks(CNN)을 이용한 MNIST 분류기(Classifier)
 # Author : solaris33
 # Project URL : http://solarisailab.com/archives/2524

 import tensorflow as tf
 import os

 # MNIST 데이터를 다운로드 합니다.
 from tensorflow.examples.tutorials.mnist import input_data
 mnist = input_data.read_data_sets("/tmp/data/", one_hot=True)

 # CNN 모델을 정의합니다. 
 def build_CNN_classifier(x):
  # MNIST 데이터를 3차원 형태로 reshape합니다. MNIST 데이터는 grayscale 이미지기 떄문에 3번째차원(컬러채널)의 값은 1입니다. 
  x_image = tf.reshape(x, [-1, 28, 28, 1])

  # 첫번째 Convolution Layer 
  # 5x5 Kernel Size를 가진 32개의 Filter를 적용합니다.
  # 28x28x1 -> 28x28x32
  W_conv1 = tf.Variable(tf.truncated_normal(shape=[5, 5, 1, 32], stddev=5e-2))
  b_conv1 = tf.Variable(tf.constant(0.1, shape=[32]))
  h_conv1 = tf.nn.relu(tf.nn.conv2d(x_image, W_conv1, strides=[1, 1, 1, 1], padding='SAME') + b_conv1)

  # 첫번째 Pooling Layer
  # Max Pooling을 이용해서 이미지의 크기를 1/2로 downsample합니다.
  # 28x28x32 -> 14x14x32
  h_pool1 = tf.nn.max_pool(h_conv1, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding='SAME')

  # 두번째 Convolutional Layer 
  # 5x5 Kernel Size를 가진 64개의 Filter를 적용합니다.
  # 14x14x32 -> 14x14x64
  W_conv2 = tf.Variable(tf.truncated_normal(shape=[5, 5, 32, 64], stddev=5e-2))
  b_conv2 = tf.Variable(tf.constant(0.1, shape=[64]))
  h_conv2 = tf.nn.relu(tf.nn.conv2d(h_pool1, W_conv2, strides=[1, 1, 1, 1], padding='SAME') + b_conv2)

  # 두번째 Pooling Layer
  # Max Pooling을 이용해서 이미지의 크기를 1/2로 downsample합니다.
  # 14x14x64 -> 7x7x64
  h_pool2 = tf.nn.max_pool(h_conv2, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding='SAME')

  # Fully Connected Layer
  # 7x7 크기를 가진 64개의 activation map을 1024개의 특징들로 변환합니다. 
  # 7x7x64(3136) -> 1024
  W_fc1 = tf.Variable(tf.truncated_normal(shape=[7 * 7 * 64, 1024], stddev=5e-2))
  b_fc1 = tf.Variable(tf.constant(0.1, shape=[1024]))
  h_pool2_flat = tf.reshape(h_pool2, [-1, 7*7*64])
  h_fc1 = tf.nn.relu(tf.matmul(h_pool2_flat, W_fc1) + b_fc1)

  # Output Layer
  # 1024개의 특징들(feature)을 10개의 클래스-숫자 0-9-로 변환합니다.
  # 1024 -> 10
  W_output = tf.Variable(tf.truncated_normal(shape=[1024, 10], stddev=5e-2))
  b_output = tf.Variable(tf.constant(0.1, shape=[10]))
  logits = tf.matmul(h_fc1, W_output) + b_output
  y_pred = tf.nn.softmax(logits)

  return y_pred, logits

 # 인풋 아웃풋 데이터를 받기위한 플레이스홀더를 정의합니다.
 x = tf.placeholder(tf.float32, shape=[None, 784])
 y = tf.placeholder(tf.float32, shape=[None, 10])

 # Convolutional Neural Networks(CNN)을 선언합니다.
 y_pred, logits = build_CNN_classifier(x)

 # Cross Entropy를 손실 함수(loss function)으로 정의하고 옵티마이저를 정의합니다.
 loss = tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(labels=y, logits=logits))
 train_step = tf.train.AdamOptimizer(1e-4).minimize(loss)

 # 정확도를 계산하는 연산을 추가합니다.
 correct_prediction = tf.equal(tf.argmax(y_pred, 1), tf.argmax(y, 1))
 accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))

 # tf.train.Saver를 이용해서 모델과 파라미터를 저장합니다.
 SAVER_DIR = "model"
 saver = tf.train.Saver()
 checkpoint_path = os.path.join(SAVER_DIR, "model")
 ckpt = tf.train.get_checkpoint_state(SAVER_DIR)

 # 세션을 열어 실제 학습을 진행합니다.
 with tf.Session() as sess:
  # 모든 변수들을 초기화합니다.
  sess.run(tf.global_variables_initializer())

  # 만약 저장된 모델과 파라미터가 있으면 이를 불러오고 (Restore)
  # Restored 모델을 이용해서 테스트 데이터에 대한 정확도를 출력하고 프로그램을 종료합니다.
  if ckpt and ckpt.model_checkpoint_path:
    saver.restore(sess, ckpt.model_checkpoint_path)    
    print("테스트 데이터 정확도 (Restored) : %f" % accuracy.eval(feed_dict={x: mnist.test.images, y: mnist.test.labels}))
    sess.close()
    exit()

  # 10000 Step만큼 최적화를 수행합니다.
  for step in range(10000):
    # 50개씩 MNIST 데이터를 불러옵니다.
    batch = mnist.train.next_batch(50)
    # 100 Step마다 training 데이터셋에 대한 정확도를 출력하고 tf.train.Saver를 이용해서 모델과 파라미터를 저장합니다.
    if step % 100 == 0:      
      saver.save(sess, checkpoint_path, global_step=step)
      train_accuracy = accuracy.eval(feed_dict={x: batch[0], y: batch[1]})
      print("반복(Epoch): %d, 트레이닝 데이터 정확도: %f" % (step, train_accuracy))
    # 옵티마이저를 실행해 학습을 진행합니다.
    sess.run([train_step], feed_dict={x: batch[0], y: batch[1]})

  # 학습이 끝나면 테스트 데이터에 대한 정확도를 출력합니다.
  print("테스트 데이터 정확도: %f" % accuracy.eval(feed_dict={x: mnist.test.images, y: mnist.test.labels}))
	# -- coding: utf-8 --
	# Convolutional Neural Networks(CNN)을 이용한 MNIST 분류기(Classifier)
	# Author : solaris33
	# Project URL : http://solarisailab.com/archives/2524

	import tensorflow as tf
	import os

	# MNIST 데이터를 다운로드 합니다.
	from tensorflow.examples.tutorials.mnist import input_data
	mnist = input_data.read_data_sets("/tmp/data/", one_hot=True)

	# CNN 모델을 정의합니다.
	def build_CNN_classifier(x):
	# MNIST 데이터를 3차원 형태로 reshape합니다. MNIST 데이터는 grayscale 이미지기 떄문에 3번째차원(컬러채널)의 값은 1입니다.
	x_image = tf.reshape(x, [-1, 28, 28, 1])

	# 첫번째 Convolution Layer
	# 5x5 Kernel Size를 가진 32개의 Filter를 적용합니다.
	# 28x28x1 -> 28x28x32
	W_conv1 = tf.Variable(tf.truncated_normal(shape=[5, 5, 1, 32], stddev=5e-2))
	b_conv1 = tf.Variable(tf.constant(0.1, shape=[32]))
	h_conv1 = tf.nn.relu(tf.nn.conv2d(x_image, W_conv1, strides=[1, 1, 1, 1], padding='SAME') + b_conv1)

	# 첫번째 Pooling Layer
	# Max Pooling을 이용해서 이미지의 크기를 1/2로 downsample합니다.
	# 28x28x32 -> 14x14x32
	h_pool1 = tf.nn.max_pool(h_conv1, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding='SAME')

	# 두번째 Convolutional Layer
	# 5x5 Kernel Size를 가진 64개의 Filter를 적용합니다.
	# 14x14x32 -> 14x14x64
	W_conv2 = tf.Variable(tf.truncated_normal(shape=[5, 5, 32, 64], stddev=5e-2))
	b_conv2 = tf.Variable(tf.constant(0.1, shape=[64]))
	h_conv2 = tf.nn.relu(tf.nn.conv2d(h_pool1, W_conv2, strides=[1, 1, 1, 1], padding='SAME') + b_conv2)

	# 두번째 Pooling Layer
	# Max Pooling을 이용해서 이미지의 크기를 1/2로 downsample합니다.
	# 14x14x64 -> 7x7x64
	h_pool2 = tf.nn.max_pool(h_conv2, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding='SAME')

	# Fully Connected Layer
	# 7x7 크기를 가진 64개의 activation map을 1024개의 특징들로 변환합니다.
	# 7x7x64(3136) -> 1024
	W_fc1 = tf.Variable(tf.truncated_normal(shape=[7 * 7 * 64, 1024], stddev=5e-2))
	b_fc1 = tf.Variable(tf.constant(0.1, shape=[1024]))
	h_pool2_flat = tf.reshape(h_pool2, [-1, 7764])
	h_fc1 = tf.nn.relu(tf.matmul(h_pool2_flat, W_fc1) + b_fc1)

	# Output Layer
	# 1024개의 특징들(feature)을 10개의 클래스-숫자 0-9-로 변환합니다.
	# 1024 -> 10
	W_output = tf.Variable(tf.truncated_normal(shape=[1024, 10], stddev=5e-2))
	b_output = tf.Variable(tf.constant(0.1, shape=[10]))
	logits = tf.matmul(h_fc1, W_output) + b_output
	y_pred = tf.nn.softmax(logits)

	return y_pred, logits

	# 인풋 아웃풋 데이터를 받기위한 플레이스홀더를 정의합니다.
	x = tf.placeholder(tf.float32, shape=[None, 784])
	y = tf.placeholder(tf.float32, shape=[None, 10])

	# Convolutional Neural Networks(CNN)을 선언합니다.
	y_pred, logits = build_CNN_classifier(x)

	# Cross Entropy를 손실 함수(loss function)으로 정의하고 옵티마이저를 정의합니다.
	loss = tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(labels=y, logits=logits))
	train_step = tf.train.AdamOptimizer(1e-4).minimize(loss)

	# 정확도를 계산하는 연산을 추가합니다.
	correct_prediction = tf.equal(tf.argmax(y_pred, 1), tf.argmax(y, 1))
	accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))

	# tf.train.Saver를 이용해서 모델과 파라미터를 저장합니다.
	SAVER_DIR = "model"
	saver = tf.train.Saver()
	checkpoint_path = os.path.join(SAVER_DIR, "model")
	ckpt = tf.train.get_checkpoint_state(SAVER_DIR)

	# 세션을 열어 실제 학습을 진행합니다.
	with tf.Session() as sess:
	# 모든 변수들을 초기화합니다.
	sess.run(tf.global_variables_initializer())

	# 만약 저장된 모델과 파라미터가 있으면 이를 불러오고 (Restore)
	# Restored 모델을 이용해서 테스트 데이터에 대한 정확도를 출력하고 프로그램을 종료합니다.
	if ckpt and ckpt.model_checkpoint_path:
	saver.restore(sess, ckpt.model_checkpoint_path)
	print("테스트 데이터 정확도 (Restored) : %f" % accuracy.eval(feed_dict={x: mnist.test.images, y: mnist.test.labels}))
	sess.close()
	exit()

	# 10000 Step만큼 최적화를 수행합니다.
	for step in range(10000):
	# 50개씩 MNIST 데이터를 불러옵니다.
	batch = mnist.train.next_batch(50)
	# 100 Step마다 training 데이터셋에 대한 정확도를 출력하고 tf.train.Saver를 이용해서 모델과 파라미터를 저장합니다.
	if step % 100 == 0:
	saver.save(sess, checkpoint_path, global_step=step)
	train_accuracy = accuracy.eval(feed_dict={x: batch[0], y: batch[1]})
	print("반복(Epoch): %d, 트레이닝 데이터 정확도: %f" % (step, train_accuracy))
	# 옵티마이저를 실행해 학습을 진행합니다.
	sess.run([train_step], feed_dict={x: batch[0], y: batch[1]})

	# 학습이 끝나면 테스트 데이터에 대한 정확도를 출력합니다.
	print("테스트 데이터 정확도: %f" % accuracy.eval(feed_dict={x: mnist.test.images, y: mnist.test.labels}))