TensorFlow Learning: Chapter 3 (Part 2)
阿新 • Posted 2018-12-05
The MNIST digit recognition problem
Handwritten digit recognition with a convolutional neural network
Techniques used: L2 regularization, a moving-average model, and a fixed learning rate (see the sketch below).
Results: 100% accuracy on the training set, 99.4% on the validation set, and 99.43% on the test set.
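
Before the code, a minimal self-contained sketch (using a hypothetical toy variable, not part of the model below) of the two supporting techniques: tf.contrib.layers.l2_regularizer adds a weight penalty to the loss, and tf.train.ExponentialMovingAverage maintains a smoothed shadow copy of each variable.

# Sketch only: 'w' is a hypothetical toy variable for illustration.
import tensorflow as tf

w = tf.Variable([3.0, 4.0], name='toy_weights')
# L2 penalty: scale * sum(w**2) / 2 = 0.0001 * (9 + 16) / 2 = 0.00125
l2_penalty = tf.contrib.layers.l2_regularizer(0.0001)(w)

ema = tf.train.ExponentialMovingAverage(0.99)
maintain_ema = ema.apply([w])   # creates and updates the shadow variable
shadow_w = ema.average(w)       # reads the smoothed value

with tf.Session() as sess:
    sess.run(tf.global_variables_initializer())
    sess.run(maintain_ema)
    print(sess.run([l2_penalty, shadow_w]))   # 0.00125, [3.0, 4.0]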
Part 1: Forward propagation and network parameters
# Define the forward pass and the network parameters
import tensorflow as tf

# Network configuration
INPUT_NODE = 784     # number of input-layer nodes
OUTPUT_NODE = 10     # number of output-layer nodes
IMAGE_SIZE = 28
NUM_CHANNELS = 1
# Size and depth of the first convolutional layer
CONV1_DEEP = 32
CONV1_SIZE = 5
# Size and depth of the second convolutional layer
CONV2_DEEP = 64
CONV2_SIZE = 5
# Number of nodes in the fully connected layer
FC_SIZE = 512

# Forward propagation
def inference(input_tensor, regularizer, avg_class, train=True, reuse=False):
    # First convolutional layer
    with tf.variable_scope('layer_conv1', reuse=reuse):
        conv1_weights = tf.get_variable(
            'weights', [CONV1_SIZE, CONV1_SIZE, NUM_CHANNELS, CONV1_DEEP],
            initializer=tf.truncated_normal_initializer(mean=0, stddev=0.1))
        conv1_biases = tf.get_variable(
            'biases', [CONV1_DEEP], initializer=tf.constant_initializer(0.0))
        conv1 = tf.nn.conv2d(input_tensor, conv1_weights, [1, 1, 1, 1], padding='SAME')
        relu1 = tf.nn.relu(tf.nn.bias_add(conv1, conv1_biases))

    # First pooling layer
    with tf.name_scope('layer_pool1'):
        pool1 = tf.nn.max_pool(relu1, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding='SAME')

    # Second convolutional layer
    with tf.variable_scope('layer_conv2', reuse=reuse):
        conv2_weights = tf.get_variable(
            'weights', [CONV2_SIZE, CONV2_SIZE, CONV1_DEEP, CONV2_DEEP],
            initializer=tf.truncated_normal_initializer(stddev=0.1))
        conv2_biases = tf.get_variable(
            'biases', [CONV2_DEEP], initializer=tf.constant_initializer(0.0))
        conv2 = tf.nn.conv2d(pool1, conv2_weights, [1, 1, 1, 1], padding='SAME')
        relu2 = tf.nn.relu(tf.nn.bias_add(conv2, conv2_biases))

    # Second pooling layer
    with tf.name_scope('layer_pool2'):
        pool2 = tf.nn.max_pool(relu2, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding='SAME')

    # Flatten the feature maps as input to the fully connected layers.
    # pool_shape[0] is the batch dimension; it is None for a [None, ...] placeholder,
    # so reshape with -1 to keep the batch size dynamic.
    pool_shape = pool2.get_shape().as_list()
    nodes = pool_shape[1] * pool_shape[2] * pool_shape[3]
    fc_input = tf.reshape(pool2, [-1, nodes])

    # Declare the first fully connected layer and run its forward pass
    with tf.variable_scope('layer1', reuse=reuse):
        weights = tf.get_variable(
            'weights', [nodes, FC_SIZE],
            initializer=tf.truncated_normal_initializer(mean=0, stddev=0.1))
        biases = tf.get_variable('biases', [FC_SIZE], initializer=tf.constant_initializer(0.0))
        if regularizer is not None:
            tf.add_to_collection('losses', regularizer(weights))
        if avg_class is None:
            fc1 = tf.nn.relu(tf.matmul(fc_input, weights) + biases)
        else:
            fc1 = tf.nn.relu(tf.matmul(fc_input, avg_class.average(weights))
                             + avg_class.average(biases))
        # Dropout to reduce overfitting (training only)
        if train:
            fc1 = tf.nn.dropout(fc1, 0.5)

    # Declare the second fully connected (output) layer and run its forward pass
    with tf.variable_scope('layer2', reuse=reuse):
        weights = tf.get_variable(
            'weights', [FC_SIZE, OUTPUT_NODE],
            initializer=tf.truncated_normal_initializer(mean=0, stddev=0.1))
        biases = tf.get_variable('biases', [OUTPUT_NODE], initializer=tf.constant_initializer(0.0))
        if regularizer is not None:
            tf.add_to_collection('losses', regularizer(weights))
        if avg_class is None:
            fc2 = tf.matmul(fc1, weights) + biases
        else:
            fc2 = tf.matmul(fc1, avg_class.average(weights)) + avg_class.average(biases)
    return fc2
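
As a quick sanity check, here is a sketch (assuming the code above is saved as mnist_inference.py, as the training script below also assumes) that feeds a dummy batch through the forward pass and verifies the logits shape:

# Sketch: shape check for the forward pass; dummy zero images stand in for real data.
import numpy as np
import tensorflow as tf
import mnist_inference

x = tf.placeholder(tf.float32, [None, 28, 28, 1], name='x-input')
logits = mnist_inference.inference(x, regularizer=None, avg_class=None,
                                   train=False, reuse=False)

with tf.Session() as sess:
    sess.run(tf.global_variables_initializer())
    out = sess.run(logits, feed_dict={x: np.zeros([4, 28, 28, 1], np.float32)})
    print(out.shape)   # expected: (4, 10)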
Part 2: Training, covering both the training and validation sets
# Neural network training script
import numpy as np
import tensorflow as tf
import matplotlib.pyplot as plt
from tensorflow.examples.tutorials.mnist import input_data
import mnist_inference

# Network configuration
BATCH_SIZE = 128
LEARNING_RATE_BASE = 0.8
LEARNING_RATE_DECAY = 0.99
REGULARIZATION_RATE = 0.0001
TRAINING_STEP = 30000
MOVING_AVERAGE_DECAY = 0.99
# Path and file name for saving the model
MODEL_SAVE_PATH = './model2.ckpt'

# Training curves
train_acc, valid_acc = [], []
train_loss, valid_loss = [], []
epochs = []

def train(mnist):
    x = tf.placeholder(tf.float32,
                       [None, mnist_inference.IMAGE_SIZE, mnist_inference.IMAGE_SIZE,
                        mnist_inference.NUM_CHANNELS], name='x-input')
    y_ = tf.placeholder(tf.float32, [None, mnist_inference.OUTPUT_NODE], name='y-input')

    regularizer = tf.contrib.layers.l2_regularizer(REGULARIZATION_RATE)
    y = mnist_inference.inference(x, regularizer=regularizer, avg_class=None,
                                  reuse=False, train=True)

    global_step = tf.Variable(0, trainable=False)
    variable_averages = tf.train.ExponentialMovingAverage(MOVING_AVERAGE_DECAY, global_step)
    variable_averages_op = variable_averages.apply(tf.trainable_variables())

    cross_entropy = tf.nn.sparse_softmax_cross_entropy_with_logits(
        logits=y, labels=tf.argmax(y_, 1))
    cross_entropy_mean = tf.reduce_mean(cross_entropy)
    loss = cross_entropy_mean + tf.add_n(tf.get_collection('losses'))

    # Fixed learning rate; the decayed alternative would be:
    # tf.train.exponential_decay(LEARNING_RATE_BASE, global_step,
    #                            mnist.train.num_examples / BATCH_SIZE, LEARNING_RATE_DECAY)
    learning_rate = 0.1
    train_step = tf.train.GradientDescentOptimizer(learning_rate).minimize(
        loss, global_step=global_step)
    with tf.control_dependencies([train_step, variable_averages_op]):
        train_op = tf.no_op(name='train')

    # Forward pass that uses the moving-average variables.
    # regularizer=None so the regularization losses are not added to the
    # collection a second time; train=False disables dropout for evaluation.
    average_y = mnist_inference.inference(x, regularizer=None,
                                          avg_class=variable_averages,
                                          train=False, reuse=tf.AUTO_REUSE)
    correct_prediction = tf.equal(tf.argmax(average_y, 1), tf.argmax(y_, 1))
    # tf.cast converts the boolean predictions to floats
    accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))

    # TensorFlow persistence class
    saver = tf.train.Saver()
    with tf.Session() as sess:
        tf.global_variables_initializer().run()
        for i in range(TRAINING_STEP):
            xs, ys = mnist.train.next_batch(BATCH_SIZE)
            xs = np.reshape(xs, [BATCH_SIZE, mnist_inference.IMAGE_SIZE,
                                 mnist_inference.IMAGE_SIZE, mnist_inference.NUM_CHANNELS])
            _, tra_loss, step = sess.run([train_op, loss, global_step],
                                         feed_dict={x: xs, y_: ys})

            val_xs, val_ys = mnist.validation.next_batch(BATCH_SIZE)
            val_xs = np.reshape(val_xs, [BATCH_SIZE, mnist_inference.IMAGE_SIZE,
                                         mnist_inference.IMAGE_SIZE, mnist_inference.NUM_CHANNELS])
            val_loss = sess.run(loss, feed_dict={x: val_xs, y_: val_ys})

            epochs.append(step)
            train_acc.append(sess.run(accuracy, feed_dict={x: xs, y_: ys}))
            train_loss.append(tra_loss)
            valid_acc.append(sess.run(accuracy, feed_dict={x: val_xs, y_: val_ys}))
            valid_loss.append(val_loss)

            # Report every 1000 steps
            if (i + 1) % 1000 == 0:
                print('<==%d==>, loss on training batch is %g.' % (i + 1, tra_loss))
                print(train_acc[-1])
                print(valid_acc[-1])

        plt.figure(1)
        plt.grid(True)
        plt.subplot(1, 2, 1)
        plt.plot(epochs, train_loss, color='red', label='train')
        plt.plot(epochs, valid_loss, color='blue', label='valid')
        plt.legend()
        plt.xlabel('Steps', fontsize=15)
        plt.ylabel('Loss', fontsize=15)
        plt.title('Loss', fontsize=15)
        plt.subplot(1, 2, 2)
        plt.plot(epochs, train_acc, color='red', label='train')
        plt.plot(epochs, valid_acc, color='blue', label='valid')
        plt.legend()
        plt.xlabel('Steps', fontsize=15)
        plt.ylabel('Accuracy', fontsize=15)
        plt.title('Acc', fontsize=15)
        plt.show()

        saver.save(sess, MODEL_SAVE_PATH)

def main(argv=None):
    mnist = input_data.read_data_sets(
        'E:/User-Duanduan/python/Deep-Learning/tensorflow/data/MNIST_data/', one_hot=True)
    train(mnist)

if __name__ == '__main__':
    tf.app.run()
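
The script pins learning_rate at 0.1; the commented-out alternative is an exponentially decaying schedule built from the script's own constants. A sketch of how that schedule would behave (MNIST has 55,000 training images, so one decay period is roughly 430 steps):

# Sketch: evaluate the decayed learning rate at a few step counts.
import tensorflow as tf

global_step = tf.Variable(0, trainable=False)
decayed_lr = tf.train.exponential_decay(
    learning_rate=0.8,          # LEARNING_RATE_BASE
    global_step=global_step,
    decay_steps=55000 // 128,   # num_examples / BATCH_SIZE
    decay_rate=0.99)            # LEARNING_RATE_DECAY

with tf.Session() as sess:
    sess.run(tf.global_variables_initializer())
    for step in [0, 1000, 10000, 30000]:
        sess.run(tf.assign(global_step, step))
        print(step, sess.run(decayed_lr))   # shrinks by 1% every ~430 steps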
Part 3: Test set
# Evaluate the trained model
import tensorflow as tf
from tensorflow.examples.tutorials.mnist import input_data
import matplotlib.pyplot as plt
import numpy as np
import mnist_inference
import mnist_train

BATCH_SIZE = 10000

def evaluate(mnist):
    with tf.Graph().as_default() as g:
        # Define the input and output placeholders
        x = tf.placeholder(tf.float32,
                           [BATCH_SIZE, mnist_inference.IMAGE_SIZE, mnist_inference.IMAGE_SIZE,
                            mnist_inference.NUM_CHANNELS], name='x-input')
        y_ = tf.placeholder(tf.float32, [BATCH_SIZE, mnist_inference.OUTPUT_NODE], name='y-input')

        # Batch evaluation graph
        y = mnist_inference.inference(x, None, None, train=False, reuse=False)
        correct_prediction = tf.equal(tf.argmax(y, 1), tf.argmax(y_, 1))
        accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))

        # Load the test images
        xs = mnist.test.images
        xs = np.reshape(xs, [BATCH_SIZE, mnist_inference.IMAGE_SIZE,
                             mnist_inference.IMAGE_SIZE, mnist_inference.NUM_CHANNELS])
        test_feed = {x: xs, y_: mnist.test.labels}

        # Single-image test
        show_image = mnist.test.images[5000]
        label = mnist.test.labels[5000]
        flatten_image = np.reshape(show_image, [1, mnist_inference.IMAGE_SIZE,
                                                mnist_inference.IMAGE_SIZE,
                                                mnist_inference.NUM_CHANNELS])
        actual_label = np.argmax(label)
        x_test = tf.placeholder(tf.float32,
                                [1, mnist_inference.IMAGE_SIZE, mnist_inference.IMAGE_SIZE,
                                 mnist_inference.NUM_CHANNELS], name='x-input')
        y_test = mnist_inference.inference(x_test, None, None, train=False, reuse=tf.AUTO_REUSE)
        pred_label = tf.argmax(y_test, 1)

        # Restore the moving-average (shadow) values of the variables
        variable_averages = tf.train.ExponentialMovingAverage(mnist_train.MOVING_AVERAGE_DECAY)
        variable_to_restore = variable_averages.variables_to_restore()
        saver = tf.train.Saver(variable_to_restore)

        with tf.Session() as sess:
            # Load the model; the path must match what the training script saved
            saver.restore(sess, mnist_train.MODEL_SAVE_PATH)
            # Batch test
            accuracy_score = sess.run(accuracy, feed_dict=test_feed)
            print('Test accuracy is %g%%' % (accuracy_score * 100))
            # Single-image test
            result = sess.run(pred_label, feed_dict={x_test: flatten_image})
            print('Actual: %d, prediction: %d' % (actual_label, result[0]))
            plt.figure('Show')
            plt.imshow(np.reshape(show_image, [28, 28]))
            plt.show()

def main(argv=None):
    mnist = input_data.read_data_sets(
        'E:/User-Duanduan/python/Deep-Learning/tensorflow/data/MNIST_data/', one_hot=True)
    evaluate(mnist)

if __name__ == '__main__':
    tf.app.run()
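
One point worth spelling out: the Saver in this script is built from variables_to_restore(), which maps each shadow-variable name in the checkpoint onto the corresponding graph variable, so the restored weights are the moving-average values rather than the raw trained ones. A tiny sketch of that mapping:

# Sketch: what variables_to_restore() produces for a single trainable variable.
import tensorflow as tf

v = tf.Variable(0.0, name='v')
ema = tf.train.ExponentialMovingAverage(0.99)
print(ema.variables_to_restore())
# {'v/ExponentialMovingAverage': <tf.Variable 'v:0' shape=() dtype=float32>}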