Tensorflow實現Xavier初始化、權重寫入L2正則、新增LRN層

阿新 • • 發佈：2018-12-14

源自Tensorflow實戰的黃文堅、唐源書中的啟發：

def xavier_init(fan_in, fan_out, constant = 1):
    """Sample a Xavier (Glorot) uniform initial value for a weight matrix.

    Args:
        fan_in: Number of input units; first dimension of the result.
        fan_out: Number of output units; second dimension of the result.
        constant: Scale factor applied to the sampling bound.

    Returns:
        A float32 tensor of shape (fan_in, fan_out) drawn uniformly between
        -bound and +bound, where
        bound = constant * sqrt(6 / (fan_in + fan_out)).
    """
    bound = constant * np.sqrt(6.0 / (fan_in + fan_out))
    return tf.random_uniform(shape=(fan_in, fan_out),
                             minval=-bound,
                             maxval=bound,
                             dtype=tf.float32)
# Initialisation: w1 is sampled with xavier_init, w2 starts at all zeros.
# NOTE(review): n_input / n_hidden are defined outside this snippet.
w1 = tf.Variable(xavier_init(fan_in=n_input, fan_out=n_hidden))
w2 = tf.Variable(tf.zeros(shape=[n_hidden, n_input], dtype=tf.float32))

在權重初始化加入L2正則化以及LRN層的常用方法：

def variable_with_weight_loss(shape, stddev, wl):
    """Create a weight variable and optionally register its L2 penalty.

    Args:
        shape: Shape of the variable to create.
        stddev: Standard deviation of the truncated-normal initial value.
        wl: Coefficient multiplied with the variable's L2 loss. Pass None to
            register no penalty; any other value (including 0.0) adds a
            'weight_loss' term to the 'losses' collection.

    Returns:
        The newly created tf.Variable.
    """
    weights = tf.Variable(tf.truncated_normal(shape, stddev=stddev))
    if wl is None:
        return weights

    penalty = tf.multiply(tf.nn.l2_loss(weights), wl, name='weight_loss')
    tf.add_to_collection('losses', penalty)
    return weights

def loss(logits, labels):
    """Build the total training loss: mean cross-entropy plus weight penalties.

    The mean softmax cross-entropy is appended to the 'losses' collection,
    which also holds the terms registered by variable_with_weight_loss, and
    the sum of everything in that collection is returned.

    Args:
        logits: Unnormalised class scores, one row per example.
        labels: Integer class ids; cast to int64 before use.

    Returns:
        A scalar tensor named 'total_loss'.
    """
    labels = tf.cast(labels, tf.int64)
    cross_entropy = tf.nn.sparse_softmax_cross_entropy_with_logits(
        logits=logits, labels=labels, name='cross_entropy_per_example')
    cross_entropy_mean = tf.reduce_mean(cross_entropy, name='cross_entropy')
    tf.add_to_collection('losses', cross_entropy_mean)
    # Without this return the caller's `loss = loss(...)` would bind None.
    return tf.add_n(tf.get_collection('losses'), name='total_loss')

# Conv block 1: 5x5 convolution (3 -> 64 channels), ReLU, 3x3 stride-2
# max-pool, then local response normalisation. No L2 penalty (wl=0.0).
weight1 = variable_with_weight_loss(shape=[5, 5, 3, 64], stddev=5e-2, wl=0.0)
kernel1 = tf.nn.conv2d(image_holder, weight1,
                       strides=[1, 1, 1, 1], padding='SAME')
bias1 = tf.Variable(tf.constant(0.0, shape=[64]))
conv1 = tf.nn.relu(tf.nn.bias_add(kernel1, bias1))
pool1 = tf.nn.max_pool(conv1,
                       ksize=[1, 3, 3, 1],
                       strides=[1, 2, 2, 1],
                       padding='SAME')
norm1 = tf.nn.lrn(pool1, depth_radius=4, bias=1.0,
                  alpha=0.001 / 9.0, beta=0.75)

# Conv block 2: 5x5 convolution (64 -> 64 channels), ReLU; here the LRN is
# applied before the max-pool (the reverse of block 1).
weight2 = variable_with_weight_loss(shape=[5, 5, 64, 64], stddev=5e-2, wl=0.0)
kernel2 = tf.nn.conv2d(norm1, weight2,
                       strides=[1, 1, 1, 1], padding='SAME')
bias2 = tf.Variable(tf.constant(0.1, shape=[64]))
conv2 = tf.nn.relu(tf.nn.bias_add(kernel2, bias2))
norm2 = tf.nn.lrn(conv2, depth_radius=4, bias=1.0,
                  alpha=0.001 / 9.0, beta=0.75)
pool2 = tf.nn.max_pool(norm2,
                       ksize=[1, 3, 3, 1],
                       strides=[1, 2, 2, 1],
                       padding='SAME')

# Fully connected layer 3: flatten each example, then 384 ReLU units with an
# L2 penalty on the weights (wl=0.004).
reshape = tf.reshape(pool2, shape=[batch_size, -1])
dim = reshape.get_shape()[1].value
weight3 = variable_with_weight_loss(shape=[dim, 384], stddev=0.04, wl=0.004)
bias3 = tf.Variable(tf.constant(0.1, shape=[384]))
local3 = tf.nn.relu(tf.matmul(reshape, weight3) + bias3)

# Fully connected layer 4: 192 ReLU units, same L2 coefficient.
weight4 = variable_with_weight_loss(shape=[384, 192], stddev=0.04, wl=0.004)
bias4 = tf.Variable(tf.constant(0.1, shape=[192]))
local4 = tf.nn.relu(tf.matmul(local3, weight4) + bias4)

# Output layer: 10 linear logits (the softmax is applied inside the loss).
weight5 = variable_with_weight_loss(shape=[192, 10], stddev=1/192.0, wl=0.0)
bias5 = tf.Variable(tf.constant(0.0, shape=[10]))
logits = tf.add(tf.matmul(local4, weight5), bias5)

# NOTE: this rebinds the name `loss` from the function to its result tensor.
loss = loss(logits, label_holder)

完整程式碼如下：

import math
import time

import numpy as np
import tensorflow as tf

import cifar10
import cifar10_input

# Number of iterations run by the training loop below.
max_steps = 3000
# Examples per batch; also fixes the leading dimension of the placeholders.
batch_size = 128
# Directory passed to the cifar10_input readers as `data_dir`.
data_dir = '/tmp/cifar10_data/cifar-10-batches-bin'


def variable_with_weight_loss(shape, stddev, wl):
    """Create a weight variable and optionally register its L2 penalty.

    Args:
        shape: Shape of the variable to create.
        stddev: Standard deviation of the truncated-normal initial value.
        wl: Coefficient multiplied with the variable's L2 loss. Pass None to
            register no penalty; any other value (including 0.0) adds a
            'weight_loss' term to the 'losses' collection.

    Returns:
        The newly created tf.Variable.
    """
    weights = tf.Variable(tf.truncated_normal(shape, stddev=stddev))
    if wl is None:
        return weights

    penalty = tf.multiply(tf.nn.l2_loss(weights), wl, name='weight_loss')
    tf.add_to_collection('losses', penalty)
    return weights


def loss(logits, labels):
    """Combine the cross-entropy loss with the registered weight penalties.

    The mean softmax cross-entropy is appended to the 'losses' collection and
    the sum of every tensor in that collection is returned.

    Args:
        logits: Unnormalised class scores, one row per example.
        labels: Integer class ids; cast to int64 before use.

    Returns:
        A scalar tensor named 'total_loss'.
    """
    per_example = tf.nn.sparse_softmax_cross_entropy_with_logits(
        logits=logits,
        labels=tf.cast(labels, tf.int64),
        name='cross_entropy_per_example')
    tf.add_to_collection(
        'losses', tf.reduce_mean(per_example, name='cross_entropy'))
    return tf.add_n(tf.get_collection('losses'), name='total_loss')
  


# Dataset download/extraction is delegated to the cifar10 helper module.
cifar10.maybe_download_and_extract()

# Training inputs come from cifar10_input.distorted_inputs.
images_train, labels_train = cifar10_input.distorted_inputs(
    data_dir=data_dir, batch_size=batch_size)

# Evaluation inputs (eval_data=True) from the same directory.
images_test, labels_test = cifar10_input.inputs(
    eval_data=True, data_dir=data_dir, batch_size=batch_size)

# Feed points for one batch of 24x24x3 float32 images and int32 labels.
image_holder = tf.placeholder(tf.float32, shape=[batch_size, 24, 24, 3])
label_holder = tf.placeholder(tf.int32, shape=[batch_size])

# Network definition, built inline.
# Conv block 1: 5x5 convolution (3 -> 64 channels), ReLU, 3x3 stride-2
# max-pool, then local response normalisation. No L2 penalty (wl=0.0).
weight1 = variable_with_weight_loss(shape=[5, 5, 3, 64], stddev=5e-2, wl=0.0)
kernel1 = tf.nn.conv2d(image_holder, weight1,
                       strides=[1, 1, 1, 1], padding='SAME')
bias1 = tf.Variable(tf.constant(0.0, shape=[64]))
conv1 = tf.nn.relu(tf.nn.bias_add(kernel1, bias1))
pool1 = tf.nn.max_pool(conv1,
                       ksize=[1, 3, 3, 1],
                       strides=[1, 2, 2, 1],
                       padding='SAME')
norm1 = tf.nn.lrn(pool1, depth_radius=4, bias=1.0,
                  alpha=0.001 / 9.0, beta=0.75)

# Conv block 2: 5x5 convolution (64 -> 64 channels), ReLU; here the LRN is
# applied before the max-pool (the reverse of block 1).
weight2 = variable_with_weight_loss(shape=[5, 5, 64, 64], stddev=5e-2, wl=0.0)
kernel2 = tf.nn.conv2d(norm1, weight2,
                       strides=[1, 1, 1, 1], padding='SAME')
bias2 = tf.Variable(tf.constant(0.1, shape=[64]))
conv2 = tf.nn.relu(tf.nn.bias_add(kernel2, bias2))
norm2 = tf.nn.lrn(conv2, depth_radius=4, bias=1.0,
                  alpha=0.001 / 9.0, beta=0.75)
pool2 = tf.nn.max_pool(norm2,
                       ksize=[1, 3, 3, 1],
                       strides=[1, 2, 2, 1],
                       padding='SAME')

# Fully connected layer 3: flatten each example, then 384 ReLU units with an
# L2 penalty on the weights (wl=0.004).
reshape = tf.reshape(pool2, shape=[batch_size, -1])
dim = reshape.get_shape()[1].value
weight3 = variable_with_weight_loss(shape=[dim, 384], stddev=0.04, wl=0.004)
bias3 = tf.Variable(tf.constant(0.1, shape=[384]))
local3 = tf.nn.relu(tf.matmul(reshape, weight3) + bias3)

# Fully connected layer 4: 192 ReLU units, same L2 coefficient.
weight4 = variable_with_weight_loss(shape=[384, 192], stddev=0.04, wl=0.004)
bias4 = tf.Variable(tf.constant(0.1, shape=[192]))
local4 = tf.nn.relu(tf.matmul(local3, weight4) + bias4)

# Output layer: 10 linear logits (the softmax is applied inside the loss).
weight5 = variable_with_weight_loss(shape=[192, 10], stddev=1/192.0, wl=0.0)
bias5 = tf.Variable(tf.constant(0.0, shape=[10]))
logits = tf.add(tf.matmul(local4, weight5), bias5)

# NOTE: this rebinds the name `loss` from the function to its result tensor.
loss = loss(logits, label_holder)


# Adam with learning rate 1e-3 minimises the total loss.
# NOTE(review): the original line carried the bare remark "0.72" --
# presumably the precision reached with this setting; unverified.
optimizer = tf.train.AdamOptimizer(learning_rate=1e-3)
train_op = optimizer.minimize(loss)

# Per-example check that the label is among the top-1 predictions.
top_k_op = tf.nn.in_top_k(logits, label_holder, k=1)

# InteractiveSession installs itself as the default session.
sess = tf.InteractiveSession()
sess.run(tf.global_variables_initializer())

# Start the graph's queue runners.
# NOTE(review): assumes the cifar10_input pipelines are queue-based -- confirm.
tf.train.start_queue_runners()
# Training loop: fetch one training batch, run one optimiser step, and report
# loss and throughput on every 10th step.
for step in range(max_steps):
    start_time = time.time()
    image_batch, label_batch = sess.run([images_train, labels_train])
    _, loss_value = sess.run(
        [train_op, loss],
        feed_dict={image_holder: image_batch, label_holder: label_batch})
    # Covers both the batch fetch and the optimiser step.
    duration = time.time() - start_time

    if step % 10 != 0:
        continue

    examples_per_sec = batch_size / duration
    sec_per_batch = float(duration)
    format_str = ('step %d, loss = %.2f (%.1f examples/sec; %.3f sec/batch)')
    print(format_str % (step, loss_value, examples_per_sec, sec_per_batch))
# Evaluation: measure top-1 precision over the test input pipeline.
num_examples = 10000
# Divide as floats so the batch count is rounded up even where `/` on two
# ints truncates (Python 2); otherwise the final partial batch is dropped.
num_iter = int(math.ceil(num_examples / float(batch_size)))
true_count = 0
# Whole batches are evaluated, so this can exceed num_examples.
total_sample_count = num_iter * batch_size
for step in range(num_iter):
    image_batch, label_batch = sess.run([images_test, labels_test])
    # Fetch the op itself rather than a one-element list of it.
    predictions = sess.run(top_k_op,
                           feed_dict={image_holder: image_batch,
                                      label_holder: label_batch})
    true_count += np.sum(predictions)

# Float division keeps the ratio from truncating to 0 under Python 2.
precision = float(true_count) / total_sample_count
print('precision @ 1 = %.3f' % precision)

Tensorflow實現Xavier初始化、權重寫入L2正則、新增LRN層

源自Tensorflow實戰的黃文堅、唐源書中的啟發： def xavier_init(fan_in, fan_out, constant = 1): low = -constant * np.sqrt(6.0 / (fan_in + fan_out))

訓練過程--正則化(regularization)技巧(包括L2正則化、dropout，資料增廣，早停)

正則化（regularization）正則化是解決高方差問題的重要方案之一，也是Reducing Overfitting（克服過擬合）的方法。過擬合一直是DeepLearning的大敵，它會導致訓練集的error rate非常小，而測試集的error rate大部分時候很

為什麼L1正則項產生稀疏的權重，L2正則項產生相對平滑的權重

L1 和 L2 正則項的定義如下： $L_1 = \sum_i |w_i|$，$L_2 = \sum_i w_i^2$

倍福TwinCAT(貝福Beckhoff)常見問題(FAQ)-如何在初始化的時候寫入參數

是不是 dsw 通過介紹變量 main.c red word 是我最常見的是定義一個全局變量，然後跟對應的變量綁定，比如我定義了一個SINT型的變量ControlWord 數值是8，定義好之後編譯一下，可以發現PLC程序中或多出來這個變量（MAIN.ControlWo

MOOC清華《面向對象程序設計》第8章：用代理模式實現延遲初始化

blank ngx cin www. oci 初始化 lanp margin 程序 Z9閃5PFVL衣坑9http://shequ.docin.com/zdfi78227 哦3O8b4z宦塹7http://huiyi.docin.com/dvok6368 W34搜6csiy

關於並發場景下，通過雙重檢查鎖實現延遲初始化的優化問題隱患的記錄

ron href 修飾符屬性 tin 記錄 targe turn 優化問題　　首先，這個問題是從《阿裏巴巴Java開發手冊》的1.6.12（P31）上面看到的，裏面有這樣一句話，並列出一種反例代碼（以下為仿寫，並非與書上一致）：　　在並發場景下，通過雙重檢查鎖（do

pytorch系列 -- 9 pytorch nn.init 中實現的初始化函式 uniform, normal, const, Xavier, He initialization

本文內容： 1. Xavier 初始化 2. nn.init 中各種初始化函式 3. He 初始化 torch.init https://pytorch.org/docs/stable/nn.html#torch-nn-init 1. 均勻分佈 torch.nn.init.u

tensorflow-單變數初始化

# -*- coding: utf-8 -*- """ Spyder Editor This is a temporary script file. """ import tensorflow as tf a=tf.Variable(6,dtype=tf.int32) b=tf.Variable(3,dt

深度學習筆記：tensorflow 入門變數初始化

# 變數op # 1、變數能夠持久化儲存，普通的張量op是不行的 # 2、當定義一個變數op的時候，一定要在會話當中去執行初始化 a = tf.constant([1, 2, 3, 4, 5]) var = tf.Variable(tf.random_no

Spring IOC/BeanFactory/ApplicationContext的工作流程/實現原理/初始化/依賴注入原始碼詳解

Spring的工作流程/實現原理之基石IOC/BeanFactory/ApplicationContext 更新1：2017/11/23更新2:2018/1/30（截圖）一、什麼是IOC容器？IOC(Inversion of Control)、控制反轉亦稱依賴注入.IOC容器

初始化塊和構造器的比較、總結

初始化塊分為：靜態初始化塊和普通初始化塊。在定義初始化塊時使用了static修飾符，靜態初始化塊（也叫做類初始化塊）；否則，就是普通初始化塊。與靜態方法、非靜態方法的理解其實類似，普通初始化塊負責對物件執行初始化，類初始化塊負責對類執行初始化。為了更好地區分，上一段程式碼：p

SparkContext的初始化（季篇）——測量系統、ContextCleaner及環境更新

《深入理解Spark：核心思想與原始碼分析》一書第一章的內容請看連結《第1章環境準備》《深入理解Spark：核心思想與原始碼分析》一書第二章的內容請看連結《第2章 SPARK設計理念與基本架構》由於本書的第3章內容較多，所以打算分別開闢四篇隨筆分別展現。本文展現第3章第三部分的內

Spring類註冊不上，applicationContext不初始化，在Filter中無法getBean、使用Dao、Service等

新建一個xml檔案，裡面複製下面內容： <?xml version="1.0" encoding="UTF-8"?> <!DOCTYPE beans PUBLIC "-//SPRING//DTD BEAN//EN" "http://www.springf

C#效能優化之Lazy 實現延遲初始化

　在.NET4.0中，可以使用Lazy<T> 來實現物件的延遲初始化，從而優化系統的效能。延遲初始化就是將物件的初始化延遲到第一次使用該物件時。延遲初始化是我們在寫程式時經常會遇到的情形，例如建立某一物件時需要花費很大的開銷，而這一物件在系統的執行過程中不

WebView深究之Android是如何實現webview初始化的

webview初始化關注Android載入webview核心的過程。我們從WebView的init過程中切入。 WebView的構造方法,最終都會呼叫 WebView(Context context, AttributeSet attrs, int

神經網路模型無法正常工作時我們應該做什麼（系列）——初始化網路權重（Initialized Network Weights）

前言當你進入深度學習領域，準備好深度神經網路，開始進行訓練時，遇到這樣一個大部分新手都會遇到的問題：你的神經網路沒法正常工作，而你不知道該如何去修正它。你去問你的老闆或者導師，他們也不知道該如何處理，因為在深度神經網路面前，他們和你一樣也是新手。

tensorflow下已經初始化，但還是存在 Attempting to use uninitialized value的解決方案

執行tensorflow後，程式報錯： FailedPreconditionError (see above for traceback): Attempting to use uninitialized value beta1_power [[Node: b

L2正則化—tensorflow實現

L2正則化是一種減少過擬合的方法，在損失函式中加入刻畫模型複雜程度的指標。假設損失函式是 $J(\theta)$，則優化的是 $J(\theta)+\lambda R(w)$，$R(w)=\sum_{i=0}^{n} |w_i^2|$。在tensorflow中的具體實現過

Python基礎(正則、序列化、常用模塊和面向對象)-day06

.net 支持 tro sub 商城 pytho font spa 要求寫在前面上課第六天，打卡：　　　　天地不仁，以萬物為芻狗；一、正則　　- 　　- 在線正則工具：http://tool.oschina.net/regex/ 　　-

TensorFlow(三) 用TensorFlow實現L2正則損失函數線性回歸算法

glob ini upper ace arr 算法 var 增加初始化 import tensorflow as tf import numpy as np import matplotlib.pyplot as plt from sklearn import dat

Tensorflow實現Xavier初始化、權重寫入L2正則、新增LRN層

源自Tensorflow實戰的黃文堅、唐源書中的啟發：

相關推薦