tensorflow 學習筆記13 RNN LSTM結構預測正弦(sin)函式

阿新 • • 發佈：2019-02-05

import tensorflow as tf
import numpy as np
import matplotlib.pyplot as plt


# Index of the first sample of the next batch; get_batch() advances it by
# TIME_STEPS on every call.
BATCH_START = 0
# Number of time steps in each training sequence.
TIME_STEPS = 20
# Number of sequences per batch.
BATCH_SIZE = 50
# Feature dimension of each input time step.
INPUT_SIZE = 1
# Feature dimension of each predicted time step.
OUTPUT_SIZE = 1
# Number of hidden units, used as the LSTM cell size and as the width of the
# input projection.
CELL_SIZE = 10
# Learning rate passed to the Adam optimizer.
LR = 0.006

# Data input function.
# Walks along the sample axis: each call slices out the next
# BATCH_SIZE * TIME_STEPS * INPUT_SIZE chunk used as training input.
def get_batch():
    """Return the next training batch of sin/cos sequences.

    Reads the module-level BATCH_START, TIME_STEPS and BATCH_SIZE, and
    advances BATCH_START by TIME_STEPS as a side effect, so consecutive
    calls return windows shifted by TIME_STEPS samples.

    Returns:
        A list ``[seq, res, xs]`` where ``seq`` is ``sin(xs)`` and ``res`` is
        ``cos(xs)``, both with shape (BATCH_SIZE, TIME_STEPS, 1), and ``xs``
        is the sample positions with shape (BATCH_SIZE, TIME_STEPS).
    """
    global BATCH_START
    n_points = TIME_STEPS * BATCH_SIZE
    sample_idx = np.arange(BATCH_START, BATCH_START + n_points)
    # Lay the consecutive indices out as (batch, step) and rescale them.
    xs = sample_idx.reshape((BATCH_SIZE, TIME_STEPS)) / (10 * np.pi)
    seq, res = np.sin(xs), np.cos(xs)
    BATCH_START += TIME_STEPS
    # np.newaxis is an alias of None; it appends the trailing input axis so
    # seq and res become (batch, step, input).
    return [seq[:, :, np.newaxis], res[:, :, np.newaxis], xs]


class LSTMRNN(object):
    """Linear input layer -> LSTM -> linear output layer, trained with Adam.

    The whole graph is built in the constructor. After construction the
    instance exposes the placeholders ``xs`` / ``ys``, the LSTM state tensors
    ``cell_init_state`` / ``cell_final_state``, the prediction ``pred``, the
    scalar ``cost`` and the training op ``train_op``.
    """

    def __init__(self, n_steps, input_size, output_size, cell_size, batch_size):
        """Store the hyper-parameters and build the graph.

        Args:
            n_steps: number of time steps per sequence.
            input_size: feature size of each input step.
            output_size: feature size of each output step.
            cell_size: number of LSTM hidden units.
            batch_size: number of sequences per batch; used for the LSTM
                zero state and for the loss weights.
        """
        self.n_steps = n_steps
        self.input_size = input_size
        self.output_size = output_size
        self.cell_size = cell_size
        self.batch_size = batch_size

        with tf.name_scope('inputs'):
            self.xs = tf.placeholder(tf.float32, [None, n_steps, input_size], name='xs')
            self.ys = tf.placeholder(tf.float32, [None, n_steps, output_size], name='ys')

        # The three layers are built in order, each inside its own variable
        # scope so the shared 'weights' / 'biases' variable names do not clash.
        layer_builders = (
            ('in_hidden', self.add_input_layer),
            ('LSTM_cell', self.add_cell),
            ('out_hidden', self.add_output_layer),
        )
        for scope_name, build_layer in layer_builders:
            with tf.variable_scope(scope_name):
                build_layer()

        with tf.name_scope('cost'):
            self.compute_cost()
        with tf.name_scope('train'):
            optimizer = tf.train.AdamOptimizer(LR)
            self.train_op = optimizer.minimize(self.cost)

    def add_input_layer(self):
        """Project every input step to ``cell_size`` features; sets ``l_in_y``."""
        # Flatten to 2-D for the matmul:
        # (batch, n_steps, input_size) -> (batch * n_steps, input_size).
        flat_inputs = tf.reshape(self.xs, [-1, self.input_size], name='2_2D')
        # weights: (input_size, cell_size)
        weights = self._weight_variable([self.input_size, self.cell_size])
        # biases: (cell_size,)
        biases = self._bias_variable([self.cell_size])
        # projected: (batch * n_steps, cell_size)
        with tf.name_scope('Wx_plus_b'):
            projected = tf.matmul(flat_inputs, weights) + biases
        # Restore the time axis:
        # (batch * n_steps, cell_size) -> (batch, n_steps, cell_size).
        self.l_in_y = tf.reshape(projected, [-1, self.n_steps, self.cell_size], name='2_3D')

    def add_cell(self):
        """Run a BasicLSTMCell over ``l_in_y``.

        Sets ``cell_init_state`` (zero state for ``batch_size`` sequences),
        ``cell_outputs`` and ``cell_final_state``.
        """
        cell = tf.contrib.rnn.BasicLSTMCell(self.cell_size, forget_bias=1.0, state_is_tuple=True)
        with tf.name_scope('initial_state'):
            self.cell_init_state = cell.zero_state(self.batch_size, dtype=tf.float32)
        rnn_outputs, rnn_final_state = tf.nn.dynamic_rnn(
            cell,
            self.l_in_y,
            initial_state=self.cell_init_state,
            time_major=False,
        )
        self.cell_outputs = rnn_outputs
        self.cell_final_state = rnn_final_state

    def add_output_layer(self):
        """Map every LSTM output step to ``output_size`` features; sets ``pred``."""
        # Flatten to 2-D for the matmul:
        # (batch, n_steps, cell_size) -> (batch * n_steps, cell_size).
        flat_outputs = tf.reshape(self.cell_outputs, [-1, self.cell_size], name='2_2D')
        weights = self._weight_variable([self.cell_size, self.output_size])
        biases = self._bias_variable([self.output_size])
        # pred: (batch * n_steps, output_size)
        with tf.name_scope('Wx_plus_b'):
            self.pred = tf.matmul(flat_outputs, weights) + biases

    def compute_cost(self):
        """Build the training cost; sets ``cost`` and registers a 'cost' summary.

        Predictions and targets are flattened to 1-D and handed to
        ``sequence_loss_by_example`` as a single-step sequence with all-ones
        weights. ``ms_error`` is supplied as the loss function, so each element
        contributes its squared error rather than a softmax cross-entropy.
        """
        flat_pred = tf.reshape(self.pred, [-1], name='reshape_pred')
        flat_target = tf.reshape(self.ys, [-1], name='reshape_target')
        unit_weights = tf.ones([self.batch_size * self.n_steps], dtype=tf.float32)
        losses = tf.contrib.legacy_seq2seq.sequence_loss_by_example(
            [flat_pred],
            [flat_target],
            [unit_weights],
            average_across_timesteps=True,
            softmax_loss_function=self.ms_error,
            name='losses'
        )
        with tf.name_scope('average_cost'):
            # Sum the losses, then divide by batch_size to get the cost per
            # sequence in the batch.
            total_loss = tf.reduce_sum(losses, name='losses_sum')
            self.cost = tf.div(total_loss, self.batch_size, name='average_cost')
            tf.summary.scalar('cost', self.cost)

    def ms_error(self, labels, logits):
        """Return the element-wise squared difference ``(labels - logits) ** 2``."""
        difference = tf.subtract(labels, logits)
        return tf.square(difference)

    def _weight_variable(self, shape, name='weights'):
        """Get or create a variable of ``shape`` initialised from N(0, 1)."""
        normal_init = tf.random_normal_initializer(mean=0., stddev=1.)
        return tf.get_variable(shape=shape, initializer=normal_init, name=name)

    def _bias_variable(self, shape, name='biases'):
        """Get or create a variable of ``shape`` initialised to the constant 0.1."""
        constant_init = tf.constant_initializer(0.1)
        return tf.get_variable(name=name, shape=shape, initializer=constant_init)


if __name__ == '__main__':
    # Build the model graph, then open a session and a summary writer on it.
    model = LSTMRNN(TIME_STEPS, INPUT_SIZE, OUTPUT_SIZE, CELL_SIZE, BATCH_SIZE)
    sess = tf.Session()
    merged = tf.summary.merge_all()
    writer = tf.summary.FileWriter("桌面/logs/", sess.graph)

    init = tf.global_variables_initializer()
    sess.run(init)

    # Interactive mode so the plot refreshes while training runs.
    plt.ion()
    plt.show()
    try:
        for i in range(200):
            seq, res, xs = get_batch()
            # The model learns the mapping sin(x) -> cos(x): given sin(x0) as
            # input it is trained to output the corresponding cos(x0).
            feed_dict = {
                model.xs: seq,
                model.ys: res,
            }
            if i > 0:
                # Use the final LSTM state of the previous run as the initial
                # state for this run. On the first iteration nothing is fed,
                # so the graph's zero state is used.
                feed_dict[model.cell_init_state] = state

            _, cost, state, pred = sess.run(
                [model.train_op, model.cost, model.cell_final_state, model.pred],
                feed_dict=feed_dict)

            # Plot target (red) against prediction (dashed blue) for the first
            # sequence of the batch.
            plt.plot(xs[0, :], res[0].flatten(), 'r', xs[0, :], pred.flatten()[:TIME_STEPS], 'b--')
            plt.ylim((-1.2, 1.2))
            plt.draw()
            plt.pause(0.3)

            if i % 20 == 0:
                print('cost: ', round(cost, 4))
                result = sess.run(merged, feed_dict)
                # Must stay inside this branch: it logs the summary that was
                # just computed, under the step it belongs to.
                writer.add_summary(result, i)
    finally:
        # Flush pending summary events to disk and release the session.
        writer.close()
        sess.close()

結果：

tensorflow 學習筆記13 RNN LSTM結構預測正弦(sin)函式

import tensorflow as tf import numpy as np import matplotlib.pyplot as plt BATCH_START = 0 TIME_STEPS = 20 BATCH_SIZE = 50 INPUT_SIZE =

python3學習筆記13（資料結構）

參考http://www.runoob.com/python3/python3-data-structure.html 列表列表是可修改的。列表方法讓列表可以方便的作為一個堆疊來使用，堆疊作為特定的資料結構，最先進入的元素最後一個被釋放（後進先出）。其中用append()方法可以把一個元素新增的

Tensorflow學習筆記（五）——結構化模型及Skip-gram模型的實現

一、結構化模型結構化我們的模型，可以方便我們Debug和良好的視覺化。一般我們的模型都是由以下兩步構成，第一步是構建計算圖，第二步是執行計算圖。 Assemble Graph Define placeholders for Inp

Tensorflow 學習筆記之使用LSTM實現MNIST資料集

LSTM實現MNIST手寫集識別這幾天剛好看了RNN之後瞭解了LSTM（原理可以去參考這個）。雖然LSTM主要用於處理自然語言、語音、機器人翻譯等領域，但圖片也可以看做一個有序列的資料。所以用LSTM

【TensorFlow】LSTM（使用TFLearn預測正弦sin函式）

專案已上傳至 GitHub —— sin_pre 資料生成因為標準的迴圈神經網路模型預測的是離散的數值，所以需要將連續的 sin 函式曲線離散化所謂離散化就是在一個給定的區間 [0,MAX] 內，通過有限個取樣點模擬一個連續的曲線，即間

tensorflow 學習筆記12 迴圈神經網路RNN LSTM結構實現MNIST手寫識別

長短時記憶網路（LSTM）就是為了解決在複雜的場景中，有用資訊的間隔有大有小、長短不一問題。LSTM是一種擁有三個門結構的特殊網路結構。 LSTM靠一些門的結構讓資訊有選擇的影響迴圈神經網路中每個時刻的狀態。所謂門的結構就是一個使用sigmoid神經網路和按位做乘法的操作

Tensorflow學習筆記——基本結構

tensorflow構建神經網路的基本框架 1：匯入模組，生成資料 import 常量定義生成資料集 2：前向傳播定義輸入，輸出 x = y_= W1 = W2 = …

Tensorflow學習筆記-基於LeNet5結構的ORL資料集人臉識別

參考文獻: 《基於卷積神經網路的人臉識別研究》李春利，柳振東，惠康華文章中基於經典的網路LeNet-5的結構，提出了一種適用於ORL資料集的CNN結構，在該資料集上取得了較高的識別率。本文是在參考此論文的基礎上，使用tensorflow實現了文中相關

TensorFlow學習筆記（1）：LSTM相關程式碼

LSTM是seq2seq模型中經典的子結構，TensorFlow中提供了相應的結構，供我們使用： tensorflow提供了LSTM實現的一個basic版本，不包含lstm的一些高階擴充套件，同時也提供了一個標準介面，其中包含了lstm的擴充套件。分別為：tf.nn.rnn

tensorflow學習筆記(三十九) : 雙向rnn (BiRNN)

雙向RNN實際上僅僅是兩個獨立的RNN放在一起, 本博文將介紹如何在tensorflow中實現雙向rnn 單層雙向rnn 單層雙向rnn (cs224d) tensorflow中已經提供了雙向rnn的介面,它就是tf.nn.bidirectional_dyna

tensorflow學習筆記——模型持久化的原理，將CKPT轉為pb檔案，使用pb模型預測

　　由題目就可以看出，本節內容分為三部分，第一部分就是如何將訓練好的模型持久化，並學習模型持久化的原理，第二部分就是如何將CKPT轉化為pb檔案，第三部分就是如何使用pb模型進行預測。一，模型持久化　　為了讓訓練得到的模型儲存下來方便下次直接呼叫，我們需要將訓練得到的神經網路模型持久化。下面學習通過Ten

Java學習筆記-13.創建窗口和程序片

pri let tostring 離開窗口 dbo solid n) height 1.init()方法：程序片第一次被創建，初次運行初始化程序片時調用。 start()方法：每當程序片進入web瀏覽器中，並且允許程序片啟動他的常規操作時調用（特殊的程序片被sto

tensorflow學習筆記（二）

example initial turn rate mnist pac rac test mode import tensorflow as tfimport numpy as npimport mathimport tensorflow.examples.tutorial

python 學習筆記 13 -- 經常使用的時間模塊之time

分鐘英文超過最好還原 %x tracking 運動文檔 Python 沒有包括相應日期和時間的內置類型。只是提供了3個相應的模塊，能夠採用多種表示管理日期和時間值： * time 模塊由底層C庫提供與時間相關的函數。它包括一些函數

tensorflow學習筆記(三)：實現自編碼器

sea start ear var logs cos soft 編碼 red 黃文堅的tensorflow實戰一書中的第四章，講述了tensorflow實現多層感知機。Hiton早年提出過自編碼器的非監督學習算法，書中的代碼給出了一個隱藏層的神經網絡，本人擴展到了多層，改進

Tensorflow - Tutorial (7) : 利用 RNN/LSTM 進行手寫數字識別

ddc htm net sets 手寫 n-2 align csdn global 1. 經常使用類 class tf.contrib.rnn.BasicLSTMCell BasicLSTMCell 是最簡單的一個LSTM類。沒有實現clippi

springmvc學習筆記(13)-springmvc註解開發之集合類型參數綁定

return 可擴展性 list .net items trac class javascrip lin springmvc學習筆記(13)-springmvc註解開發之集合類型參數綁定

TensorFlow學習筆記（UTF-8 問題解決 UnicodeDecodeError: 'utf-8' codec can't decode byte 0xff in position 0: invalid start byte）

show 學習 github red star ims fas can pri 我使用VS2013 Python3.5 TensorFlow 1.3 的開發環境 UnicodeDecodeError: ‘utf-8‘ codec can‘t decode byte

pandas模塊學習筆記1--數據結構

名稱 pandas taf 不同函數標記數據標簽命名 port pandas是基於Numpy構建的。 pandas的兩個主要數據結構：Series和DataFrame。 Series和DataFrame用的次數非常多，將其導入本地命名空間會更方便： from pa

Hadoop學習筆記—13.分布式集群中節點的動態添加與下架

情況好的當前每次原因修改輸入 task tle 開篇：在本筆記系列的第一篇中，我們介紹了如何搭建偽分布與分布模式的Hadoop集群。現在，我們來了解一下在一個Hadoop分布式集群中，如何動態（不關機且正在運行的情況下）地添加一個Hadoop節點與下架一個Had

tensorflow 學習筆記13 RNN LSTM結構預測正弦(sin)函式

相關推薦