RNN中利用LSTM來預測sin函式

阿新 • • 發佈：2018-12-16

前言：這個例子是用LSTM來預測sin函式的問題，期間遇到了一個十分致命的問題，就是構造資料的時候，沒有把資料構造成序列，所以一直在報維度上的錯誤。以後對時序問題的預測要格外注意資料是否是序列的資料，否則很難檢查出問題；中間的其他問題其實比較好看出來，一除錯就能解決。

這個例項來自於《TensorFlow實戰Google深度學習框架》

先給出錯誤的程式碼示例，以便給自己一個警醒。

# !/usr/bin/env python
# -*- coding:utf-8 -*-
# author:lxy

import numpy as np
import matplotlib.pyplot as plt
import tensorflow as tf

# Hyper-parameters and data-set sizes shared by the functions in this listing.
hidden_size = 30  # units per LSTM cell (argument to BasicLSTMCell)
num_layers = 2  # number of LSTM cells stacked inside MultiRNNCell
time_step = 10  # number of consecutive samples in one input window
train_steps = 10000  # number of training iterations run by trian()
batch_size = 32  # examples per training batch
train_examples =10000  # with time_step, sizes the training sine sequence
test_examples =1000  # sizes the test sine sequence and the evaluation loop
sample_gap = 0.01  # multiplier that turns sample counts into the x-range bounds

def generate_data(seq):
    """Slice a 1-D sequence into (input window, next value) pairs.

    NOTE: this is the article's deliberately faulty version. Each window is
    appended flat, so X comes out as (N, time_step) and y as (N,), where
    N = len(seq) - time_step. The article reports dimension errors caused by
    the data not being built as sequences; the corrected listing wraps every
    window and target in an extra list to add the missing axis.

    Args:
        seq: indexable 1-D sequence of samples (e.g. a NumPy array).

    Returns:
        Tuple (X, y) of float32 NumPy arrays.
    """
    X = []
    y = []
    for i in range(len(seq)-time_step):
        # The input is a window of time_step consecutive points of the sine
        # curve starting at i; the target is the value at index i+time_step.
        X.append(seq[i:i+time_step])
        y.append(seq[i+time_step])
    return np.array(X,dtype = np.float32),np.array(y,dtype = np.float32)

def lstm_model(X,y,is_training):
    """Build the stacked-LSTM regression graph (faulty first version).

    This listing is shown by the article as a cautionary example; two keyword
    names below are wrong and are marked with BUG comments rather than fixed.

    Args:
        X: input tensor passed to tf.nn.dynamic_rnn.
        y: label tensor used by the loss (ignored when not training).
        is_training: when false, only the prediction op is built.

    Returns:
        (prediction, loss, train_op); loss and train_op are None when
        is_training is false.
    """
    # Stack num_layers LSTM cells of hidden_size units each.
    cell = tf.nn.rnn_cell.MultiRNNCell([tf.nn.rnn_cell.BasicLSTMCell(hidden_size) 
    for _ in range(num_layers)])
    outputs,state = tf.nn.dynamic_rnn(cell,X,dtype = tf.float32)
    # Author's note: the last-step output is expected to match the final
    # state of the top layer (state[1]) - not verified in this file.
    output = outputs[:,-1,:] # last step along axis 1 (author: same as state[1])

    # Add one fully connected layer with a single output on top of the LSTM.
    # BUG (kept on purpose): the keyword is `activation_fn`, not `activation`;
    # the corrected listing uses activation_fn=None.
    prediction = tf.contrib.layers.fully_connected(output,1,activation = None)
    if not is_training:
        return prediction,None,None

    # Mean squared error between labels and predictions.
    # BUG (kept on purpose): the keyword is `predictions`, not `prediction`;
    # the corrected listing uses predictions=prediction.
    loss = tf.losses.mean_squared_error(labels=y,prediction=prediction)
    # Create the optimizer / training op (Adagrad, learning rate 0.1).
    train_op = tf.contrib.layers.optimize_loss(loss,tf.train.get_global_step(),
    optimizer ="Adagrad",learning_rate = 0.1)
    return prediction,loss,train_op

def trian(sess,train_x,train_y):
    """Build the training graph and run train_steps optimisation steps.

    (The function name is spelled "trian" in the original and is called by
    that name at the bottom of the listing.)

    Args:
        sess: TensorFlow session used to run the ops.
        train_x: training inputs produced by generate_data.
        train_y: training targets produced by generate_data.
    """
    # Feed the training data to the graph as a tf.data Dataset:
    # repeated indefinitely, shuffled with a 1000-element buffer, batched.
    ds = tf.data.Dataset.from_tensor_slices((train_x,train_y))
    ds = ds.repeat().shuffle(1000).batch(batch_size)
    X,y = ds.make_one_shot_iterator().get_next()

    # Build the model under the "model" scope to get the prediction,
    # the loss and the training op.
    with tf.variable_scope("model"):
        prediction,loss,train_op = lstm_model(X,y,True)

    # Initialise variables, then train and log the loss every 100 steps.
    sess.run(tf.global_variables_initializer())
    for i in range(train_steps):
        train_,l = sess.run([train_op,loss])
        if i%100==0:
            print("train_step:{0},loss is {1}".format(i,l))

def run_eval(sess,test_x,test_y):
    """Run the trained model over the test data, print the error and plot.

    Faulty first version kept as the article's exhibit; the plotting calls
    below use wrong keyword names (see BUG comments).

    Args:
        sess: session in which trian() has already created the variables.
        test_x: test inputs produced by generate_data.
        test_y: test targets produced by generate_data.
    """
    # One example per batch, in order, single pass.
    ds = tf.data.Dataset.from_tensor_slices((test_x,test_y))
    ds = ds.batch(1)
    X,y  = ds.make_one_shot_iterator().get_next()

    # Rebuild the model in inference mode under the same "model" scope with
    # reuse=True; the label argument is a placeholder value that is unused.
    with tf.variable_scope("model",reuse=True):
        test_prediction,test_loss,test_op = lstm_model(X,[0.0],False)
    # Predicted values.
    prediction = []
    # Ground-truth values.
    labels = []
    for i in range(test_examples):
        pre,l = sess.run([test_prediction,y])
        prediction.append(pre)
        labels.append(l)
    # Root-mean-square error is the evaluation metric (the printed label
    # says "Mean Square Error", but the value is the square root of the MSE).
    pre_squ=np.array(prediction).squeeze()
    lab_squ = np.array(labels).squeeze()
    rmse = np.sqrt(((pre_squ-lab_squ)**2).mean(axis = 0))
    print("Mean Square Error is :%f" % rmse)
    # Plot the predicted sine curve against the real one.
    # BUG (kept on purpose): `labels=` / `colors=` are not the keyword names
    # the corrected listing uses; it passes `label=` and `color=` instead.
    plt.figure()
    plt.plot(pre_squ,labels ='prediction',colors ='red')
    plt.plot(lab_squ,labels = 'real_sin',colors ='green')
    plt.show()

# Build the data sets: the training sequence samples sin(x) on [0, test_start]
# and the test sequence continues on [test_start, test_end]. Each sequence
# has time_step extra points so generate_data yields exactly
# train_examples / test_examples windows.
test_start = (train_examples+time_step)*sample_gap
test_end = test_start+(test_examples+time_step)*sample_gap
train_x,train_y = generate_data(np.sin(np.linspace(0,test_start,train_examples+time_step,dtype = np.float32)))
test_x,test_y = generate_data(np.sin(np.linspace(test_start,test_end,test_examples+time_step,
dtype=np.float32)))
# Debugging aid left by the author:
# print(train_x)
# print(train_y)

# Create the session, train the model, then evaluate it.
with tf.Session() as sess:
    trian(sess,train_x,train_y)
    run_eval(sess,test_x,test_y)

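最關鍵的錯誤：generate_data 裡沒有把每個樣本構造成序列。錯誤寫法是 X.append(seq[i:i+time_step]) 和 y.append(seq[i+time_step])，正確寫法要多包一層中括號：X.append([seq[i:i+time_step]]) 和 y.append([seq[i+time_step]])。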

期間還寫錯了下面兩行的引數名（activation 應為 activation_fn，prediction 應為 predictions）：

prediction = tf.contrib.layers.fully_connected(output,1,activation = None)

loss = tf.losses.mean_squared_error(labels=y,prediction=prediction)

# !/usr/bin/env python
# -*- coding:utf-8 -*-
# author:lxy

import numpy as np
import matplotlib.pyplot as plt
import tensorflow as tf

# Hyper-parameters and data-set sizes shared by the functions in this listing.
hidden_size = 30  # units per LSTM cell (argument to BasicLSTMCell)
num_layers = 2  # number of LSTM cells stacked inside MultiRNNCell
time_step = 10  # number of consecutive samples in one input window
train_steps = 10000  # number of training iterations run by trian()
batch_size = 32  # examples per training batch
train_examples =10000  # with time_step, sizes the training sine sequence
test_examples =1000  # with time_step, sizes the test sine sequence
sample_gap = 0.01  # multiplier that turns sample counts into the x-range bounds

def generate_data(seq):
    """Turn a 1-D sequence into sliding-window (input, target) arrays.

    For every start index s in range(len(seq) - time_step) the input is the
    window seq[s:s+time_step] and the target is the sample right after it,
    seq[s+time_step]. Each window and each target is wrapped in one extra
    list, so the results have shapes (N, 1, time_step) and (N, 1).

    Args:
        seq: indexable 1-D sequence of samples (e.g. a NumPy array).

    Returns:
        Tuple (X, y) of float32 NumPy arrays.
    """
    starts = range(len(seq) - time_step)
    windows = [[seq[s:s + time_step]] for s in starts]
    targets = [[seq[s + time_step]] for s in starts]
    inputs = np.array(windows, dtype=np.float32)
    labels = np.array(targets, dtype=np.float32)
    return inputs, labels

def lstm_model(X,y,is_training):
    """Build the stacked-LSTM regression graph.

    Args:
        X: input tensor passed to tf.nn.dynamic_rnn.
        y: label tensor used by the loss (ignored when not training).
        is_training: when false, only the prediction op is built.

    Returns:
        (prediction, loss, train_op); loss and train_op are None when
        is_training is false.
    """
    # Stack num_layers LSTM cells of hidden_size units each.
    layers = []
    for _ in range(num_layers):
        layers.append(
            tf.nn.rnn_cell.BasicLSTMCell(
                hidden_size, forget_bias=1.0, state_is_tuple=True))
    stacked_cell = tf.nn.rnn_cell.MultiRNNCell(layers)

    rnn_outputs, _ = tf.nn.dynamic_rnn(stacked_cell, X, dtype=tf.float32)
    # Keep only the output at the last position along axis 1.
    last_output = rnn_outputs[:, -1, :]

    # A single-output fully connected layer with no activation on top.
    prediction = tf.contrib.layers.fully_connected(
        last_output, 1, activation_fn=None)

    if is_training:
        # Mean squared error between labels and predictions.
        loss = tf.losses.mean_squared_error(labels=y, predictions=prediction)
        # Adagrad with learning rate 0.1, tied to the global step.
        train_op = tf.contrib.layers.optimize_loss(
            loss,
            tf.train.get_global_step(),
            optimizer="Adagrad",
            learning_rate=0.1)
        return prediction, loss, train_op

    return prediction, None, None

def trian(sess,train_x,train_y):
    """Build the training graph and run train_steps optimisation steps.

    Args:
        sess: TensorFlow session used to run the ops.
        train_x: training inputs produced by generate_data.
        train_y: training targets produced by generate_data.
    """
    # Input pipeline: repeat forever, shuffle with a 1000-element buffer,
    # then group into batches of batch_size.
    dataset = tf.data.Dataset.from_tensor_slices((train_x, train_y))
    dataset = dataset.repeat()
    dataset = dataset.shuffle(1000)
    dataset = dataset.batch(batch_size)
    iterator = dataset.make_one_shot_iterator()
    X, y = iterator.get_next()

    # Create the model variables under the "model" scope.
    with tf.variable_scope("model"):
        _, loss, train_op = lstm_model(X, y, True)

    sess.run(tf.global_variables_initializer())

    # Train, reporting the loss on every 100th step.
    for step in range(train_steps):
        _, loss_value = sess.run([train_op, loss])
        if step % 100 != 0:
            continue
        print("train_step:{0},loss is {1}".format(step, loss_value))

def run_eval(sess,test_x,test_y):
    """Run the trained model over the test data, print the RMSE and plot.

    Args:
        sess: session in which trian() has already created the variables.
        test_x: test inputs produced by generate_data.
        test_y: test targets produced by generate_data.
    """
    # One example per batch, in order, single pass.
    ds = tf.data.Dataset.from_tensor_slices((test_x,test_y))
    ds = ds.batch(1)
    X,y = ds.make_one_shot_iterator().get_next()

    # Rebuild the model in inference mode under the same "model" scope with
    # reuse=True; the label argument is a placeholder value that is unused.
    with tf.variable_scope("model",reuse=True):
        test_prediction,_,_ = lstm_model(X,[0.0],False)

    prediction = []  # predicted values
    labels = []  # ground-truth values
    # Iterate exactly once over the test set: the one-shot iterator yields
    # len(test_x) single-example batches, so the count comes from the data
    # rather than from a separate global that has to be kept in sync.
    for _ in range(len(test_x)):
        pre,l = sess.run([test_prediction,y])
        prediction.append(pre)
        labels.append(l)

    # Root-mean-square error is the evaluation metric. The printed label
    # says "Mean Square Error" although the value is the RMSE; the text is
    # left unchanged so the output matches previously recorded runs.
    pre_squ = np.array(prediction).squeeze()
    lab_squ = np.array(labels).squeeze()
    rmse = np.sqrt(((pre_squ-lab_squ)**2).mean(axis = 0))
    print("Mean Square Error is :%f" % (rmse))

    # Plot the predicted curve as a line and the real values as points.
    plt.figure()
    plt.plot(pre_squ,label ='prediction',linestyle ='-',color='r')
    # scatter() needs explicit x coordinates; use the sample index so the
    # points line up with the x axis that plot() uses implicitly.
    plt.scatter(np.arange(lab_squ.size),lab_squ,label = 'real_sin',color='green')
    plt.legend()
    plt.show()

# Build the data sets: the training sequence samples sin(x) on [0, test_start]
# and the test sequence continues on [test_start, test_end]. Each sequence
# has time_step extra points so generate_data yields exactly
# train_examples / test_examples windows.
test_start = (train_examples + time_step) * sample_gap
test_end = test_start + (test_examples + time_step) * sample_gap

train_grid = np.linspace(
    0, test_start, train_examples + time_step, dtype=np.float32)
test_grid = np.linspace(
    test_start, test_end, test_examples + time_step, dtype=np.float32)

train_x, train_y = generate_data(np.sin(train_grid))
test_x, test_y = generate_data(np.sin(test_grid))

# Create the session, train the model, then evaluate it.
with tf.Session() as sess:
    trian(sess, train_x, train_y)
    run_eval(sess, test_x, test_y)


.....
.....
.....
train_step:9100,loss is 4.266162250132766e-06
train_step:9200,loss is 5.570855591940926e-06
train_step:9300,loss is 3.8035254874557722e-06
train_step:9400,loss is 4.238047949911561e-06
train_step:9500,loss is 4.5835963646823075e-06
train_step:9600,loss is 4.353491931397002e-06
train_step:9700,loss is 3.338790065754438e-06
train_step:9800,loss is 4.182937573204981e-06
train_step:9900,loss is 4.109343080926919e-06
Mean Square Error is :0.002006

這次給我的教訓除了訓練資料要構造成序列外，還有一些函式的引數也要注意下。

RNN中利用LSTM來預測sin函式

前言：這個例子是用LSTM來預測sin函式的問題，期間遇到了一個了十分致命的問題，就是構造資料的時候，沒有把資料構造成序列，所以一直在報維度上的錯誤，以後對時序問題的預測要格外注意資料是否是序列的資料，否則很難檢查出問題，中間的問題其實比較好看出來，一除錯就能解決。這個例

在Angular中利用trackBy來提升性能

trac () str -m return info 新的第一個大量在Angular的模板中遍歷一個集合（collection）的時候你會這樣寫： <ul> <li *ngFor="let item of collection">{{ite

Vuejs在v-for中,利用index來對第一項新增class的方法

1.為li列表首項新增選中樣式： <li v-for="(items,index) in currentImgList" class="imgLiClass" :class="{'active': !index}"></li> 或者 <li v-for="(

c++中利用巨集來宣告和定義變數

假設我們要定義一個配置類，類中包含了很多的配置成員，有一種通過巨集的方法可以讓我們方便的維護繁多的成員在一個類中，定義一個變數需要型別，建構函式中給出的初始值。我們需要能夠像指令碼語言一樣進行配置變數： tconfig.h OPTION(m_data,OPT_INT,-1) OPTION(m_value

AngularJS 中利用 Interceptors 來統一處理 HTTP 的錯誤

Web 開發中，除了資料操作之外，最頻繁的就是發起和處理各種 HTTP 請求了，加上 HTTP 請求又是非同步的，如果在每個請求中來單獨捕獲各種常規錯誤，處理各類自定義錯誤，那將會有大量的功能類似的程式碼，或者使用醜陋的方法在每個請求中呼叫某幾個自定義的函式來處理。這兩種

VIM中利用巨集來實現插入一列遞增或遞減序號

　　經常遇到需要在文字中插入序號的情況，網上有很多方法，有時還要用到外掛。在這裡偶介紹偶經常使用的方法：利用VIM的巨集錄製功能來插入一列遞增或遞減序號。其實VIM的巨集錄製功能確實比較實用，可以完成很多工，省掉好多外掛。這裡舉例：　　需要在一個已經寫好的文字中插入行

MATLAB中利用牛頓法求解目標函式的區域性最小值

主函式（main_newton.m） % Newton法求解目標函式的區域性最小值 % Meringue % 2017/4/1 % --------------------------- % --

git中利用rebase來壓縮多次提交

之前我們用git merge –squash來將分支中多次提交合併到master後，只保留一次提交歷史。但是有些提交到github遠端倉庫中的commit資訊如何合併呢？歷史記錄首先我們檢視一下master分支的提交歷史： $ git log

Linux中利用logrotate來對log檔案進行轉儲

使用logrotate對日誌檔案轉儲，按時或者按大小。 logrotate簡介 NAME logrotate - rotates, compresses, and mails system logs SYNOPSIS

SpringMVC中利用@InitBinder來對頁面資料進行解析繫結

在使用SpingMVC框架的專案中，經常會遇到頁面某些資料型別是Date、Integer、Double等的資料要繫結到控制器的實體，或者控制器需要接受這些資料，如果這類資料型別不做處理的話將無法繫結。解決方法：使用註解@InitBinder來解決這些問題，這樣

如何在QML中利用Sprite來做我們需要的動畫

import QtQuick 2.0 import QtMultimedia 5.0 Item { width: 64 height: 64 property real hp: 3 SoundEffect { id: spawnSound s

JS中利用正則表示式交換函式的引數位置

某百科中看到一個例子，要用正則表示式將函式foo（a,b,c）中的引數位置換為foo（b,a,c），正好又在複習JS的過程中看到了正則表示式的部分，於是考慮用JS來實現這個功能。函式的引數同例題中一樣通過 [^,]* 進行匹配，於是寫出正則式： /foo\

Android中利用服務來守護程序

我們寫程式的時候，肯定會用到Service，而且還不止使用一個。當我們的程式中用到了Service的時候，說不定會被停掉。例如像360這樣的防毒軟體可能會誤操作對我們的Service有威脅。那麼我們就需要對我們的Service進行一個保護，也就是這裡所說的守

tensorflow 學習筆記13 RNN LSTM結構預測正弦(sin)函式

import tensorflow as tf import numpy as np import matplotlib.pyplot as plt BATCH_START = 0 TIME_STEPS = 20 BATCH_SIZE = 50 INPUT_SIZE =

【TensorFlow】LSTM（使用TFLearn預測正弦sin函式）

專案已上傳至 GitHub —— sin_pre 資料生成因為標準的迴圈神經網路模型預測的是離散的數值，所以需要將連續的 sin 函式曲線離散化所謂離散化就是在一個給定的區間 [0,MAX] 內，通過有限個取樣點模擬一個連續的曲線，即間

利用觀察者模式來獲取執行緒中的資料或者回調函式

首先//抽象主題角色，watched：被觀察 public interface Watched { public void addWatcher(Watcher watcher); public void removeWatcher(Watcher wat

【深度學習】python用RNN中LSTM進行正弦函式擬合

深度學習框架：Tensorflow 0.8.0 Python：2.7.6 資料的兩種輸入模型： ①data和label是同一個變數，整個模型相當於自迴歸（本文先演示第一種） ②data和label是不同的變數，整個模型相

利用ceye中的dns來獲取數據

ima .com 命令 flag 技術 img class pos div 安恒杯的一道命令執行題目查看，存在robots.txt文件查看index.txt文件，存在where_is_flag.php文件使用cat沒有任何回顯可以使用ceye平臺利

實測《Tensorflow實例：利用LSTM預測股票每日最高價（二）》的結果

直接 batch Language name 開盤 num 完全 tor 運行近期股市行情牛轉熊，大盤一直下探！由3200跌到了2700，想必很多人被深套了。這時想起人工智能能否預測股市趨勢?RNN能否起作用？　　這時便從網上找下教程，發現網上有個例子，

python中利用類創建的對象來保存信息

bsp 保存信息 ngs sha 入學 env exe pre info 在類創建的對象中，一般都是以字典的方式來class Student: class Student: def __init__(self, name, age, score):

RNN中利用LSTM來預測sin函式

相關推薦