Predicting the Next Letter with SimpleRNN
Let's look at next-letter prediction implemented with SimpleRNN. The idea: slide a fixed-length window of seq_len characters over the text, one-hot encode each window, and train the network to output a softmax distribution over the character that follows; at prediction time the window slides forward one character at a time, feeding each predicted character back in.
from __future__ import print_function
from keras.layers import Dense, Activation
from keras.layers.recurrent import SimpleRNN
from keras.models import Sequential
import numpy as np


# use SimpleRNN to generate the next letter
class RNNSimple:
    def __init__(self, hidden_size=128, batch_size=128, num_iter=24,
                 num_epoch=1, num_pred=100, seq_len=10, step=1):
        self.hidden_size = hidden_size
        self.batch_size = batch_size
        self.num_iter = num_iter
        self.num_epoch = num_epoch
        self.num_pred = num_pred
        self.seq_len = seq_len
        self.step = step

    def read_text(self, file_path):
        # read the corpus, drop empty lines, and join everything into one string
        lines = []
        with open(file_path, 'rb') as f:
            for line in f:
                line = line.strip().lower()
                line = line.decode('ascii', 'ignore')
                if len(line) == 0:
                    continue
                lines.append(line)
        return ' '.join(lines)

    def vectorize(self, text):
        # build char <-> index lookup tables
        chars = set(text)
        self.chars_count = len(chars)
        self.char2index = dict((c, i) for i, c in enumerate(chars))
        self.index2char = dict((i, c) for i, c in enumerate(chars))

        # slide a window of seq_len chars over the text;
        # the char right after each window is its label
        self.input_chars = []
        self.label_chars = []
        for i in range(0, len(text) - self.seq_len, self.step):
            self.input_chars.append(text[i: i + self.seq_len])
            self.label_chars.append(text[i + self.seq_len])

        # one-hot encode inputs and labels
        X = np.zeros((len(self.input_chars), self.seq_len, self.chars_count), dtype=bool)
        Y = np.zeros((len(self.input_chars), self.chars_count), dtype=bool)
        for i, input_char in enumerate(self.input_chars):
            for j, c in enumerate(input_char):
                X[i, j, self.char2index[c]] = 1
            Y[i, self.char2index[self.label_chars[i]]] = 1
        print(X.shape)
        print(Y.shape)
        return X, Y

    def train(self, X, Y):
        # build the model: SimpleRNN -> Dense -> softmax over all chars
        model = Sequential()
        model.add(SimpleRNN(self.hidden_size, return_sequences=False,
                            input_shape=(self.seq_len, self.chars_count),
                            unroll=True))
        model.add(Dense(self.chars_count))
        model.add(Activation('softmax'))
        model.compile(loss='categorical_crossentropy', optimizer='rmsprop')

        # train num_iter times, num_epoch epochs each
        for iteration in range(self.num_iter):
            print('Iteration: %d' % iteration)
            model.fit(X, Y, batch_size=self.batch_size, epochs=self.num_epoch)
        return model

    def predict(self, model, test_chars):
        result = test_chars
        epoch_chars = test_chars
        for _ in range(self.num_pred):
            # one-hot encode the current window
            vect_test = np.zeros((1, self.seq_len, self.chars_count))
            for i, ch in enumerate(epoch_chars):
                vect_test[0, i, self.char2index[ch]] = 1
            # greedily pick the most probable next char,
            # then slide the window forward by one
            pred = model.predict(vect_test, verbose=0)[0]
            pred_char = self.index2char[np.argmax(pred)]
            result += pred_char
            epoch_chars = epoch_chars[1:] + pred_char
        return result

    def process(self):
        # 1. read text from file
        text = self.read_text('./test.txt')
        print(len(text))
        # 2. vectorize text
        X, Y = self.vectorize(text)
        # 3. train on X, Y
        model = self.train(X, Y)
        # 4. predict from a random seed window
        test_idx = np.random.randint(len(self.input_chars))
        test_chars = self.input_chars[test_idx]
        print('test seed is: %s' % test_chars)
        result = self.predict(model, test_chars)
        print('result is: %s' % result)


if __name__ == '__main__':
    rnn_simple = RNNSimple()
    rnn_simple.process()
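One thing worth noting: predict() always takes the argmax, so generation is greedy and the model tends to repeat the same few patterns. A common alternative is to sample the next character from the softmax output with a temperature parameter. A minimal sketch (sample_with_temperature is an illustrative helper, not part of the class above); lower temperatures stay close to argmax, higher ones give more varied output:

import numpy as np

def sample_with_temperature(probs, temperature=0.8):
    # draw a char index from the softmax output instead of taking argmax;
    # temperature < 1 sharpens the distribution, temperature > 1 flattens it
    probs = np.asarray(probs).astype('float64')
    logits = np.log(probs + 1e-9) / temperature
    probs = np.exp(logits) / np.sum(np.exp(logits))
    return int(np.argmax(np.random.multinomial(1, probs, 1)))

# inside predict(), replace
#     pred_char = self.index2char[np.argmax(pred)]
# with
#     pred_char = self.index2char[sample_with_temperature(pred, 0.8)]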
Output:
Iteration: 0
Epoch 1/1
1739/1739 [==============================] - 0s 180us/step - loss: 3.1235
Iteration: 1
Epoch 1/1
1739/1739 [==============================] - 0s 42us/step - loss: 2.8657
Iteration: 2
Epoch 1/1
1739/1739 [==============================] - 0s 41us/step - loss: 2.7682
Iteration: 3
Epoch 1/1
1739/1739 [==============================] - 0s 42us/step - loss: 2.6973
Iteration: 4
Epoch 1/1
1739/1739 [==============================] - 0s 41us/step - loss: 2.6078
Iteration: 5
Epoch 1/1
1739/1739 [==============================] - 0s 42us/step - loss: 2.5333
Iteration: 6
Epoch 1/1
1739/1739 [==============================] - 0s 41us/step - loss: 2.4714
Iteration: 7
Epoch 1/1
1739/1739 [==============================] - 0s 41us/step - loss: 2.4033
Iteration: 8
Epoch 1/1
1739/1739 [==============================] - 0s 41us/step - loss: 2.3416
Iteration: 9
Epoch 1/1
1739/1739 [==============================] - 0s 42us/step - loss: 2.2842
Iteration: 10
Epoch 1/1
1739/1739 [==============================] - 0s 41us/step - loss: 2.2356
Iteration: 11
Epoch 1/1
1739/1739 [==============================] - 0s 40us/step - loss: 2.1725
Iteration: 12
Epoch 1/1
1739/1739 [==============================] - 0s 41us/step - loss: 2.1179
Iteration: 13
Epoch 1/1
1739/1739 [==============================] - 0s 41us/step - loss: 2.0791
Iteration: 14
Epoch 1/1
1739/1739 [==============================] - 0s 41us/step - loss: 2.0257
Iteration: 15
Epoch 1/1
1739/1739 [==============================] - 0s 41us/step - loss: 1.9759
Iteration: 16
Epoch 1/1
1739/1739 [==============================] - 0s 42us/step - loss: 1.9279
Iteration: 17
Epoch 1/1
1739/1739 [==============================] - 0s 41us/step - loss: 1.8844
Iteration: 18
Epoch 1/1
1739/1739 [==============================] - 0s 42us/step - loss: 1.8449
Iteration: 19
Epoch 1/1
1739/1739 [==============================] - 0s 41us/step - loss: 1.7889
Iteration: 20
Epoch 1/1
1739/1739 [==============================] - 0s 41us/step - loss: 1.7589
Iteration: 21
Epoch 1/1
1739/1739 [==============================] - 0s 41us/step - loss: 1.7087
Iteration: 22
Epoch 1/1
1739/1739 [==============================] - 0s 42us/step - loss: 1.6699
Iteration: 23
Epoch 1/1
1739/1739 [==============================] - 0s 41us/step - loss: 1.6291
test seed is: rrive at t
result is: rrive at the input nodes area ion is the sem of the seruen eo an te de the nm or es ae eamhen niin t ae ter
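After 24 iterations the output is still mostly garbled, though fragments such as "the" show the network has started to pick up local structure. Beyond more data and more iterations, a common next step is to swap SimpleRNN for LSTM, which in this version of Keras is a near drop-in change in train(). A hedged sketch, assuming the same old-style import path used above:

from keras.layers.recurrent import LSTM

# in train(), replace the SimpleRNN layer with an LSTM of the same shape
model.add(LSTM(self.hidden_size, return_sequences=False,
               input_shape=(self.seq_len, self.chars_count)))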