python搭建簡易神經網路結構

阿新 • • 發佈：2019-01-01

本節使用python環境，在不使用深度學習工具箱情況下搭建一個簡單的神經網路結構（非CNN卷積網路）來訓練mnist手寫體資料庫。

網路的結構可以很簡單，比如 [784, 200, 100, 10]：輸入維度 784 對應一張 28*28 的樣本影象展平後的長度，輸出維度 10 對應 10 個數字類別。網路包含 dropout 操作，本文的重點是理解這種最基礎的反向傳播機制的實現過程。

下面看下可執行的包含訓練測試的程式碼：

# -*- coding: utf-8 -*-
"""
@author: chen

"""
import numpy as np
import struct
from datetime import datetime
import matplotlib.pyplot as 
 plt

#讀取影象
def read_image(filename):
    """Load an IDX3 image file (the MNIST image format) into a 2-D array.

    The file starts with four big-endian unsigned 32-bit integers (magic
    number, image count, row count, column count) followed by one unsigned
    byte per pixel.

    Args:
        filename: Path of the IDX3 file to read.

    Returns:
        A float64 array of shape ``(numImages, numRows * numColumns)``; each
        row is one image flattened in file order, with raw values 0..255.

    Raises:
        struct.error: If the file is too short to contain the header.
        ValueError: If the file holds fewer pixel bytes than the header
            announces.
    """
    # The context manager closes the file even if reading fails.
    with open(filename, 'rb') as binfile:
        buf = binfile.read()

    header_fmt = '>IIII'
    _magic, numImages, numRows, numColumns = struct.unpack_from(header_fmt, buf, 0)
    offset = struct.calcsize(header_fmt)

    # Take the image size from the header instead of assuming 28*28 = 784.
    pixels_per_image = numRows * numColumns
    flat = np.frombuffer(buf, dtype=np.uint8,
                         count=numImages * pixels_per_image, offset=offset)
    # astype() yields a writable float64 copy, matching the np.zeros-based
    # array the per-image loop used to fill.
    return flat.reshape(numImages, pixels_per_image).astype(np.float64)

#讀取影象label
def read_label(filename):
    """Load an IDX1 label file (the MNIST label format) as one-hot rows.

    The file starts with two big-endian unsigned 32-bit integers (magic
    number, label count) followed by one unsigned byte per label.

    Args:
        filename: Path of the IDX1 file to read.

    Returns:
        A float64 array of shape ``(numLabels, 10)`` in which row ``i`` is
        all zeros except for a 1 in the column given by label ``i``.

    Raises:
        struct.error: If the file is too short to contain the header.
        ValueError: If the file holds fewer label bytes than the header
            announces.
        IndexError: If a label value is 10 or larger.
    """
    # The context manager closes the file even if reading fails.
    with open(filename, 'rb') as binfile:
        buf = binfile.read()

    header_fmt = '>II'
    _magic, numLabels = struct.unpack_from(header_fmt, buf, 0)
    labels = np.frombuffer(buf, dtype=np.uint8, count=numLabels,
                           offset=struct.calcsize(header_fmt))

    data = np.zeros((numLabels, 10))
    # One fancy-indexed assignment sets data[i, labels[i]] = 1 for every row.
    data[np.arange(numLabels), labels] = 1
    return data

# 建立與初始化網路引數    
class nn_setup():
    """Parameters and per-batch work buffers of a fully connected network.

    Attributes set by the constructor:
        net: 1-D integer array of layer widths, input layer first.
        size: Number of layers, i.e. ``net.size``.
        learningRate, epochs, batch, dropoutFraction: Stored unchanged.
        W: List of ``size - 1`` weight matrices; ``W[i]`` has shape
            ``(net[i + 1], net[i] + 1)``, the extra column being the bias.
        dW: List of zero matrices with the same shapes as ``W``.
        a, d: Lists of ``size`` zero buffers of shape ``(batch, net[i] + 1)``
            for every layer but the last, and ``(batch, net[-1])`` for the
            last one.
        dropoutMask: Same layout as ``a`` when ``dropoutFraction > 0``,
            otherwise an empty list.
        e: Zero buffer of shape ``(batch, net[-1])``.
        L: Scalar initialised to 0.
    """

    def __init__(self, net, learningRate=2, epochs=100, batch=100, dropoutFraction=0.05):
        """Store the hyper-parameters and allocate weights and buffers.

        Args:
            net: Layer widths, input layer first. Any integer sequence is
                accepted; an ndarray is stored as-is.
            learningRate: Value stored as ``self.learningRate``.
            epochs: Value stored as ``self.epochs``.
            batch: Number of rows of every per-batch buffer.
            dropoutFraction: Value stored as ``self.dropoutFraction``; the
                dropout mask buffers are only allocated when it is > 0.
        """
        # asarray() returns an ndarray argument unchanged and lets plain
        # lists/tuples work too (they have no .size attribute).
        self.net = np.asarray(net)
        self.size = self.net.size
        self.learningRate = learningRate
        self.dropoutFraction = dropoutFraction
        self.epochs = epochs
        self.batch = batch
        # Weights are kept in lists so each layer's matrix is indexed by layer.
        self.W = list()
        self.dW = list()
        self.dropoutMask = list()
        self.L = 0

        # One weight matrix per pair of consecutive layers: uniform values in
        # [-1, 1) scaled by 4 * sqrt(6 / (fan_in + fan_out)); "+ 1" is the bias.
        for i in range(1, self.size):
            fan_out = self.net[i]
            fan_in = self.net[i - 1]
            scale = 2 * 4 * np.sqrt(6.0 / (fan_out + fan_in))
            self.W.append((np.random.rand(fan_out, fan_in + 1) - 0.5) * scale)
            self.dW.append(np.zeros([fan_out, fan_in + 1]))

        self.a = self._layer_buffers()
        if self.dropoutFraction > 0:
            self.dropoutMask = self._layer_buffers()
        self.d = self._layer_buffers()

        # The shape must be ONE sequence argument: np.zeros(batch, width)
        # would pass the width as the dtype and raise TypeError.
        self.e = np.zeros([self.batch, self.net[self.size - 1]])

    def _layer_buffers(self):
        """Return a fresh list with one zero (batch, width) array per layer."""
        buffers = list()
        for i in range(self.size):
            # Every layer except the last carries an extra bias column.
            width = self.net[i] if i == self.size - 1 else self.net[i] + 1
            buffers.append(np.zeros([self.batch, width]))
        return buffers


def sigmoid(inputs):
    """Apply the logistic function 1 / (1 + exp(-x)) to an array in place.

    Args:
        inputs: NumPy array of any shape. It is overwritten with the result,
            so pass a copy if the original values are still needed.

    Returns:
        The same array object that was passed in, now holding the sigmoid
        of its former values.
    """
    # One vectorised expression replaces the per-element Python double loop;
    # writing through [...] keeps the overwrite-and-return-same-object
    # behaviour of the loop version.
    inputs[...] = 1.0 / (1.0 + np.exp(-inputs))
    return inputs

##----------------------------------------------------------------
if __name__ == '__main__':
    # Train the network on MNIST with mini-batch gradient descent and report
    # the test-set accuracy after every epoch.

    # Locations of the MNIST IDX files.
    filename_traindata = 'MNIST_data/train-images.idx3-ubyte'
    filename_trainlabel = 'MNIST_data/train-labels.idx1-ubyte'
    filename_testdata = 'MNIST_data/t10k-images.idx3-ubyte'
    filename_testlabel = 'MNIST_data/t10k-labels.idx1-ubyte'
    # Pixel values are scaled from 0..255 down to 0..1.
    train_data = read_image(filename_traindata) / 255
    train_label = read_label(filename_trainlabel)
    test_data = read_image(filename_testdata) / 255
    test_label = read_label(filename_testlabel)

    # Network layout and hyper-parameters.
    net = np.array([784, 200, 100, 10])
    learningRate = 2  # learning rate
    batch = 100  # mini-batch size
    epochs = 100  # number of passes over the training set
    dropoutFraction = 0.05  # dropout rate
    # Pass dropoutFraction explicitly so editing the value above takes effect.
    nn = nn_setup(net, learningRate=learningRate, batch=batch, epochs=epochs,
                  dropoutFraction=dropoutFraction)

    plot_flag = 0  # plot intermediate results? 0 = no
    Loss = np.array([])
    accuracy_all = np.array([])
    last = nn.size - 1  # index of the output layer

    # ---------------------- training ----------------------
    # The loop variable is "epoch" so it does not overwrite the "epochs"
    # setting above.
    for epoch in range(nn.epochs):
        time_start = datetime.now()  # start time of this epoch
        num = train_data.shape[0] // nn.batch
        for num_batch in range(num):
            # Sample a batch with replacement; the lower bound is 0 so the
            # first training sample can be drawn as well.
            choose = np.random.randint(0, train_data.shape[0], nn.batch)
            batch_x = train_data[choose, :]
            batch_y = train_label[choose, :]

            # ---------- forward pass: output of every layer ----------
            m = batch_x.shape[0]
            # A leading column of ones feeds the bias weights.
            nn.a[0] = np.hstack((np.ones([m, 1]), batch_x))
            for i in range(1, last):
                nn.a[i] = sigmoid(np.dot(nn.a[i - 1], nn.W[i - 1].T))
                if nn.dropoutFraction > 0:
                    # 1 keeps a unit, 0 drops it.
                    keep = np.random.rand(nn.a[i].shape[0], nn.a[i].shape[1]) > nn.dropoutFraction
                    nn.dropoutMask[i] = keep.astype(float)
                    nn.a[i] = nn.a[i] * nn.dropoutMask[i]
                nn.a[i] = np.hstack((np.ones([m, 1]), nn.a[i]))

            # Output layer and squared-error loss averaged over the batch.
            nn.a[last] = sigmoid(np.dot(nn.a[last - 1], nn.W[last - 1].T))
            nn.e = batch_y - nn.a[last]
            nn.L = 1 / 2 * np.sum(nn.e * nn.e) / m
            Loss = np.hstack((Loss, nn.L))

            # ---------- backward pass: delta of every layer ----------
            nn.d[last] = - nn.e * (nn.a[last] * (1 - nn.a[last]))
            for i in range(last - 1, 0, -1):
                d_act = nn.a[i] * (1 - nn.a[i])
                if i + 1 == last:
                    nn.d[i] = np.dot(nn.d[i + 1], nn.W[i]) * d_act
                else:
                    # Hidden-layer deltas carry a bias column; drop it.
                    nn.d[i] = np.dot(nn.d[i + 1][:, 1:], nn.W[i]) * d_act
                if nn.dropoutFraction > 0:
                    nn.d[i] = nn.d[i] * np.hstack((np.ones([nn.d[i].shape[0], 1]), nn.dropoutMask[i]))

            # ---------- gradients and weight update ----------
            # There are nn.size - 1 weight matrices. Iterating over all of
            # them also trains the output layer, which range(nn.size - 2)
            # silently skipped.
            for i in range(last):
                if i + 1 == last:
                    nn.dW[i] = np.dot(nn.d[i + 1].T, nn.a[i]) / nn.d[i + 1].shape[0]
                else:
                    nn.dW[i] = np.dot(nn.d[i + 1][:, 1:].T, nn.a[i]) / nn.d[i + 1].shape[0]
                nn.W[i] = nn.W[i] - nn.learningRate * nn.dW[i]

            # Progress report every 100 batches.
            if num_batch % 100 == 0:
                print('epochs = ', epoch, ' / ', nn.epochs,
                      '; batch = ', num_batch, ' / ', num,
                      '; error_batch = ', nn.L)

        # Subtracting the datetimes gives the true elapsed time; combining
        # the minute/second fields by hand breaks across an hour boundary.
        elapsed = (datetime.now() - time_start).total_seconds()
        print('time using for this epoch = ', elapsed, 's')

        # ---------- accuracy on the test set ----------
        m = test_data.shape[0]
        nn.a[0] = np.hstack((np.ones([m, 1]), test_data))
        for i in range(1, last):
            nn.a[i] = sigmoid(np.dot(nn.a[i - 1], nn.W[i - 1].T))
            # No units are dropped here; activations are scaled by the keep
            # probability instead.
            nn.a[i] = nn.a[i] * (1 - nn.dropoutFraction)
            nn.a[i] = np.hstack((np.ones([m, 1]), nn.a[i]))

        nn.a[last] = sigmoid(np.dot(nn.a[last - 1], nn.W[last - 1].T))
        res = nn.a[last]
        # Predicted and true class are the argmax of each row.
        pre_y = np.argmax(res, axis=1)
        y_label = np.argmax(test_label, axis=1)
        count = int(np.sum(pre_y == y_label))
        accuracy = count / y_label.size
        accuracy_all = np.hstack((accuracy_all, accuracy))
        print('-----------------------------------------\n',
              'test accuracy = ', accuracy, '(', count, '/', y_label.size, ')',
              '\n-----------------------------------------\n')
        if plot_flag:
            plt.figure(1)
            plt.plot(Loss)
            plt.title("training batch error")
            plt.figure(2)
            plt.plot(accuracy_all)
            plt.title("testing accuracy in different epochs")
            plt.show()

python搭建簡易神經網路結構

本節使用python環境，在不使用深度學習工具箱情況下搭建一個簡單的神經網路結構（非CNN卷積網路）來訓練mnist手寫體資料庫。網路的結構可以很簡單，比如就是([784,200,100,10])，輸入維度為784是一個樣本大小的28*28，網路包含drop

使用python定義一個神經網路結構

使用python定義一個神經網路 python定義一個神經網路是進行深度學習或者實現神經網路的基礎，那麼如果定義一個深度神經網路的結構呢？ import numpy as np class Ne

Python + Graphviz繪製神經網路結構圖--簡化版本實現

# -*- coding: utf-8 -*- """ Created on Mon Feb 20 14:27:54 2017 @author: ustc """ import os import sys import platform def isWindowsSystem(): retur

Python搭建簡易web伺服器，超好用～

有時需要手機除錯一些web頁面，於是～找到了這個超好用的方法首先，你要有python 然後，命令列進入web資料夾根目錄，這裡假設是index.html所在目錄輸入python命令： python -m SimpleHTTPServer 8080 8080是埠號，可以任

python 搭建簡易部落格詳細教程

最近想搞個個人主頁所以來學習下django，過程還是非常簡單的，耐心操作，其中的原理也大概能猜出來 1.下載django sudo pip install django 用的是1.10.1，大於1.7都行 2.建立工程在當前目錄下輸入 dja

Python搭建簡易HTTP服務（3.x版本和2.x版本的）

原文轉載地址：http://www.cnblogs.com/91allan/p/4889167.html 廢話不多說，我們工作時經常會用到需要HTTP服務，如果不想搞那些複雜的Apache、IIS伺服器等，這時我們就可以用python幫我們搭建一個簡單的伺服器。操作如下： 1、下載並安裝一個python；

python快速搭建簡易的FTP服務器

abc mark hang ces 一個用戶但是密碼完成上回說到，使用python搭建一個簡易的web下載服務器，但是這個簡易的服務器客戶端不能夠上傳文件。這次來搭建一個簡易的ftp服務器，來提供文件的下載和上傳功能。一、首先我們來安裝提供服務的pyftpdli

Python中使用Flask、MongoDB搭建簡易圖片伺服器

轉載：http://www.cppcns.com/shujuku/mongodb/119378.html 這篇文章主要介紹了Python中使用Flask、MongoDB搭建簡易圖片伺服器,本文是一個詳細完整的教程,需要的朋友可以參考下 1、前期準備通過 pip 或 easy_insta

神經網路一之神經網路結構與原理以及python實戰

技術交流qq群： 659201069 　　本系列博文由淺入深介紹神經網路相關知識，然後深入神經網路核心原理與技術，最後淺出python神經網路程式設計實戰。通過本系列博文，您將徹底理解神經網路的原理以及如何通過python開發可用於生產環境的程式。本博

【python keras實戰】用keras搭建卷積神經網路訓練模型

端到端的MNIST訓練數字識別 MNIST資料集是由Yann LeCun教授和他的團隊整理的，囊括了6萬個訓練樣本和1萬個測試樣本，每個樣本都是28*28的畫素值，並且是灰度影象，沒有R、G、B三層。我們要做的就是把每一個圖片分類到0~9的類別中。 kera

Tensorflow 搭建簡單神經網路 | Python

本案例為迴歸問題，採用了一層隱層，隱層和輸出層的啟用函式都為 relu，損失函式MSE。 import tensorflow as tf from numpy.random import Rando

從零開始：用Python搭建神經網路

在這篇部落格裡，我們將從零開始搭建一個三層的神經網路。我們不會對用到的數學原理一一贅述，但我保證你可以直觀地瞭解到我們在做什麼。另外，你也可以通過文章內的連結來獲取更詳細的資訊。這兒我就假定你已經熟悉基礎的微積分和機器學習的一些概念，比如分類和規範化，最好還能懂得一些優

python搭建httpserver

瀏覽器服務器一個 .html 助手使用簡單 sim 文章因為手機要下載電腦上的文件，使用手機助手什麽的經常出沒反應，於是網上查了下，直接使用python搭建簡單的HTTP服務器，之後在其運行目錄下扔文件就行了。瀏覽器訪問時可以直接顯示相關的文件列表。參考了

github+hexo+themes搭建簡易個性主題博客

page tps 什麽 ner new 安裝git w3c 封面 ges 0x00 install Node.js and git 安裝Node.js:http://www.runoob.com/nodejs/nodejs-install-setup.html 安裝g

python搭建ssserver限制端口連接數

時間是把 ipv 間隔 bin logging lis only rst 新建文件，編寫下面內容，保存為socket.py文件。放到ssserver.exe所在文件夾#!/usr/bin/python# -*- coding: utf-8 -*-## Copyright

python實現簡易的進度條

span div imp 進度 python stdout for flush logs 1 import sys,time 2 3 for i in range(50): 4 sys.stdout.write(‘#‘) 5 sys.stdout.flu

vue2搭建簡易spa

log col sset 修改 conf 新頁面 root 標簽 cnblogs 使用vue-cli來配置webpack,webpack是一個打包工具，使程序模塊化全局安裝vue-cli: npm install -g vue-cli 安裝好後，使用vue-cli腳手

nodejs 搭建簡易服務器

-1 max multer next() rom cookie () active .get www文件夾下 template文件夾下 server.js代碼： const express=require(‘express‘); const static=requi

dnsmasq搭建簡易dns服務器

dnsmasq系統：centos6.8_x64本機IP：172.17.41.243為了簡便直接使用yum安裝dnsmasqyum install -y dnsmasq安裝後編輯配置文件/etc/dnsmasql.cofcp /etc/dnsmasq.conf /etc/dnsmasq.conf.ori >

Python搭建環境

python 2.7介紹完python之後，相信大家對這門編程語言有一定的了解了吧。那麽接下來我們就要為自己的計算機裝上python，然後就開始我們愉快的python學習之路咯。Python是一門跨平臺語言，它可以在我們熟悉的windows上運行，也可以在mac和Linux系統上運行，安裝完成後你可以通過終端

python搭建簡易神經網路結構

相關推薦