機器學習BP神經網路,任意拓撲結構 (C++)
阿新 • • 發佈:2019-01-28
這次的版本更優秀了的樣子!
按照老闆說的,每個節點是單獨的匯出節點(會導致 sigmoid 訓練變慢,原因是 sigmoid 層數多了,梯度會迅速衰減,導致梯度消失。)
換個啟用函式就行了。
net_t<10> 表示網路有 10 個節點
然後input.txt裡的檔案格式大概是
n
0 1
1 2
3 4
....
n表示有n行,每行2個數字,表示2個點有邊。(0下標開始,不超過net初始化的節點數量)。任意拓撲結構都可以執行。
// BP neural network over an arbitrary graph topology.
// The undirected edge list is read from a file; node "heights" are assigned
// by a two-sided BFS from the output nodes (height 0, growing up) and the
// input nodes (height = node count, growing down). Edges are then oriented
// from higher to lower height, giving a DAG that is trained with ordinary
// back-propagation in topological order.
#include <bits/stdc++.h>
// #include "recordlog.h"  // NOTE(review): project-local header; nothing from
//                         // it is referenced in this file, and it breaks a
//                         // standalone build. Restore if its symbols are used.
#include <memory>

using std::cin;
using std::cout;
using std::endl;

// Debug-print helpers: pr(x) prints "x = <value> ", prln(x) adds a newline.
#define pr(x) cout << #x << " = " << x << " "
#define prln(x) cout << #x << " = " << x << endl

// The macros below all expect a local int variable `node` (index into
// `neurons`) and, where applicable, a loop variable `nextnode` (a PID taken
// from that node's adjacency list).
#define NODE (neurons[node])
#define NODE_GAIN (NODE.energy)                    // summed weighted input
#define NODE_THETA (NODE.loss_energy)              // node's bias (theta)
#define NODE_VALUE (NODE_GAIN + NODE_THETA)        // pre-activation value
#define NODE_OUTPUT (NODE.output)                  // post-activation output
#define NODE_PE (NODE.partial_derivative)          // dError/dOutput for node
#define D_NODE (derivative(NODE_VALUE))            // f'(pre-activation)
#define NEXT_NODE (neurons[nextnode.first])
#define NEXT_NODE_OUTPUT (NEXT_NODE.output)
#define NEXT_NODE_GAIN (NEXT_NODE.energy)
#define NEXT_NODE_PE (NEXT_NODE.partial_derivative)
#define NEXT_NODE_THETA (NEXT_NODE.loss_energy)
#define NEXT_NODE_VALUE (NEXT_NODE_GAIN + NEXT_NODE_THETA)
#define D_NEXT_NODE (derivative(NEXT_NODE_VALUE))
#define NODE_TO_NEXTNODE_WEIGHT (nextnode.second)  // weight of edge node->next

class neuron_t;
typedef std::pair<int, double> PID;     // (target node index, edge weight)
typedef std::vector<PID> neuron_array_t;
typedef std::vector<int> vector_map_t;
typedef std::unique_ptr<neuron_t> neuron_ptr_t;

// One neuron of the network.
class neuron_t
{
public:
    double energy;               // accumulated weighted input (gain)
    double output;               // activation output
    int number;                  // own index in the neuron pool
    double loss_energy;          // bias / theta
    neuron_array_t neuron_array; // outgoing edges: (target, weight)
    double partial_derivative;   // dError/dOutput
    bool is_input;
    bool is_output;
};

// A BP network with a fixed pool of `neuron_size` neurons whose wiring is
// read from an edge-list file (undirected; orientation is decided in setIO).
template <int neuron_size>
class net_t
{
public:
    neuron_t neurons[neuron_size];
    vector_map_t vector_map[neuron_size]; // undirected adjacency lists
    std::string activation_way;           // "sigmoid", "ReLU" or "line"
    std::vector<double> input_weight;     // weight applied to each raw input
    std::vector<int> output_number;       // indices of output neurons
    std::vector<int> input_number;        // indices of input neurons
    int tmp[neuron_size];      // scratch: permutation / in-degree counter
    int height[neuron_size];   // BFS height used to orient the edges
    int topology[neuron_size]; // topological order of the oriented DAG
    double rate;               // learning rate
    int userful_neuron_size;   // number of neurons reachable from the inputs

    static double sigmoid(double x) { return 1.0 / (1.0 + exp(-x)); }
    static double line(double x) { return x; }
    static double ReLU(double x) { return x <= 0 ? 0 : x; }

    // Derivative of the active activation function at pre-activation x.
    double derivative(double x)
    {
        if (activation_way == "sigmoid") {
            return sigmoid(x) * (1 - sigmoid(x));
        }
        if (activation_way == "ReLU") {
            return x < 0 ? 0 : 1;
        }
        if (activation_way == "line") {
            return 1;
        }
        cout << "no activationFunction!" << endl;
        return 0;
    }

    // Apply the selected activation function to (sum + theta).
    double activationFunction(double sum, double theta)
    {
        if (activation_way == "sigmoid") {
            return sigmoid(sum + theta);
        }
        if (activation_way == "ReLU") {
            return ReLU(sum + theta);
        }
        if (activation_way == "line") {
            return line(sum + theta);
        }
        cout << "no activationWay !" << endl;
        return 0;
    }

    // Random double in [l, r] with 1e-4 resolution.
    static double randomDouble(double l, double r)
    {
        return randomInt(l * 10000, r * 10000) / 10000.0;
    }

    // Random integer in [L, R]. NOTE(review): built on a product of rand()
    // calls, so the distribution is biased — acceptable only because it is
    // used for weight initialisation.
    static long long randomInt(long long L, long long R)
    {
        long long t = (unsigned long long)rand()
                    * (unsigned long long)rand()
                    * (unsigned long long)rand()
                    * (unsigned long long)rand() % (R - L + 1);
        return L + t;
    }

    ~net_t() {}

    // Load the undirected edge list from `file_name`.
    // File format: first `n` (edge count), then n lines "s t" meaning an
    // undirected edge between nodes s and t (0-based, < neuron_size).
    // Defaults: sigmoid activation, learning rate 0.1.
    net_t(std::string file_name)
    {
        FILE *file = fopen(file_name.c_str(), "r");
        printf("[%s]\n", file_name.c_str());
        if (file == NULL) {
            // FIX: previously fscanf() was called on a failed fopen (UB).
            printf("cannot open [%s]\n", file_name.c_str());
            exit(1);
        }
        int n;
        fscanf(file, "%d", &n);
        this->activation_way = "sigmoid";
        this->rate = 0.1; // default learning rate
        for (int i = 0; i < neuron_size; ++i) {
            vector_map[i].clear();
            tmp[i] = i;
            neurons[i].number = i;
            neurons[i].is_input = false;
            neurons[i].is_output = false;
        }
        this->output_number.clear();
        this->input_number.clear();
        prln(neuron_size);
        while (n--) {
            int s, t;
            fscanf(file, "%d%d", &s, &t);
            cout << s << " " << t << endl;
            vector_map[s].push_back(t);
            vector_map[t].push_back(s);
        }
        fclose(file);
    }

    net_t() { *this = net_t("input.txt"); }

    // Give every input neuron a random input weight and mark it as input.
    void initInputNeuron(std::vector<int> &input_num)
    {
        int sz = input_num.size();
        input_weight.resize(sz);
        for (int i = 0; i < sz; ++i) {
            input_weight[i] = randomDouble(-1, 1);
            neurons[input_num[i]].is_input = true;
        }
    }

    // Choose the input/output neurons (either as given, or from a random
    // permutation), orient the undirected edges into a DAG via the two-sided
    // BFS height labelling, randomise weights/biases, and compute the
    // topological order. Must be called once before training.
    void setIO(std::vector<double> &input, std::vector<double> &output,
               std::vector<int> *input_num = NULL,
               std::vector<int> *output_num = NULL)
    {
        if (input.size() == 0) {
            // TODO: report the error instead of silently returning
            return;
        }
        if (output.size() == 0) {
            // TODO: report the error instead of silently returning
            return;
        }
        if (input_num && output_num) {
            output_number = *output_num;
            input_number = *input_num;
        } else {
            // Pick IO nodes from a random permutation of all node indices.
            // FIX: std::random_shuffle was removed in C++17; std::shuffle
            // seeded from rand() keeps srand()-driven reproducibility.
            std::shuffle(tmp, tmp + neuron_size, std::mt19937(rand()));
            printf("output nodes are: ");
            for (size_t i = 0; i < output.size(); ++i) {
                output_number.push_back(tmp[i]);
                printf("%d ", tmp[i]);
            }
            printf("\n");
            printf("input nodes are:");
            for (size_t i = output.size(); i < input.size() + output.size(); ++i) {
                input_number.push_back(tmp[i]);
                printf("%d ", tmp[i]);
            }
            printf("\n");
        }
        // FIX: was initInputNeuron(*input_num), a NULL dereference whenever
        // the random branch above was taken (input_num defaults to NULL).
        initInputNeuron(input_number);
        for (size_t i = 0; i < output.size(); ++i) {
            neurons[output_number[i]].is_output = true;
        }
        // One BFS frontier per IO node.
        // FIX: was a variable-length array, which is not standard C++.
        std::vector<std::queue<int> > q(output.size() + input.size());
        memset(height, -1, sizeof(height));
        int cnt = 0;
        for (auto curnode : output_number) {
            q[cnt++].push(curnode);
            height[curnode] = 0; // outputs sit at the bottom
        }
        for (auto curnode : input_number) {
            q[cnt++].push(curnode);
            height[curnode] = neuron_size; // inputs sit at the top
        }
        // Expand every frontier one level at a time until nothing moves.
        bool flag = true;
        while (flag) {
            int pos = 0; // FIX: inner loop used to shadow the outer `cnt`
            flag = false;
            for (size_t i = 0; i < output_number.size(); ++i) {
                flag |= bfs(q[pos++], 1);  // grow upward from an output
            }
            for (size_t i = 0; i < input_number.size(); ++i) {
                flag |= bfs(q[pos++], -1); // grow downward from an input
            }
        }
        // Orient every undirected edge from the higher node to the lower one.
        auto build_map = [this](int from, int to) {
            neurons[from].neuron_array.push_back(
                std::make_pair(to, randomDouble(-1, 1)));
        };
        for (int i = 0; i < neuron_size; ++i) {
            for (auto curnode : vector_map[i]) {
                if (height[i] > height[curnode]) {
                    build_map(i, curnode);
                }
            }
        }
        for (int i = 0; i < neuron_size; ++i) {
            neurons[i].loss_energy = randomDouble(-1, 1);
        }
        getTopology(); // the network topology is now fully built
    }

    // Kahn's algorithm: topological order of the oriented DAG, seeded from
    // the input nodes. Reuses tmp[] as the in-degree counter.
    void getTopology()
    {
        memset(tmp, 0, sizeof(tmp));
        for (int i = 0; i < neuron_size; ++i) {
            for (auto nextnode : neurons[i].neuron_array) {
                ++tmp[nextnode.first];
            }
        }
        std::queue<int> q;
        for (auto curnode : input_number) {
            q.push(curnode);
        }
        int pos = 0;
        while (!q.empty()) {
            int curnode = q.front();
            q.pop();
            topology[pos++] = curnode;
            for (auto nextnode : neurons[curnode].neuron_array) {
                if (--tmp[nextnode.first] == 0) {
                    q.push(nextnode.first);
                }
            }
        }
        userful_neuron_size = pos; // nodes actually reachable from the inputs
    }

    // Expand one height level of the given frontier.
    // Returns true while the frontier still had nodes to process.
    bool bfs(std::queue<int> &q, int delta)
    {
        if (q.empty()) {
            return false;
        }
        int h = height[q.front()];
        while (!q.empty() && height[q.front()] == h) {
            int curnode = q.front();
            q.pop();
            for (auto nextnode : vector_map[curnode]) {
                if (height[nextnode] != -1) {
                    continue; // already labelled by some frontier
                }
                height[nextnode] = h + delta;
                q.push(nextnode);
            }
        }
        return true;
    }

    // Activate `node` and distribute its output along its outgoing edges.
    void cal_propagate(int node)
    {
        NODE_OUTPUT = activationFunction(NODE_GAIN, NODE_THETA);
        for (auto nextnode : NODE.neuron_array) {
            NEXT_NODE_GAIN += NODE_OUTPUT * NODE_TO_NEXTNODE_WEIGHT;
        }
    }

    // Forward pass: clear energies, feed in the weighted raw inputs, then
    // fire every reachable neuron in topological order.
    void propagate(std::vector<double> &input)
    {
        for (int i = 0; i < neuron_size; ++i) {
            neurons[i].energy = 0;
            neurons[i].output = 0;
        }
        for (size_t i = 0; i != input.size(); ++i) {
            int node = input_number[i];
            NODE_GAIN += input_weight[i] * input[i];
        }
        for (int i = 0; i < userful_neuron_size; ++i) {
            int node = topology[i];
            cal_propagate(node);
        }
    }

    // Backward step for one hidden node: accumulate dE/dOutput from the
    // successors, then gradient-descend the outgoing weights and the bias.
    void cal_back(int node)
    {
        for (auto &nextnode : NODE.neuron_array) {
            NODE_PE += NEXT_NODE_PE * NODE_TO_NEXTNODE_WEIGHT * D_NEXT_NODE;
        }
        for (auto &nextnode : NODE.neuron_array) {
            NODE_TO_NEXTNODE_WEIGHT -= NODE_OUTPUT * D_NEXT_NODE * NEXT_NODE_PE * rate;
        }
        NODE_THETA -= NODE_PE * D_NODE * rate;
    }

    // Backward pass for one training pair; propagate() must have run first.
    void back(std::vector<double> &input, std::vector<double> &output)
    {
        for (int i = 0; i < neuron_size; ++i) {
            neurons[i].partial_derivative = 0;
        }
        // Seed the output nodes with dE/dOutput of the squared-error loss
        // and update their biases immediately.
        for (size_t i = 0; i != output.size(); ++i) {
            int node = output_number[i];
            NODE_PE = NODE_OUTPUT - output[i];
            NODE_THETA -= NODE_PE * D_NODE * rate;
        }
        // Walk the topological order backwards over the hidden nodes.
        for (int i = userful_neuron_size - 1; i >= 0; --i) {
            int node = topology[i];
            if (NODE.is_output) {
                continue;
            }
            cal_back(node);
        }
        // Finally update the per-input scaling weights.
        for (size_t i = 0; i < input.size(); ++i) {
            int node = input_number[i];
            // FIX: the local was named `tmp`, shadowing the member tmp[].
            double grad = input[i] * NODE_PE * D_NODE;
            input_weight[i] -= grad * rate;
        }
    }

    // One SGD step on a single (input, output) pair. Returns the summed
    // squared error of the forward pass (outputs are read before the weight
    // update changes anything).
    double train(std::vector<double> &input, std::vector<double> &output)
    {
        propagate(input);
        back(input, output);
        double error = 0;
        for (size_t i = 0; i < output.size(); ++i) {
            double diff = neurons[output_number[i]].output - output[i];
            error += 0.5 * diff * diff; // pow(x, 2) replaced by x * x
        }
        return error;
    }

    // Dump the whole network state (weights, biases, activations) to stdout.
    void outputNetwork()
    {
        printf("---------------input nodes------------:\n");
        for (size_t i = 0; i < input_number.size(); ++i) {
            printf("[%d] weight:(%.7lf) \n", input_number[i], input_weight[i]);
        }
        printf("---------------other nodes------------\n");
        printf("other nodes\n");
        for (int i = 0; i < neuron_size; ++i) {
            pr(topology[i]), prln(i);
            int node = topology[i];
            printf("[%d] gain(%.7lf) theta(%.7lf) par_derivative(%.7lf) output(%.7lf) d(%.7lf)\n",
                   node, NODE_GAIN, NODE_THETA, NODE_PE, NODE_OUTPUT, D_NODE);
            for (auto nextnode : NODE.neuron_array) {
                printf(" -> %d (%.7lf)\n", nextnode.first, nextnode.second);
            }
        }
        printf("=============End====================\n");
    }

    // Run a forward pass and print the network's outputs.
    void testOutput(std::vector<double> &input)
    {
        propagate(input);
        cout << "output: ";
        for (auto curnode : output_number) {
            printf("%.7lf ", neurons[curnode].output);
        }
        cout << endl;
    }

    // NOTE(review): unused helper. It reads `energy` (pre-activation) rather
    // than `output`, ignores `input`, and does not call propagate() itself —
    // presumably the caller is expected to propagate first; verify before
    // relying on it.
    std::vector<double> getTest(std::vector<double> &input)
    {
        std::vector<double> q;
        for (auto curnode : output_number) {
            q.push_back(neurons[curnode].energy);
        }
        return q; // FIX: `return move(q)` defeated NRVO
    }
};

// XOR training demo on an 8-node network read from input.txt:
// nodes 0 and 1 are the inputs, node 7 is the output.
void doit251()
{
    // FIX: srand used to run after the net constructor had already consumed
    // rand(); seed first so the whole run is reproducible.
    srand(0);
    std::vector<int> in({0, 1});
    std::vector<int> out({7});
    net_t<8> net; // reads "input.txt"
    std::vector<double> input1({0, 0});
    std::vector<double> input2({0, 1});
    std::vector<double> input3({1, 0});
    std::vector<double> input4({1, 1});
    std::vector<double> output1({0});
    std::vector<double> output2({1});
    std::vector<double> output3({1});
    std::vector<double> output4({0});
    net.setIO(input1, output1, &in, &out);
    net.activation_way = "sigmoid";
    net.rate = 20; // aggressive learning rate for this tiny problem
    double error = 0;
    for (int i = 1; i <= 20000; ++i) {
        error = 0;
        error += net.train(input1, output1);
        error += net.train(input2, output2);
        error += net.train(input3, output3);
        error += net.train(input4, output4);
        error /= 4;
        cout << error << "\r";
    }
    prln(error);
    net.testOutput(input1);
    net.testOutput(input2);
    net.testOutput(input3);
    net.testOutput(input4);
}

int main()
{
    doit251();
    return 0;
}