
Softmax Regression in C++

Preface

The theory behind the Softmax regression model was covered in the previous post. The C++ code comes from an open-source project whose link I have unfortunately forgotten; I will add it if I ever find it again. My changes to the original source are small, mostly a few extensions.

Environment

Visual Studio 2013

Data

The dataset contains 20,000 samples, each with 16 integer features; it is loaded below from letter-recognition.data.
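Each line holds a capital-letter label followed by the 16 comma-separated integer features, which is exactly the layout loadData below expects. A representative line (shown only to illustrate the format, as it appears in the public UCI copy of the dataset):

T,2,8,3,5,1,8,13,0,6,6,10,8,0,8,0,8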

Goal

Classify the letter samples in the dataset.

Code

1. Define a LogisticRegression class:

Header file LogisticRegression.h

#include <iostream>
#include <cmath>
#include <cstdio>   // fopen/fgets/sscanf, used in loadData
#include <cstring>  // strchr, used in loadData
#include <algorithm>
#include <functional>
#include <string>
#include <cassert>
#include <vector>
using namespace std;
class LogisticRegression {
public:
	LogisticRegression(int inputSize, int k, int dataSize, int num_iters, double learningRate);
	~LogisticRegression();
	bool loadData(const string& filename); // load the training data
	void train();                          // training routine
	void softmax(double* thetaX);          // turn theta*x scores into class probabilities
	double predict(double* x);             // predict the class index of a sample
	double** getX();
	double** getY();
	void printX();
	void printY();
	void printTheta();
private:
	int inputSize;  // number of input features, excluding the bias term
	int k;          // number of classes
	int dataSize;   // number of samples
	int num_iters;  // number of training iterations
	double **theta; // learned weight parameters, k x inputSize
	double alpha;   // learning rate
	double** x;     // training data, dataSize x inputSize
	double** y;     // one-hot labels for the training data, dataSize x k
};

Implementation file LogisticRegression.cpp

#include "LogisticRegression.h"
LogisticRegression::LogisticRegression(int in, int out,int size, int num_iters,double learningRate) {
	inputSize = in;
	k = out;
	alpha = learningRate;
	dataSize = size; 
	this->num_iters = num_iters;
	// initialize theta
	theta = new double*[k];
	for (int i = 0; i<k; i++) theta[i] = new double[inputSize];
	for (int i = 0; i<k; i++) {
		for (int j = 0; j<inputSize; j++) {
			theta[i][j] = 0;
		}
	}
	//initialize x
	x = new double*[dataSize];
	for (int i = 0; i<dataSize; i++) x[i] = new double[inputSize];
	for (int i = 0; i<dataSize; i++) {
		for (int j = 0; j<inputSize; j++) {
			x[i][j] = 0;
		}
	}
	//initialize y
	y = new double*[dataSize];
	for (int i = 0; i<dataSize; i++) y[i] = new double[k];
	for (int i = 0; i<dataSize; i++) {
		for (int j = 0; j<k; j++) {
			y[i][j] = 0;
		}
	}
}

LogisticRegression::~LogisticRegression() {
	for (int i = 0; i<k; i++) delete[] theta[i];
	delete[] theta;
	for (int i = 0; i < dataSize; i++)
	{
		delete[] x[i];
		delete[] y[i];
	}
	delete[] x;
	delete[] y;
}

void LogisticRegression::train() {
	for (int n = 0; n < num_iters; n++)
	{
		for (int s = 0; s < dataSize; s++)
		{
			double *py_x = new double[k];
			double *dy = new double[k];
			//1. compute the scores theta * x for sample s
			for (int i = 0; i<k; i++) {
				py_x[i] = 0;
				for (int j = 0; j<inputSize; j++) {
					py_x[i] += theta[i][j] * x[s][j];
				}
			}
			//2. convert the scores into class probabilities
			softmax(py_x);
			for (int i = 0; i<k; i++) {
				dy[i] = y[s][i] - py_x[i]; // difference between the one-hot label and the prediction

				for (int j = 0; j<inputSize; j++) {
					theta[i][j] += alpha * dy[i] * x[s][j] / dataSize;
				}
			}
			delete[] py_x;
			delete[] dy;
		}
	}
}
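For reference, the update implemented above is per-sample gradient ascent on the softmax log-likelihood (with the extra 1/dataSize scaling the original code applies to each step):

$$p_i = \frac{e^{\theta_i^\top x}}{\sum_{c=1}^{k} e^{\theta_c^\top x}}, \qquad \theta_i \leftarrow \theta_i + \frac{\alpha}{N}\,\bigl(\mathbf{1}\{y = i\} - p_i\bigr)\,x$$

where $\mathbf{1}\{y=i\}$ is the one-hot entry y[s][i], $p_i$ is py_x[i] after softmax, and $N$ is dataSize.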

void LogisticRegression::softmax(double *x) {
	double max = x[0]; // start from x[0]: initializing to 0 would be wrong if all scores are negative
	double sum = 0.0;

	for (int i = 1; i<k; i++) if (max < x[i]) max = x[i];
	for (int i = 0; i<k; i++) {
		x[i] = exp(x[i] - max); // shift by the max to avoid overflow in exp
		sum += x[i];
	}

	for (int i = 0; i<k; i++) x[i] /= sum;
}
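The shift by the max matters more than it might look: with 16 integer features and growing weights, the raw scores theta*x can get large. A minimal standalone check (my example, not part of the project) shows the failure mode:

#include <cmath>
#include <cstdio>
int main() {
	double score = 1000.0;              // a large raw score
	printf("%g\n", exp(score));         // inf: exp overflows a double at roughly 709
	printf("%g\n", exp(score - score)); // 1: after shifting by the max, exp stays in range
	return 0;
}

Subtracting the max leaves the probabilities unchanged, because the common factor exp(-max) cancels in the normalization.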


double LogisticRegression::predict(double *x) {
	double clsLabel = 0;
	double* predictY = new double[k];
	for (int i = 0; i < k; i++) {
		predictY[i] = 0;
		for (int j = 0; j < inputSize; j++) {
			predictY[i] += theta[i][j] * x[j];
		}
	}
	softmax(predictY);
	double max = 0;
	for (int i = 0; i < k; i++)
	{
		if (predictY[i] > max) {
			clsLabel = i;
			max = predictY[i];
		}
	}
	delete[] predictY; // the original leaked this buffer on every call
	return clsLabel;   // index of the most probable class
}

double** LogisticRegression::getX()
{
	return x;
}
double** LogisticRegression::getY()
{
	return y;
}

bool LogisticRegression::loadData (const string& filename)
{
	const int M = 1024;
	char buf[M + 2];
	int i;
	FILE* f = fopen(filename.c_str(), "rt");
	if (!f)
	{
		cout << "Could not read the database " << filename << endl;
		return false;
	}
	int rowIndex = 0;
	for (;;)
	{
		char* ptr;
		if (!fgets(buf, M, f) || !strchr(buf, ','))// stop on EOF or on a line with no comma (not a data row)
			break;
		y[rowIndex][buf[0] - 'A'] = 1; // the first character is the letter label; one-hot encode it
		ptr = buf + 2;                 // skip the label and the comma after it
		for (i = 0; i < inputSize; i++)
		{
			int n = 0; // %n receives how many characters sscanf consumed
			int m = 0;
			sscanf(ptr, "%d%n", &m, &n); // read the next integer feature from the line
			x[rowIndex][i] = m;
			ptr += n + 1;                // advance past the number and the following comma
		}
		rowIndex++;
		if (rowIndex >= dataSize) break;
		if (i < inputSize)
			break;
	}
	fclose(f);
	cout << "The database " << filename << " is loaded.\n";
	return true;
}

void LogisticRegression::printX()
{
	for (int i = 0; i<dataSize; i++) {
		for (int j = 0; j<inputSize; j++) {
			cout << x[i][j] << " ";
		}
		cout << endl;
	}
}
void LogisticRegression::printY()
{
	for (int i = 0; i<dataSize; i++) {
		for (int j = 0; j<k; j++) {
			cout << y[i][j] << " ";
		}
		cout << endl;
	}
}

void LogisticRegression::printTheta()
{
	for (int i = 0; i < k; i++) {
		for (int j = 0; j < inputSize; j++) {
			cout << theta[i][j] << " ";
		}
		cout << endl;
	}

}
2. Test the code:
#include "LogisticRegression.h"
void letter_recog()
{
	double learning_rate = 0.1;
	int num_iters = 500;  // number of training iterations
	int train_N = 10000;  // number of training samples
	int test_N = 8;       // number of test samples
	int n_in = 16;        // input feature dimension
	int n_out = 26;       // number of classes (letters A..Z)
	LogisticRegression classifier(n_in, n_out, train_N, num_iters, learning_rate);
	classifier.loadData("letter-recognition.data");
	// train
	classifier.train();
	// test data
	double test_X[8][16] = {
		{ 5, 10, 6, 8, 4, 7, 7, 12, 2, 7, 9, 8, 9, 6, 0, 8 },//M
		{ 6, 12, 7, 6, 5, 8, 8, 3, 3, 6, 9, 7, 10, 10, 3, 6 },//W
		{ 3, 8, 4, 6, 4, 7, 7, 12, 1, 6, 6, 8, 5, 8, 0, 8 },//N
		{ 1, 0, 1, 0, 0, 7, 8, 10, 1, 7, 5, 8, 2, 8, 0, 8 },//H
		{ 3, 6, 5, 5, 6, 6, 8, 3, 3, 6, 5, 9, 6, 7, 5, 9 },//R
		{ 7, 11, 11, 8, 7, 4, 8, 2, 9, 10, 11, 9, 5, 8, 5, 4 }, //X
		{ 6, 9, 6, 4, 4, 8, 9, 5, 3, 10, 5, 5, 5, 10, 5, 6 },//P	
		{ 4, 7, 6, 5, 5, 8, 5, 7, 4, 6, 7, 9, 3, 7, 6, 9 }//Q
	};
	// test
	for (int i = 0; i<test_N; i++) {
		double predict = classifier.predict(test_X[i]);
		char char_predict = 'A' + (int)predict; // cast the returned class index before adding the character offset
		cout << "predict:" << char_predict << endl;
	}
}

int main() {
	letter_recog();
	getchar(); // keep the console window open on exit
	return 0;
}

Output:

The classifier was trained on the first 10,000 samples, and the whole training run took 328.117 s. To speed things up, I used OpenMP to parallelize the for loops. Enabling OpenMP in Visual Studio is simple: open Project --> Properties, and under C/C++ --> Language turn on Open MP Support. The modified train function:
void LogisticRegression::train() {
	for (int n = 0; n < num_iters; n++)
	{
#pragma omp parallel for  
		for (int s = 0; s < dataSize; s++)
		{
			// per-sample scratch buffers: each thread allocates its own, so these stay race-free
			double *py_x = new double[k];
			double *dy = new double[k];
			//1. compute the scores theta * x for sample s
			for (int i = 0; i<k; i++) {
				py_x[i] = 0;
				for (int j = 0; j<inputSize; j++) {
					py_x[i] += theta[i][j] * x[s][j];
				}
			}
			//2. convert the scores into class probabilities
			softmax(py_x);
			// note: all threads read and update theta concurrently without locks below,
			// so writes can race (Hogwild-style); SGD usually tolerates this
#pragma omp parallel for // inert inside the outer parallel region unless nested parallelism is enabled
			for (int i = 0; i<k; i++) {
				dy[i] = y[s][i] - py_x[i]; // difference between the one-hot label and the prediction
				for (int j = 0; j<inputSize; j++) {
					theta[i][j] += alpha * dy[i] * x[s][j] / dataSize; //- lambda*theta[i][j];
				}
			}
			delete[] py_x;
			delete[] dy;
		}
	}
}
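If the racy weight updates bother you, one race-free variant (my sketch, not part of the original code) makes each update atomic, trading some speed for clean writes. Replace the innermost j loop above with:

			for (int j = 0; j < inputSize; j++) {
				double delta = alpha * dy[i] * x[s][j] / dataSize;
#pragma omp atomic
				theta[i][j] += delta; // serializes concurrent writes to the same weight
			}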
The modified softmax function:
void LogisticRegression::softmax(double *x) {
	// when called from inside train()'s parallel region, these pragmas run on the calling thread only
	double max = x[0];
	double sum = 0.0;
	for (int i = 1; i<k; i++) if (max < x[i]) max = x[i];
#pragma omp parallel for reduction(+:sum) // the reduction clause avoids a data race on sum
	for (int i = 0; i<k; i++) {
		x[i] = exp(x[i] - max); // shift by the max to avoid overflow
		sum += x[i];
	}
#pragma omp parallel for  
	for (int i = 0; i<k; i++) x[i] /= sum;
}
Output: training time dropped from 328.117 s to 49.081 s, a 6.68x speedup.
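The post does not show the timing code; a minimal way to reproduce the measurement (my addition, using std::chrono) is to wrap the call to train() in letter_recog():

#include <chrono>
// ...
auto t0 = std::chrono::steady_clock::now();
classifier.train();
auto t1 = std::chrono::steady_clock::now();
cout << "training took "
	<< std::chrono::duration<double>(t1 - t0).count() << " s" << endl;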
Judging from the test results, the classifier mispredicts R as K and X as U. This post does not rigorously measure the classifier's accuracy; interested readers can test it themselves.
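If you want a quick number, here is a rough sketch (my addition, built only on the class's public API): it loads all 20,000 rows into a second, untrained LogisticRegression used purely as a data holder, then scores the 10,000 rows the classifier never saw during training:

// Held-out accuracy on rows 10000..19999 (assumes classifier was trained on the first 10000).
LogisticRegression holder(n_in, n_out, 20000, 0, 0.0); // data holder only; never trained
holder.loadData("letter-recognition.data");
double **hx = holder.getX();
double **hy = holder.getY();
int correct = 0;
for (int s = 10000; s < 20000; s++) {
	int pred = (int)classifier.predict(hx[s]);
	if (hy[s][pred] == 1) correct++; // one-hot label: correct if the predicted column is set
}
cout << "held-out accuracy: " << 100.0 * correct / 10000.0 << "%" << endl;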