logistic 回歸（線性和非線性）

阿新 • • 發佈：2018-10-24

num itl [1] tex sns RKE rec 損失函數 pos

一：線性logistic 回歸

代碼如下：

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import scipy.optimize as opt
import seaborn as sns

# Load the data set: two exam-score columns plus the 'Admitted' label.
path = 'ex2data1.txt'
data = pd.read_csv(path, header=None, names=['Exam 1', 'Exam 2', 'Admitted'])

# Split the rows by label: 1 -> positive, 0 -> negative.
positive = data[data['Admitted'].isin([1])]
negative = data[data['Admitted'].isin([0])]

# Optional: uncomment to look at the distribution of the two classes.
# fig, ax = plt.subplots(figsize=(12, 8))
# ax.scatter(positive['Exam 1'], positive['Exam 2'], s=60, c='b', marker='o', label='Admitted')
# ax.scatter(negative['Exam 1'], negative['Exam 2'], s=50, c='r', marker='x', label='UnAdmitted')
# ax.legend()
# ax.set_xlabel('Exam 1 Score')
# ax.set_ylabel('Exam 2 Score')
# plt.show()

#sigmoid函數實現
def sigmoid(h):
    """Apply the logistic function 1 / (1 + e^(-h)) element-wise to ``h``."""
    denominator = 1 + np.exp(-h)
    return 1 / denominator


# Optional: uncomment to plot sigmoid over the integers -10..10 as a visual check.
# nums = np.arange(-10, 11, step=1)
# fig, ax = plt.subplots(figsize=(12, 8))
# ax.plot(nums, sigmoid(nums), 'k')
# plt.show()

#計算損失函數值
def cost(theta, X, y):
    """Return the mean cross-entropy (log-loss) of the logistic model.

    theta: parameter vector, one weight per column of ``X``.
    X: sample matrix, one row per sample.
    y: labels; must have the same shape as ``X * theta.T`` (this script
       passes an m x 1 column) because the terms are multiplied element-wise.
    """
    theta = np.matrix(theta)
    X = np.matrix(X)
    y = np.matrix(y)

    # Evaluate the hypothesis once and reuse it in both log terms.
    hypothesis = sigmoid(X * theta.T)
    part1 = np.multiply(-y, np.log(hypothesis))
    part2 = np.multiply((1 - y), np.log(1 - hypothesis))
    return np.sum(part1 - part2) / len(X)

# Insert a column of ones as the first column so theta[0] is the intercept.
data.insert(0, 'ones', 1)

cols = data.shape[1]

# Every column except the last is a feature; the last column is the label.
X = data.iloc[:, 0:cols-1]
y = data.iloc[:, cols-1:cols]

X = np.array(X.values)
y = np.array(y.values)
# Initial parameters: a 1-D array with one zero per column of X
# (3 here: the ones column plus the two exam scores).
theta = np.zeros(X.shape[1])


#返回梯度向量，註意是向量
def gradient(theta, X, y):
    """Return the gradient of the logistic cost with respect to ``theta``.

    theta: parameter vector, one weight per column of ``X``.
    X: sample matrix, one row per sample.
    y: labels, same shape as ``X * theta.T`` (an m x 1 column in this script).

    The result is a 1 x n ``np.matrix`` (one entry per parameter), i.e. a
    vector of partial derivatives rather than a scalar.
    """
    theta = np.matrix(theta)
    X = np.matrix(X)
    y = np.matrix(y)

    # Residual between predicted probability and label, one row per sample.
    error = sigmoid(X * theta.T) - y

    # error.T (1 x m) times X (m x n) sums the per-sample contributions;
    # dividing by the sample count gives the mean.
    return error.T.dot(X) / len(X)

# Use SciPy's truncated-Newton optimiser (fmin_tnc) to find the theta that minimises the cost.
result = opt.fmin_tnc(func=cost, x0=theta, fprime=gradient, args=(X, y))

#print(cost(result[0], X, y))

#測試所得theta的性能
#計算原數據集的預測情況
def predict(theta, X):
    """Return a list of 0/1 labels, one per row of ``X``.

    A row is labelled 1 when its predicted probability is strictly
    greater than 0.5, otherwise 0.
    """
    probabilities = sigmoid(np.matrix(X) * np.matrix(theta).T)

    labels = []
    for p in probabilities:
        labels.append(1 if p > 0.5 else 0)
    return labels


theta_min = result[0]
predictions = predict(theta_min, X)

# A prediction counts as correct when it equals the true label.
correct = [1 if ((a == 1 and b == 1) or (a == 0 and b == 0)) else 0 for (a, b) in zip(predictions, y)]
# Percentage of correct predictions. The earlier `%` (modulo) only looked
# right because this data set has exactly 100 samples.
accuracy = 100 * sum(correct) / len(correct)
print('accuracy = {0}%'.format(accuracy))  # training-set accuracy, about 89%


# Plot the decision boundary theta0 + theta1 * x1 + theta2 * x2 = 0.
# Dividing theta by theta[2] rewrites it as x2 = -(theta0' + theta1' * x1).
theta_temp = theta_min
theta_temp = theta_temp / theta_temp[2]

# Separate names for the line so the label array `y` is not overwritten.
boundary_x = np.arange(130, step=0.1)
boundary_y = -(theta_temp[0] + theta_temp[1] * boundary_x)
# Scatter the original samples, coloured by label.
sns.set(context='notebook', style='ticks', font_scale=1.5)
# x/y are passed by keyword and the figure size via `height` (formerly
# `size`), which is what current seaborn releases accept.
sns.lmplot(x='Exam 1', y='Exam 2', hue='Admitted', data=data,
           height=6,
           fit_reg=False,
           scatter_kws={"s": 25}
           )
# Draw the boundary line on top of the scatter plot.
plt.plot(boundary_x, boundary_y, 'grey')
plt.xlim(0, 130)
plt.ylim(0, 130)
plt.title('Decision Boundary')
plt.show()

二：非線性logistic 回歸（正則化）

代碼如下：

import pandas as pd
import numpy as np
import scipy.optimize as opt
import matplotlib.pyplot as plt


# Load the second data set: two test-score columns plus the 'Accepted' label.
path = 'ex2data2.txt'
data = pd.read_csv(path, header=None, names=['Test 1', 'Test 2', 'Accepted'])

# Split the rows by label: 1 -> positive, 0 -> negative.
positive = data[data['Accepted'].isin([1])]
negative = data[data['Accepted'].isin([0])]

# Optional: uncomment to show the distribution of the raw data.
# fig, ax = plt.subplots(figsize=(12, 8))
# ax.scatter(positive['Test 1'], positive['Test 2'], s=50, c='b', marker='o', label='Accepted')
# ax.scatter(negative['Test 1'], negative['Test 2'], s=50, c='r', marker='x', label='Unaccepted')
# ax.legend()  # shows the Accepted / Unaccepted legend entries
# ax.set_xlabel('Test 1 Score')
# ax.set_ylabel('Test 2 Score')
# plt.show()
degree = 5
x1 = data['Test 1']
x2 = data['Test 2']
# Insert a constant column of ones at column index 3 (after 'Accepted').
data.insert(3, 'Ones', 1)

# Create polynomial features F<i><j> = x1^(i-j) * x2^j for i = 1..degree-1,
# so the highest total degree is 4.
# NOTE(review): j stops at i-1, so the pure x2^i terms are never generated;
# confirm this is intended before changing the feature set.
for i in range(1, degree):
    for j in range(0, i):
        data['F' + str(i) + str(j)] = np.power(x1, i-j) * np.power(x2, j)

# Drop the raw 'Test 1' and 'Test 2' columns from the frame.
data.drop('Test 1', axis=1, inplace=True)
data.drop('Test 2', axis=1, inplace=True)


#sigmoid函數實現
def sigmoid(h):
    """Return the element-wise logistic function of ``h``: 1 / (1 + exp(-h))."""
    exp_neg = np.exp(-h)
    return 1 / (exp_neg + 1)


def cost(theta, X, y, learnRate):
    """Return the cross-entropy cost plus an L2 penalty on ``theta``.

    theta: parameter vector, one weight per column of ``X``.
    X: sample matrix, one row per sample.
    y: labels, same shape as ``X * theta.T``.
    learnRate: multiplier of the squared-parameter penalty; the first
        parameter (column 0 of theta) is excluded from the penalty.
    """
    theta = np.matrix(theta)
    X = np.matrix(X)
    y = np.matrix(y)
    m = len(X)

    hypothesis = sigmoid(X * theta.T)
    positive_term = np.multiply(-y, np.log(hypothesis))
    negative_term = np.multiply((1 - y), np.log(1 - hypothesis))
    data_cost = np.sum(positive_term - negative_term) / m

    # Penalise every parameter except the first one.
    penalty = (learnRate / (2 * m)) * np.sum(np.power(theta[:, 1:], 2))
    return data_cost + penalty


# Multiplier of the L2 penalty used by cost(); the name is kept as-is
# because the calls below pass it by this name.
learnRate = 1
cols = data.shape[1]

# Column 0 holds the label; every remaining column is a feature.
y = np.array(data.iloc[:, 0:1])
X = np.array(data.iloc[:, 1:cols])

# Start the optimiser from an all-zero vector, one entry per feature column.
theta = np.zeros(X.shape[1])


#計算原數據集的預測情況
def predict(theta, X):
    """Classify each row of ``X``: 1 if its probability exceeds 0.5, else 0.

    Returns a plain Python list with one integer per row.
    """
    theta = np.matrix(theta)
    X = np.matrix(X)

    probability = sigmoid(X * theta.T)
    return [int(bool(p > 0.5)) for p in probability]


def gradientReg(theta, X, y, learnRate):
    """Return the gradient of the regularised logistic cost.

    theta: parameter vector, one weight per column of ``X``.
    X: sample matrix, one row per sample.
    y: labels, same shape as ``X * theta.T``.
    learnRate: multiplier of the L2 penalty (same meaning as in ``cost``).

    The result is a 1 x n ``np.matrix``. Entry j is the mean data gradient
    plus ``(learnRate / m) * theta[j]``, except for j = 0, which gets no
    penalty so that it matches ``cost`` (which skips the first parameter).
    """
    theta = np.matrix(theta)
    X = np.matrix(X)
    y = np.matrix(y)
    m = len(X)

    error = sigmoid(X * theta.T) - y

    # Penalty gradient for every parameter. The product is a new matrix,
    # so zeroing its first entry does not touch ``theta``.
    penalty = (learnRate / m) * theta
    penalty[0, 0] = 0

    return error.T * X / m + penalty

# Minimise the regularised cost with SciPy's truncated-Newton optimiser.
result = opt.fmin_tnc(func=cost, x0=theta, fprime=gradientReg, args=(X, y, learnRate))
print(result)

theta_min = np.matrix(result[0])
predictions = predict(theta_min, X)
# A prediction counts as correct when it equals the true label.
correct = [1 if ((a == 1 and b == 1) or (a == 0 and b == 0)) else 0 for (a, b) in zip(predictions, y)]
# Percentage of correct predictions; `%` (modulo) here would print the raw
# count whenever fewer than all samples are classified correctly.
accuracy = 100 * sum(correct) / len(correct)

print('accuracy = {0}%'.format(accuracy))

logistic 回歸（線性和非線性）

num itl [1] tex sns RKE rec 損失函數 pos 一：線性logistic 回歸代碼如下： import numpy as np import pandas as pd import matplotlib.pyplot as plt import

機器學習：邏輯回歸（損失函數）

梯度模型分享圖片 com info 而且機器學習邏輯分類 # # 由於邏輯回歸解決的是分類問題，而且是二分類，因此定義損失函數時也要有兩類　　# 1）如果 y = 1（p ≥ 0.5），p 越小，損失函數越大；　　# 2）如果 y = 0（p ≤ 0.5），

邏輯回歸（分類算法）

分類問題定性 oid 一個關系多分類研究根據 bsp 1.什麽是邏輯回歸在前面講述的回歸模型中，處理的因變量都是數值型區間變量，建立的模型描述是因變量的期望與自變量之間的線性關系。比如常見的線性回歸模型：　　　　　　　　　　　　　　　　而在采用回歸模型分析

angular 的http請求回撥（success 和 error）

前面有文章寫過angular的$http請求的簡單書寫和使用。回顧一下： var Server = angular.module("Server", []); Server.service("Api", ["$http", function ($http)

從零單排入門機器學習：線性回歸（linear regression）實踐篇

class rom enter instr function ont 線性 gin 向量線性回歸（linear regression）實踐篇之前一段時間在coursera看了Andrew ng的機器學習的課程，感覺還不錯，算是入門了。這次打算以該課程的作業

機器學習經典算法具體解釋及Python實現--線性回歸（Linear Regression）算法

ica single 方便最好的而且 == show des fun （一）認識回歸回歸是統計學中最有力的工具之中的一個。機器學習監督學習算法分為分類算法和回歸算法兩種，事實上就是依據類別標簽分布類型為離散型、連續性而定義的。顧名思義。分類算法用於離散型分布

邏輯回歸（Logistic Regression）

方差 %d pan transpose pos mit int gre cost import numpy as np import random def genData(numPoints,bias,variance):#實例偏好方差 x = np.zer

2.2 logistic回歸損失函數（非常重要，深入理解）

問題好的為知得出 cnblogs 回歸算法很多將他深入上一節當中，為了能夠訓練logistic回歸模型的參數w和b，需要定義一個成本函數使用logistic回歸訓練的成本函數為了讓模型通過學習來調整參數，要給出一個含有m和訓練樣本的訓練集很自然的，希望通過

ng機器學習視頻筆記（四） ——logistic回歸

微信 style 簡化關註 ora 微信公眾號預測縮放 log ng機器學習視頻筆記（四） ——logistic回歸（轉載請附上本文鏈接——linhxx）一、概述 1、基本概念 logistic回歸（logistic regression）

tensorflow實現svm多分類 iris 3分類——本質上在使用梯度下降法求解線性回歸（loss是定制的而已）

points near plot asi atm lob put matplot ive # Multi-class (Nonlinear) SVM Example # # This function wll illustrate how to # implement

ML:單變量線性回歸（Linear Regression With One Variable）

one mod gre line lin 我們目的技術 ESS 模型表達（model regression）用於描述回歸問題的標記 m 訓練集（training set）中實例的數量 x 特征/輸入變量 y 目標變量/輸出變量 (x,y) 訓練集中的實例 (x(

python實現線性回歸（一）原理

函數乘法學習偏移量 python實現機器線性計算梯度線性回歸是機器學習的基礎，用處非常廣泛，在日常工作中有很大作用。 1.什麽是線性回歸通過多次取點，找出符合函數的曲線，那麽就可以完成一維線性回歸。 2.數學表示是截距值，為偏移量。因為單純計算多項

在python中實現線性回歸（linear regression）

lsa d+ 分享圖片通過 nsq mps mile edi mfp 1 什麽是線性回歸確定因變量與多個自變量之間的關系，將其擬合成線性關系構建模型，進而預測因變量 2 線性回歸原理最小二乘法OLS（ordinary least squares）模型的y與實際值y

tensorflow-非線性回歸（2）

線性 tip optimizer lob rate bre multi random ide #!/usr/bin/env python2 # -*- coding: utf-8 -*- """ Created on Sat Sep 15 10:54:53 2018 @a

怎樣區分線性和非線性_線性與非線性的區別（線性分析、線性模型）

一直對線性非線性沒有很準確的定義認識,今天特意查了查,特此記錄下。怎樣區分線性和非線性 1.線性Line，是指量與量之間按照比例成直線關係，在數學上可理解為一階導數是個常數；非線性non-line則指不按照比例不成直線關係，一階導數不為常數。 2.線性可

機器學習---線性回歸（Machine Learning Linear Regression）

包括 rest 梯度下降法向量鞍點麻煩貝葉斯 div rem 線性回歸是機器學習中最基礎的模型，掌握了線性回歸模型，有利於以後更容易地理解其它復雜的模型。線性回歸看似簡單，但是其中包含了線性代數，微積分，概率等諸多方面的知識。讓我們先從最簡單的形式開始。

機器學習/邏輯回歸（logistic regression）/--附python代碼

一個 should 示意圖 algrithm cto python ber -- 根據個人分類：機器學習本文為吳恩達《機器學習》課程的讀書筆記，並用python實現。前一篇講了線性回歸，這一篇講邏輯回歸，有了上一篇的基礎，這一篇的內容會顯得比較簡單。邏輯回歸（l

opencv中線性和非線性濾波（程式）分析

線性濾波的方框濾波，均值濾波與高斯濾波，屬於非線性濾波的中值濾波，雙邊濾波，對應的程式中都給出了，這是一個綜合的測試程式。 #include <opencv2\opencv.hpp> #include <opencv2\highgui\highgui.hpp> #in

線性回歸（一）

.com fonts 應用 eight gre 垂直三維梯度地理什麽是機器學習？機器學習：研究如何通過計算的手段，利用經驗來改善系統自身的性能。機器學習分為監督學習和非監督學習。監督學習（Supervised learning）

機器學習筆記（4）Logistic回歸

可能性相同模擬我們 inline alt 最小 cas 離散模型介紹對於分類問題，其得到的結果值是離散的，所以通常情況下，不適合使用線性回歸方法進行模擬。所以提出Logistic回歸模型。其假設函數如下： \[ h_θ(x)=g(θ^Tx) \] 函數g定義如

logistic 回歸（線性和非線性）

相關推薦