SIFT演算法特徵描述子構建---特徵描述子構建原理及程式碼

阿新 • • 發佈：2019-02-05

0.引言

sift針對區域性特徵進行特徵提取，在尺度空間尋找極值點，提取位置，尺度，旋轉不變數，生成特徵描述子。

總共分四個步驟：

4 特徵描述子構建

每個關鍵點的方向、位置、尺度資訊都具備後，可以對區域性特徵進行描述，即特徵描述子。

4.1 確定描述子區域

將關鍵點劃分為d*d(Lowe建議4)個子區域，每個子區域為一個種子點，
每個種子點有8個方向，即128維特徵。為每個子區域分配邊長為3*sigma_oct的矩形取樣，考慮實際計算用雙線性插值，以及旋轉，放大sqrt(2)*(d+1),
最終所選影象視窗半徑

4.2 座標軸旋轉為關鍵點的方向

旋轉保持旋轉不變性
這裡寫圖片描述

4.3 將子區域內的梯度值插值加權分配到8 個方向上

這裡寫圖片描述

//對每個種子點每個方向插值
//weight=w*dr^k*(1-dr)^（1-k）*dc^m*(1-dc)^(1-m)*do^n*(1-do)^(1-n)
//m,n,k為0，1
void InterpHistEntry(double*** hist, double xbin, double ybin, double obin, double mag, int bins, int d)
{
    //對鄰近兩行的貢獻因子為dr和1 - dr，對鄰近兩列的貢獻因子為dc和1 - dc，對鄰近兩個方向的貢獻因子為do和1 - do
    double 
 d_r, d_c, d_o;
    int r0, c0, o0;
    //r0取不大於xbin的正整數時。
    //r0 + 0 <= xbin <= r0 + 1
    //mag在區間[r0, r1]上做插值
    r0 = cvFloor(ybin);
    c0 = cvFloor(xbin);
    o0 = cvFloor(obin);
    d_r = ybin - r0; // 計算偏差
    d_c = xbin - c0;
    d_o = obin - o0;

    double v_r, v_c, v_o;//v_r為mag在行上、列加權，最後方向的加權
    int rb, cb, ob;//r,c,o分別取0，1時候的行列 

    double** row, *h;
    for (int r = 0; r <= 1; r++)
    {
        rb = r + r0;
        if (rb >= 0 && rb<d)//在4*4描述子內
        {
            v_r = mag*((r == 0) ? 1 - d_r : d_r);//分別計算r取0，1時的值，最後相加
            row = hist[rb];//固定行，進入hist的列
            for (int c = 0; c <= 1; c++)
            {
                cb = c0 + c;
                if (cb >= 0 && cb<d)
                {
                    v_c = v_r*((c == 0) ? 1 - d_c : d_c);
                    h = row[cb];
                    for (int o = 0; o <= 1; o++)
                    {
                        ob = (o0 + o) % bins;
                        v_o = v_c*((o == 0) ? 1 - d_o : d_o);
                        h[ob] += v_o;//累加各層取0，1時候的加權值
                    }
                }

            }
        }

    }
}

double*** CalculateDescrHist(const Mat&gauss, int x, int y, double octave_scale, double ori, int bins, int width)
{
//二維陣列指標,width 為子區域尺寸d=4*4
double *hist = new double [width];
for (int i = 0; i < width; i++)
{
//長度為width的一維陣列指標
hist[i] = new double *[width];
for (int j = 0; j < width; j++)
{
//每個hist處是一個36維陣列
hist[i][j] = new double[bins];
}
}
//初始化
for (int r = 0; r < width; r++)
for (int c = 0; c < width; c++)
for (int o = 0; o < bins; o++)
hist[r][c][o] = 0.0;

//高斯權值，Lowe建議子區域的畫素的梯度大小按sigma=0.5*d的高斯加權計算，即2
double sigma = 0.5*width;
double conste = -1.0 / (2 * sigma*sigma);

double sub_hist_width = DESCR_SCALE_ADJUST*octave_scale;//每個子區域尺寸為mσ個像元 尺度特徵點的尺度值3*sig_oct
                                                        //子區域半徑
int radius = cvRound((sqrt(2)*sub_hist_width*(width + 1)) / 2.0);
double grad_ori;
double grad_mag;
/*計算取樣區域點座標旋轉
|x`|  |cos -sin| |x|
|  | =|        |*| |
|y`|  |sin  cos| |y|
子區域下標
| x``|  1               |x|
|    |=--------------*  | | +1/d
| y``| sub_hist_width   |y|
*/
double cos_ori = cos(ori);
double sin_ori = sin(ori);
for (int i = -radius; i < radius; i++)
{
    for (int j = -radius; j < radius; j++)
    {
        double rot_x = (cos_ori*j - sin_ori + i);
        double rot_y = (sin_ori*j + cos_ori + i);   
        double xbin = rot_x / sub_hist_width + width / 2 - 0.5;                     //xbin, ybin為落在4 * 4視窗中的下標值
        double ybin = rot_y / sub_hist_width + width / 2 - 0.5;
        if (xbin>-1.0&&xbin<width&&ybin>-1 && ybin<width)
        {
            //計算關鍵點的梯度
            if (CalcGradMagOri(gauss, x + j, y + i, grad_mag, grad_ori))
            {
                //梯度方向夾角
                grad_ori = (CV_PI - grad_ori) - ori;
                while (grad_ori<0)
                {
                    grad_ori += CV_PI * 2;
                }
                while (grad_ori >= CV_PI * 2)
                {
                    grad_ori -= 2 * CV_PI;
                }
                double obin = grad_ori*(bins / (2 * CV_PI));//種子點所在子視窗的方向 
                                                            //公式子區域畫素梯度進行高斯加權：exp(-（(x`2)+（y`2））/(2*(0.5d)^2))
                double weight = exp(conste*(rot_x*rot_x + rot_y*rot_y));

                //插值計算每個種子點處的梯度
                InterpHistEntry(hist, xbin, ybin, obin, grad_mag*weight, bins, width);
            }
        }

    }
}


return hist;

}

4.4 歸一化及門限

如上統計的4*4*8=128個梯度資訊即為該關鍵點的特徵向量。特徵向量形成後，為了去除光照變化的影響，需要對它們進行歸一化處理，對於影象灰度值整體漂移，影象各點的梯度是鄰域畫素相減得到，所以也能去除。
這裡寫圖片描述

void NormalizeDescr(Keypoint& feat)
{
    double len_sq = 0;
    for (int i = 0; i < feat.descr_length; i++)
    {
        len_sq += feat.descriptor[i] * feat.descriptor[i];
    }
    len_sq = sqrt(len_sq);
    for (int i = 0; i < feat.descr_length; i++)
    {
        feat.descriptor[i] = feat.descriptor[i] / len_sq;
    }
}

設定門限
非線性光照，相機飽和度變化對造成某些方向的梯度值過大，而對方向的影響微弱。因此設定門限值(向量歸一化後，一般取0.2)截斷較大的梯度值。然後，再進行一次歸一化處理，提高特徵的鑑別性。

//直方圖存入特徵描述子
void HistToDescriptor(double***hist, int width, int bins, Keypoint& feature)
{
    int k = 0;
    for (int r = 0; r < width; r++)
    {
        for (int c = 0; c < width; c++)
        {
            for (int o = 0; o < bins; o++)
            {
                feature.descriptor[k++] = hist[r][c][o];//放進128維特徵描述子內
            }
        }
    }
    feature.descr_length = k;
    //描述子歸一化
    NormalizeDescr(feature);
    //描述子門限
    for (int i = 0; i < k; i++)
    {
        if (feature.descriptor[i]>DESCR_MAG_THR)
        {
            feature.descriptor[i] = DESCR_MAG_THR;
        }
    }
    //第二次歸一化
    NormalizeDescr(feature);
    int int_val;//整形值  將double型轉為整形描述子
    for (int i = 0; i < k; i++)
    {
        int_val = INT_DESCR_FCTR*feature.descriptor[i];
        feature.descriptor[i] = min(255, int_val);
    }

}

4.5 生成描述子

void DescriptorRepresentation(vector<Keypoint>&features, const vector<Mat>& guass_pyr, int bins, int width)
{
    double ***hist;
    for (int i = 0; i < features.size(); i++)
    {
        hist = CalculateDescrHist(guass_pyr[features[i].octave*(INTERVALS + 3) + features[i].interval], features[i].x, features[i].y, features[i].octave_scale, features[i].ori, bins, width);
        HistToDescriptor(hist, width, bins, features[i]);
        //釋放空間
        for (int j = 0; j < width; j++)
        {
            for (int k = 0; k < width; k++)
            {
                delete[] hist[j][k];
            }
            delete[] hist[j];
        }
        delete[] hist;
    }
}

SIFT演算法特徵描述子構建---特徵描述子構建原理及程式碼

0.引言

4 特徵描述子構建

4.1 確定描述子區域

4.2 座標軸旋轉為關鍵點的方向

4.3 將子區域內的梯度值插值加權分配到8 個方向上

4.4 歸一化及門限

4.5 生成描述子

SIFT演算法特徵描述子構建---關鍵點定位原理及程式碼

sift演算法特徵描述子構建程式碼實現--梯度直方圖生成原理及程式碼

SIFT演算法特徵描述子構建---特徵描述子構建原理及程式碼

【機器學習】Apriori演算法——原理及程式碼實現（Python版）

【演算法學習】AVL平衡二叉搜尋樹原理及各項操作程式設計實現（C++）

CVPR2015跟蹤演算法CFLB原理及程式碼解析

【特徵匹配】BRIEF特徵描述子原理及原始碼解析

SIFT特徵點檢測，特徵點描述，特徵點匹配理解

特徵提取與檢測（二） --- SIFT演算法

移動推薦演算法（三）：特徵構建

經典演算法研究系列九影象特徵提取與匹配之SIFT演算法

點特徵直方圖（PFH）描述（Point Feature Histograms (PFH) descriptors）

特徵點檢測學習_1(sift演算法)

SIFT演算法與SURF演算法特徵檢測效率對比

利用RobHess原始碼實現SIFT演算法及RANSAC去錯的影象特徵提取匹配及去除錯匹配

SIFT演算法描述

基於影象配準的影象特徵檢測之sift演算法----sift演算法總結

經典演算法研究系列：九、影象特徵提取與匹配之SIFT演算法

影象特徵提取與匹配之SIFT演算法

特徵點匹配——SIFT演算法詳解

SIFT演算法特徵描述子構建---特徵描述子構建原理及程式碼

0.引言

4 特徵描述子構建

4.1 確定描述子區域

4.2 座標軸旋轉為關鍵點的方向

4.3 將子區域內的梯度值插值加權分配到8 個方向上

4.4 歸一化及門限

4.5 生成描述子

相關推薦