影象金字塔以及拉普拉斯融合
本文將介紹影象金字塔以及拉普拉斯融合的相關知識。
影象金字塔
================================================
一般的的線性變換通過將一幅影象乘以transform函式分成不同的components。離散傅立葉變換、離散餘弦變換、奇異值分解 和 小波變換 都以拉普拉斯金字塔和其他獎取樣變換為簡單基礎。
真實數字影象包括一系列物體和特徵(不同scales、orientation和角度下的lines, shapes, patterns, edges)
the simple process for a pyramid with an arbitrary number of levels:
平滑影象->將影象進行下采樣(常取取樣率r=2) 而獲得,同樣的操作反覆做,金字塔層數逐漸上升,空間取樣密度逐漸下降。(如下圖)這個多維表示就像一個金字塔,其中fi表示影象,li表示低通濾波結果,hi表示高通濾波結果。li / hi通過將影象與高通/低通濾波器卷積而得。
與之相反,金字塔重建通過上取樣獲得。
以影象金字塔為基礎的雙邊濾波器是一個影象細節增強和操作的很好的框架。
影象融合(Image Blending)
================================================
原理:
1.建立兩幅影象的拉普拉斯金字塔
2.求高斯金字塔(掩模金字塔-為了拼接左右兩幅影象)
3. 進行拼接blendLapPyrs() ; 在每一層上將左右laplacian影象直接拼起來得結果金字塔resultLapPyr
4.重建影象: 從最高層結果圖
//將左右laplacian影象拼成的resultLapPyr金字塔中每一層,從上到下插值放大並和下一層相加,即得blend影象結果(reconstructImgFromLapPyramid)
Code:
配置環境:
VS2010+opencv 2.3.1(2.2版本以上均可)
-
#include
"opencv2/opencv.hpp"
-
using
namespace cv;
-
-
/************************************************************************/
-
/* 說明:
-
*金字塔從下到上依次為 [0,1,...,level-1] 層
-
*blendMask 為影象的掩模
-
*maskGaussianPyramid為金字塔每一層的掩模
-
*resultLapPyr 存放每層金字塔中直接用左右兩圖Laplacian變換拼成的影象
-
*/
-
/************************************************************************/
-
-
-
class LaplacianBlending {
-
private:
-
Mat_<Vec3f> left;
-
Mat_<Vec3f> right;
-
Mat_<
float> blendMask;
-
-
vector<Mat_<Vec3f> > leftLapPyr,rightLapPyr,resultLapPyr;
//Laplacian Pyramids
-
Mat leftHighestLevel, rightHighestLevel, resultHighestLevel;
-
vector<Mat_<Vec3f> > maskGaussianPyramid;
//masks are 3-channels for easier multiplication with RGB
-
-
int levels;
-
-
void buildPyramids() {
-
buildLaplacianPyramid(left,leftLapPyr,leftHighestLevel);
-
buildLaplacianPyramid(right,rightLapPyr,rightHighestLevel);
-
buildGaussianPyramid();
-
}
-
-
void buildGaussianPyramid() {
//金字塔內容為每一層的掩模
-
assert(leftLapPyr.size()>
0);
-
-
maskGaussianPyramid.clear();
-
Mat currentImg;
-
cvtColor(blendMask, currentImg, CV_GRAY2BGR);
//store color img of blend mask into maskGaussianPyramid
-
maskGaussianPyramid.push_back(currentImg);
//0-level
-
-
currentImg = blendMask;
-
for (
int l=
1; l<levels+
1; l++) {
-
Mat _down;
-
if (leftLapPyr.size() > l)
-
pyrDown(currentImg, _down, leftLapPyr[l].size());
-
else
-
pyrDown(currentImg, _down, leftHighestLevel.size());
//lowest level
-
-
Mat down;
-
cvtColor(_down, down, CV_GRAY2BGR);
-
maskGaussianPyramid.push_back(down);
//add color blend mask into mask Pyramid
-
currentImg = _down;
-
}
-
}
-
-
void buildLaplacianPyramid(const Mat& img, vector<Mat_<Vec3f> >& lapPyr, Mat& HighestLevel) {
-
lapPyr.clear();
-
Mat currentImg = img;
-
for (
int l=
0; l<levels; l++) {
-
Mat down,up;
-
pyrDown(currentImg, down);
-
pyrUp(down, up,currentImg.size());
-
Mat lap = currentImg - up;
-
lapPyr.push_back(lap);
-
currentImg = down;
-
}
-
currentImg.copyTo(HighestLevel);
-
}
-
-
Mat_<Vec3f> reconstructImgFromLapPyramid() {
-
//將左右laplacian影象拼成的resultLapPyr金字塔中每一層
-
//從上到下插值放大並相加,即得blend影象結果
-
Mat currentImg = resultHighestLevel;
-
for (
int l=levels
-1; l>=
0; l--) {
-
Mat up;
-
-
pyrUp(currentImg, up, resultLapPyr[l].size());
-
currentImg = up + resultLapPyr[l];
-
}
-
return currentImg;
-
}
-
-
void blendLapPyrs() {
-
//獲得每層金字塔中直接用左右兩圖Laplacian變換拼成的影象resultLapPyr
-
resultHighestLevel = leftHighestLevel.mul(maskGaussianPyramid.back()) +
-
rightHighestLevel.mul(Scalar(
1.0,
1.0,
1.0) - maskGaussianPyramid.back());
-
for (
int l=
0; l<levels; l++) {
-
Mat A = leftLapPyr[l].mul(maskGaussianPyramid[l]);
-
Mat antiMask = Scalar(
1.0,
1.0,
1.0) - maskGaussianPyramid[l];
-
Mat B = rightLapPyr[l].mul(antiMask);
-
Mat_<Vec3f> blendedLevel = A + B;
-
-
resultLapPyr.push_back(blendedLevel);
-
}
-
}
-
-
public:
-
LaplacianBlending(
const Mat_<Vec3f>& _left,
const Mat_<Vec3f>& _right,
const Mat_<
float>& _blendMask,
int _levels):
//construct function, used in LaplacianBlending lb(l,r,m,4);
-
left(_left),right(_right),blendMask(_blendMask),levels(_levels)
-
{
-
assert(_left.size() == _right.size());
-
assert(_left.size() == _blendMask.size());
-
buildPyramids();
//construct Laplacian Pyramid and Gaussian Pyramid
-
blendLapPyrs();
//blend left & right Pyramids into one Pyramid
-
};
-
-
Mat_<Vec3f> blend() {
-
return reconstructImgFromLapPyramid();
//reconstruct Image from Laplacian Pyramid
-
}
-
};
-
-
Mat_<Vec3f> LaplacianBlend(
const Mat_<Vec3f>& l,
const Mat_<Vec3f>& r,
const Mat_<
float>& m) {
-
LaplacianBlending lb(l,r,m,4);
-
return lb.blend();
-
}
-
-
int main() {
-
Mat l8u = imread(
"left.png");
-
Mat r8u = imread(
"right.png");
-
-
imshow(
"left",l8u);
-
imshow(
"right",r8u);
-
-
Mat_<Vec3f> l; l8u.convertTo(l,CV_32F,
1.0/
255.0);
//Vec3f表示有三個通道,即 l[row][column][depth]
-
Mat_<Vec3f> r; r8u.convertTo(r,CV_32F,
1.0/
255.0);
-
/***************** void convertTo( OutputArray m, int rtype, double alpha=1, double beta=0 ) const;******************/
-
/* Performs linear transformation on every source array element:
-
dst(x,y,c) = scale*src(x,y,alpha)+beta.
-
Arbitrary combination of input and output array depths are allowed
-
(number of channels must be the same), thus the function can be used
-
for type conversion */
-
-
//create blend mask matrix m
-
Mat_<
float> m(l.rows,l.cols,
0.0);
//將m全部賦值為0
-
m(Range::all(),Range(
0,m.cols/
2)) =
1.0;
//取m全部行&[0,m.cols/2]列,賦值為1.0
-
-
Mat_<Vec3f> blend = LaplacianBlend(l, r, m);
-
imshow(
"blended",blend);
-
-
waitKey(
0);
-
return
0;
-
}
效果圖: