影象金字塔以及拉普拉斯融合

阿新 • • 發佈：2018-11-28

本文將介紹影象金字塔以及拉普拉斯融合的相關知識。

影象金字塔

================================================

一般的線性變換通過將一幅影象乘以transform函式，把影象分成不同的components。離散傅立葉變換、離散餘弦變換、奇異值分解和小波變換都以拉普拉斯金字塔和其他降取樣變換為簡單基礎。

真實數字影象包括一系列物體和特徵（不同scales、orientation和角度下的lines, shapes, patterns, edges）

the simple process for a pyramid with an arbitrary number of levels：

平滑影象->將影象進行下取樣（常取取樣率r=2）而獲得下一層，同樣的操作反覆做，金字塔層數逐漸上升，空間取樣密度逐漸下降。（如下圖）這個多維表示就像一個金字塔，其中fi表示影象，li表示低通濾波結果，hi表示高通濾波結果。li / hi通過將影象與低通/高通濾波器卷積而得。

與之相反，金字塔重建通過上取樣獲得。

以影象金字塔為基礎的雙邊濾波器是一個影象細節增強和操作的很好的框架。

影象融合（Image Blending）

================================================

原理：

1. 建立兩幅影象的拉普拉斯金字塔
2. 求高斯金字塔（掩模金字塔-為了拼接左右兩幅影象）
3. 進行拼接blendLapPyrs()：在每一層上將左右laplacian影象按該層掩模加權拼起來，得結果金字塔resultLapPyr
4. 重建影象（reconstructImgFromLapPyramid）：從最高層結果圖開始，將左右laplacian影象拼成的resultLapPyr金字塔中每一層，從上到下插值放大並和下一層相加，即得blend影象結果

Code：
配置環境：
VS2010+opencv 2.3.1(2.2版本以上均可)


  
   
    
     
    
    
     
      #include <cassert>
      #include <iostream>
      #include <vector>

      #include "opencv2/opencv.hpp"
     
    
   
    
     
    
    
     
      using 
      namespace cv;
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     
      /************************************************************************/
     
    
   
    
     
    
    
     
      /* 說明：
     
    
   
    
     
    
    
     
      *金字塔從下到上依次為 [0,1，...，level-1] 層
     
    
   
    
     
    
    
     
      *blendMask 為影象的掩模
     
    
   
    
     
    
    
     
      *maskGaussianPyramid為金字塔每一層的掩模
     
    
   
    
     
    
    
     
      *resultLapPyr 存放每層金字塔中直接用左右兩圖Laplacian變換拼成的影象
     
    
   
    
     
    
    
     
      */
     
    
   
    
     
    
    
     
      /************************************************************************/
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     
      class LaplacianBlending {
     
    
   
    
     
    
    
     
      private:
     
    
   
    
     
    
    
     
      	Mat_<Vec3f> left;
     
    
   
    
     
    
    
     
      	Mat_<Vec3f> right;
     
    
   
    
     
    
    
     
      	Mat_<
      float> blendMask;
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     	
      vector<Mat_<Vec3f> > leftLapPyr,rightLapPyr,resultLapPyr;
      //Laplacian Pyramids
     
    
   
    
     
    
    
     
      	Mat leftHighestLevel, rightHighestLevel, resultHighestLevel;
     
    
   
    
     
    
    
     	
      vector<Mat_<Vec3f> > maskGaussianPyramid; 
      //masks are 3-channels for easier multiplication with RGB
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     	
      int levels;
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     	
      void buildPyramids() {
     
    
   
    
     
    
    
     
      		buildLaplacianPyramid(left,leftLapPyr,leftHighestLevel);
     
    
   
    
     
    
    
     
      		buildLaplacianPyramid(right,rightLapPyr,rightHighestLevel);
     
    
   
    
     
    
    
     
      		buildGaussianPyramid();
     
    
   
    
     
    
    
     
      	}
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     	
      void buildGaussianPyramid() {
      //金字塔內容為每一層的掩模
     
    
   
    
     
    
    
     
      		assert(leftLapPyr.size()>
      0);
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     
      		maskGaussianPyramid.clear();
     
    
   
    
     
    
    
     
      		Mat currentImg;
     
    
   
    
     
    
    
     
      		cvtColor(blendMask, currentImg, CV_GRAY2BGR);
      //store color img of blend mask into maskGaussianPyramid
     
    
   
    
     
    
    
     
      		maskGaussianPyramid.push_back(currentImg); 
      //0-level
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     
      		currentImg = blendMask;
     
    
   
    
     
    
    
     		
      for (
      int l=
      1; l<levels+
      1; l++) {
     
    
   
    
     
    
    
     
      			Mat _down;
     
    
   
    
     
    
    
     			
      if (leftLapPyr.size() > l)
     
    
   
    
     
    
    
     
      				pyrDown(currentImg, _down, leftLapPyr[l].size());
     
    
   
    
     
    
    
     			
      else
     
    
   
    
     
    
    
     
      				pyrDown(currentImg, _down, leftHighestLevel.size()); 
      //lowest level
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     
      			Mat down;
     
    
   
    
     
    
    
     
      			cvtColor(_down, down, CV_GRAY2BGR);
     
    
   
    
     
    
    
     
      			maskGaussianPyramid.push_back(down);
      //add color blend mask into mask Pyramid
     
    
   
    
     
    
    
     
      			currentImg = _down;
     
    
   
    
     
    
    
     
      		}
     
    
   
    
     
    
    
     
      	}
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     	
      void buildLaplacianPyramid(const Mat& img, vector<Mat_<Vec3f> >& lapPyr, Mat& HighestLevel) {
     
    
   
    
     
    
    
     
      		lapPyr.clear();
     
    
   
    
     
    
    
     
      		Mat currentImg = img;
     
    
   
    
     
    
    
     		
      for (
      int l=
      0; l<levels; l++) {
     
    
   
    
     
    
    
     
      			Mat down,up;
     
    
   
    
     
    
    
     
      			pyrDown(currentImg, down);
     
    
   
    
     
    
    
     
      			pyrUp(down, up,currentImg.size());
     
    
   
    
     
    
    
     
      			Mat lap = currentImg - up;
     
    
   
    
     
    
    
     
      			lapPyr.push_back(lap);
     
    
   
    
     
    
    
     
      			currentImg = down;
     
    
   
    
     
    
    
     
      		}
     
    
   
    
     
    
    
     
      		currentImg.copyTo(HighestLevel);
     
    
   
    
     
    
    
     
      	}
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     
      	Mat_<Vec3f> reconstructImgFromLapPyramid() {
     
    
   
    
     
    
    
     		
      //將左右laplacian影象拼成的resultLapPyr金字塔中每一層
     
    
   
    
     
    
    
     		
      //從上到下插值放大並相加，即得blend影象結果
     
    
   
    
     
    
    
     
      		Mat currentImg = resultHighestLevel;
     
    
   
    
     
    
    
     		
      for (
      int l=levels
      -1; l>=
      0; l--) {
     
    
   
    
     
    
    
     
      			Mat up;
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     
      			pyrUp(currentImg, up, resultLapPyr[l].size());
     
    
   
    
     
    
    
     
      			currentImg = up + resultLapPyr[l];
     
    
   
    
     
    
    
     
      		}
     
    
   
    
     
    
    
     		
      return currentImg;
     
    
   
    
     
    
    
     
      	}
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     	
      void blendLapPyrs() {
     
    
   
    
     
    
    
     		
      //獲得每層金字塔中直接用左右兩圖Laplacian變換拼成的影象resultLapPyr
     
    
   
    
     
    
    
     
      		resultHighestLevel = leftHighestLevel.mul(maskGaussianPyramid.back()) +
     
    
   
    
     
    
    
     
      			rightHighestLevel.mul(Scalar(
      1.0,
      1.0,
      1.0) - maskGaussianPyramid.back());
     
    
   
    
     
    
    
     		
      for (
      int l=
      0; l<levels; l++) {
     
    
   
    
     
    
    
     
      			Mat A = leftLapPyr[l].mul(maskGaussianPyramid[l]);
     
    
   
    
     
    
    
     
      			Mat antiMask = Scalar(
      1.0,
      1.0,
      1.0) - maskGaussianPyramid[l];
     
    
   
    
     
    
    
     
      			Mat B = rightLapPyr[l].mul(antiMask);
     
    
   
    
     
    
    
     
      			Mat_<Vec3f> blendedLevel = A + B;
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     
      			resultLapPyr.push_back(blendedLevel);
     
    
   
    
     
    
    
     
      		}
     
    
   
    
     
    
    
     
      	}
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     
      public:
     
    
   
    
     
    
    
     
      	LaplacianBlending(
      const Mat_<Vec3f>& _left, 
      const Mat_<Vec3f>& _right, 
      const Mat_<
      float>& _blendMask, 
      int _levels):
      //construct function, used in LaplacianBlending lb(l,r,m,4);
     
    
   
    
     
    
    
     
      	  left(_left),right(_right),blendMask(_blendMask),levels(_levels)
     
    
   
    
     
    
    
     
      	  {
     
    
   
    
     
    
    
     
      		  assert(_left.size() == _right.size());
     
    
   
    
     
    
    
     
      		  assert(_left.size() == _blendMask.size());
     
    
   
    
     
    
    
     
      		  buildPyramids();	
      //construct Laplacian Pyramid and Gaussian Pyramid
     
    
   
    
     
    
    
     
      		  blendLapPyrs();	
      //blend left & right Pyramids into one Pyramid
     
    
   
    
     
    
    
     
      	  };
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     
      	  Mat_<Vec3f> blend() {
     
    
   
    
     
    
    
     		  
      return reconstructImgFromLapPyramid();
      //reconstruct Image from Laplacian Pyramid
     
    
   
    
     
    
    
     
      	  }
     
    
   
    
     
    
    
     
      };
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     
      // Convenience wrapper: blends `l` and `r` with mask `m` using a Laplacian
      // pyramid and returns the blended image.
      //   l, r   : images to blend (same size).
      //   m      : single-channel blend mask of the same size.
      //   levels : number of pyramid levels; defaults to 4, the depth this
      //            function previously hard-coded, so existing three-argument
      //            calls behave as before.
      Mat_<Vec3f> LaplacianBlend(const Mat_<Vec3f>& l,
                                 const Mat_<Vec3f>& r,
                                 const Mat_<float>& m,
                                 int levels = 4) {
          LaplacianBlending lb(l, r, m, levels);
          return lb.blend();
      }
     
    
   
    
     
    
    
      
     
    
   
    
     
    
    
     
      // Demo: loads left.png and right.png, blends them with a mask that is 1.0
      // on the left half and 0.0 on the right half, and shows all three images.
      // Returns 0 on success, 1 if an image cannot be loaded or the two images
      // differ in size.
      int main() {
          Mat l8u = imread("left.png");
          Mat r8u = imread("right.png");

          // imread returns an empty Mat when the file cannot be read; stop here
          // instead of failing later inside imshow/convertTo.
          if (l8u.empty() || r8u.empty()) {
              std::cerr << "Failed to load left.png and/or right.png" << std::endl;
              return 1;
          }
          // The blender requires both inputs to have the same size.
          if (l8u.size() != r8u.size()) {
              std::cerr << "left.png and right.png must have the same size" << std::endl;
              return 1;
          }

          imshow("left", l8u);
          imshow("right", r8u);

          // Convert to floating point, scaling by 1/255.
          // Mat::convertTo(dst, rtype, alpha, beta) applies
          //   dst = alpha * src + beta
          // to every element; the channel count is unchanged, only the depth.
          // Vec3f means three float channels per pixel.
          Mat_<Vec3f> l;
          l8u.convertTo(l, CV_32F, 1.0 / 255.0);
          Mat_<Vec3f> r;
          r8u.convertTo(r, CV_32F, 1.0 / 255.0);

          // Blend mask: start with all zeros ...
          Mat_<float> m(l.rows, l.cols, 0.0);
          // ... then set every row of columns [0, m.cols/2) to 1.0.
          m(Range::all(), Range(0, m.cols / 2)) = 1.0;

          Mat_<Vec3f> blend = LaplacianBlend(l, r, m);
          imshow("blended", blend);

          waitKey(0);
          return 0;
      }

效果圖：

在這裡插入圖片描述

影象金字塔以及拉普拉斯融合

影象金字塔以及拉普拉斯融合

python+opencv影象金字塔融合

opencv學習筆記python實現影象金字塔（高斯金字塔與拉普拉斯金字塔）

影象融合之拉普拉斯融合（laplacian blending）

Python-OpenCV教程-8-影象金字塔融合

OpenCV計算機視覺學習（7）——影象金字塔（高斯金字塔，拉普拉斯金字塔）

機器學習--樸素貝葉斯分類，以及拉普拉斯校準

IMU校正以及姿態融合

NVP6324影象處理以及IMX6方案參考

0021-用OpenCV的pyrUp和pyrDown函式計算影象金字塔(向上/下采樣)

python opencv 影象金字塔

人臉檢測中，如何構建輸入影象金字塔

OpenCV影象金字塔提取影象輪廓

Opencv--影象金字塔

opencv(7)-影象金字塔+影象梯度

影象基礎以及互相轉換

Python3+OpenCV3影象處理（十一）—— 影象金字塔

影象金字塔與QGIS下金字塔的建立

資料結構篇：校園最短路徑導航（三：地圖影象顯示以及完整程式）

OpenCV-Python之影象金字塔

影象金字塔以及拉普拉斯融合

相關推薦