├── CMakeLists.txt
├── GaussianPyramid.cpp
├── GaussianPyramid.h
├── Image.h
├── ImageIO.h
├── ImageProcessing.h
├── OpticalFlow.h
├── OpticalFlowCode.cpp
├── README.md
├── img1.jpg
├── img2.jpg
├── init.lua
├── legend.png
├── liuflow.cpp
└── project.h


/CMakeLists.txt:
--------------------------------------------------------------------------------
 1 | CMAKE_MINIMUM_REQUIRED(VERSION 2.6 FATAL_ERROR)
 2 | CMAKE_POLICY(VERSION 2.6)
 3 | FIND_PACKAGE(Torch REQUIRED)
 4 | 
 5 | SET(src liuflow.cpp
 6 |         GaussianPyramid.cpp
 7 |         GaussianPyramid.h
 8 |         Image.h
 9 |         ImageIO.h
10 |         ImageProcessing.h
11 |         OpticalFlowCode.cpp
12 |         OpticalFlow.h
13 |         project.h)
14 | 
15 | SET(luasrc init.lua
16 |            img1.jpg
17 |            img2.jpg
18 |            legend.png)
19 | 
20 | SET(QT_MIN_VERSION "4.3.0")
21 | FIND_PACKAGE(Qt4)
22 | 
23 | IF (QT4_FOUND)
24 |   INCLUDE_DIRECTORIES (${QT_INCLUDES})
25 |   INCLUDE (${QT_USE_FILE})
26 |   LINK_DIRECTORIES (${QT_LIBRARY_DIR})
27 |   ADD_TORCH_PACKAGE(liuflow "${src}" "${luasrc}" "Vision")
28 |   TARGET_LINK_LIBRARIES(liuflow luaT TH ${QT_LIBRARIES})
29 | ENDIF (QT4_FOUND)
30 | 


--------------------------------------------------------------------------------
/GaussianPyramid.cpp:
--------------------------------------------------------------------------------
 1 | #include "GaussianPyramid.h"
 2 | #include "math.h"
 3 | 
 4 | GaussianPyramid::GaussianPyramid(void)
 5 | {
 6 | 	ImPyramid=NULL;
 7 | }
 8 | 
 9 | GaussianPyramid::~GaussianPyramid(void)
10 | {
11 | 	if(ImPyramid!=NULL)
12 | 		delete []ImPyramid;
13 | }
14 | 
15 | //---------------------------------------------------------------------------------------
16 | // function to construct the pyramid
17 | // this is the slow way
18 | //---------------------------------------------------------------------------------------
19 | /*void GaussianPyramid::ConstructPyramid(const DImage &image, double ratio, int minWidth)
20 | {
21 | 	// the ratio cannot be arbitrary numbers
22 | 	if(ratio>0.98 || ratio<0.4)
23 | 		ratio=0.75;
24 | 	// first decide how many levels
25 | 	nLevels=log((double)minWidth/image.width())/log(ratio);
26 | 	if(ImPyramid!=NULL)
27 | 		delete []ImPyramid;
28 | 	ImPyramid=new DImage[nLevels];
29 | 	ImPyramid[0].copyData(image);
30 | 	double baseSigma=(1/ratio-1);
31 | 	for(int i=1;i<nLevels;i++)
32 | 	{
33 | 		DImage foo;
34 | 		double sigma=baseSigma*i;
35 | 		image.GaussianSmoothing(foo,sigma,sigma*2.5);
36 | 		foo.imresize(ImPyramid[i],pow(ratio,i));
37 | 	}
38 | }//*/
39 | 
40 | //---------------------------------------------------------------------------------------
41 | // function to construct the pyramid
42 | // this is the fast way
43 | //---------------------------------------------------------------------------------------
44 | void GaussianPyramid::ConstructPyramid(const DImage &image, double ratio, int minWidth)
45 | {
46 | 	// the ratio cannot be arbitrary numbers
47 | 	if(ratio>0.98 || ratio<0.4)
48 | 		ratio=0.75;
49 | 	// first decide how many levels
50 | 	nLevels=log((double)minWidth/image.width())/log(ratio);
51 | 	if(ImPyramid!=NULL)
52 | 		delete []ImPyramid;
53 | 	ImPyramid=new DImage[nLevels];
54 | 	ImPyramid[0].copyData(image);
55 | 	double baseSigma=(1/ratio-1);
56 | 	int n=log(0.25)/log(ratio);
57 | 	double nSigma=baseSigma*n;
58 | 	for(int i=1;i<nLevels;i++)
59 | 	{
60 | 		DImage foo;
61 | 		if(i<=n)
62 | 		{
63 | 			double sigma=baseSigma*i;
64 | 			image.GaussianSmoothing(foo,sigma,sigma*3);
65 | 			foo.imresize(ImPyramid[i],pow(ratio,i));
66 | 		}
67 | 		else
68 | 		{
69 | 			ImPyramid[i-n].GaussianSmoothing(foo,nSigma,nSigma*3);
70 | 			double rate=(double)pow(ratio,i)*image.width()/foo.width();
71 | 			foo.imresize(ImPyramid[i],rate);
72 | 		}
73 | 	}
74 | }
75 | 
76 | void GaussianPyramid::displayTop(const char *filename)
77 | {
78 | 	ImPyramid[nLevels-1].imwrite(filename);
79 | }


--------------------------------------------------------------------------------
/GaussianPyramid.h:
--------------------------------------------------------------------------------
 1 | #ifndef _GaussianPyramid_h
 2 | #define _GaussianPyramid_h
 3 | 
 4 | #include "Image.h"
 5 | 
 6 | class GaussianPyramid
 7 | {
 8 | private:
 9 | 	DImage* ImPyramid;
10 | 	int nLevels;
11 | public:
12 | 	GaussianPyramid(void);
13 | 	~GaussianPyramid(void);
14 | 	void ConstructPyramid(const DImage& image,double ratio=0.8,int minWidth=30);
15 | 	void displayTop(const char* filename);
16 | 	inline int nlevels() const {return nLevels;};
17 | 	inline DImage& Image(int index) {return ImPyramid[index];};
18 | };
19 | 
20 | #endif


--------------------------------------------------------------------------------
/Image.h:
--------------------------------------------------------------------------------
   1 | #ifndef _Image_h
   2 | #define _Image_h
   3 | 
   4 | #include "project.h"
   5 | #include "stdio.h"
   6 | #include "memory.h"
   7 | #include "ImageProcessing.h"
   8 | #include <iostream>
   9 | 
  10 | #ifndef _MATLAB
  11 | 	#include <QString>
  12 | 	#include "ImageIO.h"
  13 | #else
  14 | 	#include "mex.h"
  15 | #endif
  16 | 
  17 | using namespace std;
  18 | 
  19 | // template class for image
  20 | template <class T>
  21 | class Image
  22 | {
  23 | protected:
  24 | 	T* pData;
  25 | 	int imWidth,imHeight,nChannels;
  26 | 	int nPixels,nElements;
  27 | 	bool IsDerivativeImage;
  28 | public:
  29 | 	Image(void);
  30 | 	Image(int width,int height,int nchannels=1);
  31 | 	Image(const T& value,int _width,int _height,int _nchannels=1);
  32 | #ifndef _MATLAB
  33 | 	Image(const QImage& image);
  34 | #endif
  35 | 	Image(const Image<T>& other);
  36 | 	~Image(void);
  37 | 	virtual Image<T>& operator=(const Image<T>& other);
  38 | 
  39 | 	virtual inline void computeDimension(){nPixels=imWidth*imHeight;nElements=nPixels*nChannels;};
  40 | 
  41 | 	virtual void allocate(int width,int height,int nchannels=1);
  42 | 	
  43 | 	template <class T1>
  44 | 	void allocate(const Image<T1>& other);
  45 | 
  46 | 	virtual void clear();
  47 | 	virtual void reset();
  48 | 	virtual void copyData(const Image<T>& other);
  49 | 	void setValue(const T& value);
  50 | 	void setValue(const T& value,int _width,int _height,int _nchannels=1);
  51 | 	
  52 | 	template <class T1>
  53 | 	void copy(const Image<T1>& other);
  54 | 
  55 | 	void im2double();
  56 | 
  57 | 	// function to access the member variables
  58 | 	inline T*& data(){return pData;};
  59 | 	inline const T*& data() const{return (const T*&)pData;};
  60 | 	inline int width() const {return imWidth;};
  61 | 	inline int height() const {return imHeight;};
  62 | 	inline int nchannels() const {return nChannels;};
  63 | 	inline int npixels() const {return nPixels;};
  64 | 	inline int nelements() const {return nElements;};
  65 | 	inline bool isDerivativeImage() const {return IsDerivativeImage;};
  66 | 	bool IsFloat () const;
  67 | 
  68 | 	template <class T1>
  69 | 	bool matchDimension  (const Image<T1>& image) const;
  70 | 
  71 | 	inline void setDerivative(bool isDerivativeImage=true){IsDerivativeImage=isDerivativeImage;};
  72 | 
  73 | 	// function to move this image to another one
  74 | 	template <class T1>
  75 | 	void moveto(Image<T1>& image,int x,int y,int width=0,int height=0);
  76 | 
  77 | 	// function of basic image operations
  78 | 	virtual bool imresize(double ratio);
  79 | 	template <class T1>
  80 | 	void imresize(Image<T1>& result,double ratio);
  81 | 	void imresize(int dstWidth,int dstHeight);
  82 | 
  83 | #ifndef _MATLAB
  84 | 	virtual bool imread(const QString& filename);
  85 | 	virtual void imread(const QImage& image);
  86 | 
  87 | 	virtual bool imwrite(const QString& filename,int quality=100) const;
  88 | 	virtual bool imwrite(const QString& filename,ImageIO::ImageType imagetype,int quality=100) const;
  89 | #else
  90 | 	virtual bool imread(const char* filename) const {return true;};
  91 | 	virtual bool imwrite(const char* filename) const {return true;};
  92 | #endif
  93 | 
  94 | 	template <class T1>
  95 | 	Image<T1> dx(bool IsAdvancedFilter=false) const;
  96 | 
  97 | 	template <class T1>
  98 | 	void dx(Image<T1>& image,bool IsAdvancedFilter=false) const;
  99 | 
 100 | 	template<class T1>
 101 | 	Image<T1> dy(bool IsAdvancedFilter=false) const;
 102 | 
 103 | 	template <class T1>
 104 | 	void dy(Image<T1>& image,bool IsAdvancedFilter=false) const;
 105 | 
 106 | 	template <class T1>
 107 | 	void GaussianSmoothing(Image<T1>& image,double sigma,int fsize) const;
 108 | 
 109 | 	template <class T1>
 110 | 	void smoothing(Image<T1>& image,double factor=4);
 111 | 
 112 | 	template <class T1>
 113 | 	Image<T1> smoothing(double factor=4);
 114 | 
 115 | 	void smoothing(double factor=4);
 116 | 
 117 | 	// funciton for filtering
 118 | 	template <class T1>
 119 | 	void imfilter(Image<T1>& image,double* filter,int fsize) const;
 120 | 
 121 | 	template <class T1>
 122 | 	Image<T1> imfilter(double* filter,int fsize);
 123 | 
 124 | 	template <class T1>
 125 | 	void imfilter_h(Image<T1>& image,double* filter,int fsize) const;
 126 | 
 127 | 	template <class T1>
 128 | 	void imfilter_v(Image<T1>& image,double* filter,int fsize) const;
 129 | 
 130 | 	template <class T1>
 131 | 	void imfilter_hv(Image<T1>& image,double* hfilter,int hfsize,double* vfilter,int vfsize) const;
 132 | 
 133 | 	// function to desaturating
 134 | 	template <class T1>
 135 | 	void desaturate(Image<T1>& image) const;
 136 | 
 137 | 	template <class T1>
 138 | 	void collapse(Image<T1>& image) const;
 139 | 
 140 | 	// function to concatenate images
 141 | 	template <class T1,class T2>
 142 | 	void concatenate(Image<T1>& destImage,const Image<T2>& addImage) const;
 143 | 
 144 | 	template <class T1>
 145 | 	Image<T> concatenate(const Image<T1>& addImage) const;
 146 | 
 147 | 	// function to separate the channels of the image
 148 | 	template <class T1,class T2>
 149 | 	void separate(unsigned firstNChannels,Image<T1>& image1,Image<T2>& image2) const;
 150 | 
 151 | 	// function to sample patch
 152 | 	template <class T1>
 153 | 	void getPatch(Image<T1>& patch,double x,double y,int fsize) const;
 154 | 
 155 | 	// function to crop the image
 156 | 	template <class T1>
 157 | 	void crop(Image<T1>& patch,int Lef,int Top,int Width,int Height) const;
 158 | 
 159 | 	// basic numerics of images
 160 | 	template <class T1,class T2>
 161 | 	void Multiply(const Image<T1>& image1,const Image<T2>& image2);
 162 | 
 163 | 	template <class T1,class T2,class T3>
 164 | 	void Multiply(const Image<T1>& image1,const Image<T2>& image2,const Image<T3>& image3);
 165 | 
 166 | 	template <class T1>
 167 | 	void Multiplywith(const Image<T1>& image1);
 168 | 
 169 | 	void Multiplywith(double value);
 170 | 
 171 | 	template <class T1,class T2>
 172 | 	void Add(const Image<T1>& image1,const Image<T2>& image2);
 173 | 
 174 | 	template <class T1,class T2>
 175 | 	void Add(const Image<T1>& image1,const Image<T2>& image2,double ratio);
 176 | 
 177 | 	void Add(const T value);
 178 | 
 179 | 	template <class T1>
 180 | 	void Add(const Image<T1>& image1,const double value);
 181 | 
 182 | 	template <class T1,class T2>
 183 | 	void Subtract(const Image<T1>& image1,const Image<T2>& image2);
 184 | 
 185 | 	// function to normalize an image
 186 | 	void normalize(Image<T>& image);
 187 | 
 188 | 	// function to compute the statistics of the image
 189 | 	double norm2() const;
 190 | 
 191 | 	template <class T1>
 192 | 	double innerproduct(Image<T1>& image) const;
 193 | 
 194 | #ifdef _MATLAB
 195 | 	template <class T1>
 196 | 	void LoadMatlabImage(const mxArray* image);
 197 | 
 198 | 	template <class T1>
 199 | 	void ConvertFromMatlab(const T1* pMatlabPlane,int _width,int _height,int _nchannels);
 200 | 
 201 | 	void OutputToMatlab(mxArray*& matrix);
 202 | 
 203 | 	template <class T1>
 204 | 	void ConvertToMatlab(T1* pMatlabPlane);
 205 | #endif
 206 | };
 207 | 
 208 | 
 209 | typedef Image<unsigned char> BiImage;
 210 | typedef Image<short int> IntImage;
 211 | typedef Image<float> FImage;
 212 | typedef Image<double> DImage;
 213 | 
 214 | //------------------------------------------------------------------------------------------
 215 | // constructor
 216 | //------------------------------------------------------------------------------------------
 217 | template <class T>
 218 | Image<T>::Image()
 219 | {
 220 | 	pData=NULL;
 221 | 	imWidth=imHeight=nChannels=nPixels=nElements=0;
 222 | 	IsDerivativeImage=false;
 223 | }
 224 | 
 225 | //------------------------------------------------------------------------------------------
 226 | // constructor with specified dimensions
 227 | //------------------------------------------------------------------------------------------
 228 | template <class T>
 229 | Image<T>::Image(int width,int height,int nchannels)
 230 | {
 231 | 	imWidth=width;
 232 | 	imHeight=height;
 233 | 	nChannels=nchannels;
 234 | 	computeDimension();
 235 | 	pData=NULL;
 236 | 	pData=new T[nElements];
 237 | 	if(nElements>0)
 238 | 		memset(pData,0,sizeof(T)*nElements);
 239 | 	IsDerivativeImage=false;
 240 | }
 241 | 
 242 | template <class T>
 243 | Image<T>::Image(const T& value,int _width,int _height,int _nchannels)
 244 | {
 245 | 	pData=NULL;
 246 | 	allocate(_width,_height,_nchannels);
 247 | 	setValue(value);
 248 | }
 249 | 
 250 | #ifndef _MATLAB
 251 | template <class T>
 252 | Image<T>::Image(const QImage& image)
 253 | {
 254 | 	pData=NULL;
 255 | 	imread(image);
 256 | }
 257 | #endif
 258 | 
 259 | template <class T>
 260 | void Image<T>::allocate(int width,int height,int nchannels)
 261 | {
 262 | 	clear();
 263 | 	imWidth=width;
 264 | 	imHeight=height;
 265 | 	nChannels=nchannels;
 266 | 	computeDimension();
 267 | 	pData=NULL;
 268 | 	pData=new T[nElements];
 269 | 	if(nElements>0)
 270 | 		memset(pData,0,sizeof(T)*nElements);
 271 | }
 272 | 
 273 | template <class T>
 274 | template <class T1>
 275 | void Image<T>::allocate(const Image<T1> &other)
 276 | {
 277 | 	allocate(other.width(),other.height(),other.nchannels());
 278 | }
 279 | 
 280 | //------------------------------------------------------------------------------------------
 281 | // copy constructor
 282 | //------------------------------------------------------------------------------------------
 283 | template <class T>
 284 | Image<T>::Image(const Image<T>& other)
 285 | {
 286 | 	pData=NULL;
 287 | 	copyData(other);
 288 | }
 289 | 
 290 | //------------------------------------------------------------------------------------------
 291 | // destructor
 292 | //------------------------------------------------------------------------------------------
 293 | template <class T>
 294 | Image<T>::~Image()
 295 | {
 296 | 	if(pData!=NULL)
 297 | 		delete []pData;
 298 | }
 299 | 
 300 | //------------------------------------------------------------------------------------------
 301 | // clear the image
 302 | //------------------------------------------------------------------------------------------
 303 | template <class T>
 304 | void Image<T>::clear()
 305 | {
 306 | 	if(pData!=NULL)
 307 | 		delete []pData;
 308 | 	pData=NULL;
 309 | 	imWidth=imHeight=nChannels=nPixels=nElements=0;
 310 | }
 311 | 
 312 | //------------------------------------------------------------------------------------------
 313 | // reset the image (reset the buffer to zero)
 314 | //------------------------------------------------------------------------------------------
 315 | template <class T>
 316 | void Image<T>::reset()
 317 | {
 318 | 	if(pData!=NULL)
 319 | 		memset(pData,0,sizeof(T)*nElements);
 320 | }
 321 | 
 322 | template <class T>
 323 | void Image<T>::setValue(const T &value)
 324 | {
 325 | 	for(int i=0;i<nElements;i++)
 326 | 		pData[i]=value;
 327 | }
 328 | 
 329 | template <class T>
 330 | void Image<T>::setValue(const T& value,int _width,int _height,int _nchannels)
 331 | {
 332 | 	if(imWidth!=_width || imHeight!=_height || nChannels!=_nchannels)
 333 | 		allocate(_width,_height,_nchannels);
 334 | 	setValue(value);
 335 | }
 336 | 
 337 | //------------------------------------------------------------------------------------------
 338 | // copy from other image
 339 | //------------------------------------------------------------------------------------------
 340 | template <class T>
 341 | void Image<T>::copyData(const Image<T>& other)
 342 | {
 343 | 	imWidth=other.imWidth;
 344 | 	imHeight=other.imHeight;
 345 | 	nChannels=other.nChannels;
 346 | 	nPixels=other.nPixels;
 347 | 	IsDerivativeImage=other.IsDerivativeImage;
 348 | 
 349 | 	if(nElements!=other.nElements)
 350 | 	{
 351 | 		nElements=other.nElements;		
 352 | 		if(pData!=NULL)
 353 | 			delete []pData;
 354 | 		pData=NULL;
 355 | 		pData=new T[nElements];
 356 | 	}
 357 | 	if(nElements>0)
 358 | 		memcpy(pData,other.pData,sizeof(T)*nElements);
 359 | }
 360 | 
 361 | template <class T>
 362 | template <class T1>
 363 | void Image<T>::copy(const Image<T1>& other)
 364 | {
 365 | 	clear();
 366 | 
 367 | 	imWidth=other.width();
 368 | 	imHeight=other.height();
 369 | 	nChannels=other.nchannels();
 370 | 	computeDimension();
 371 | 
 372 | 	IsDerivativeImage=other.isDerivativeImage();
 373 | 
 374 | 	pData=NULL;
 375 | 	pData=new T[nElements];
 376 | 	const T1*& srcData=other.data();
 377 | 	for(int i=0;i<nElements;i++)
 378 | 		pData[i]=srcData[i];
 379 | }
 380 | 
 381 | template <class T>
 382 | void Image<T>::im2double()
 383 | {
 384 | 	if(IsFloat())
 385 | 		for(int i=0;i<nElements;i++)
 386 | 			pData[i]/=255;
 387 | }
 388 | 
 389 | //------------------------------------------------------------------------------------------
 390 | // override equal operator
 391 | //------------------------------------------------------------------------------------------
 392 | template <class T>
 393 | Image<T>& Image<T>::operator=(const Image<T>& other)
 394 | {
 395 | 	copyData(other);
 396 | 	return *this;
 397 | }
 398 | 
 399 | template <class T>
 400 | bool Image<T>::IsFloat() const
 401 | {
 402 | 	if(typeid(T)==typeid(float) || typeid(T)==typeid(double) || typeid(T)==typeid(long double))
 403 | 		return true;
 404 | 	else
 405 | 		return false;
 406 | }
 407 | 
 408 | template <class T>
 409 | template <class T1>
 410 | bool Image<T>::matchDimension(const Image<T1>& image) const
 411 | {
 412 | 	if(imWidth==image.width() && imHeight==image.height() && nChannels==image.nchannels())
 413 | 		return true;
 414 | 	else
 415 | 		return false;
 416 | }
 417 | 
 418 | //------------------------------------------------------------------------------------------
 419 | // function to move this image to a dest image at (x,y) with specified width and height
 420 | //------------------------------------------------------------------------------------------
 421 | template <class T>
 422 | template <class T1>
 423 | void Image<T>::moveto(Image<T1>& image,int x0,int y0,int width,int height)
 424 | {
 425 | 	if(width==0)
 426 | 		width=imWidth;
 427 | 	if(height==0)
 428 | 		height=imHeight;
 429 | 	int NChannels=__min(nChannels,image.nchannels());
 430 | 
 431 | 	int x,y;
 432 | 	for(int i=0;i<height;i++)
 433 | 	{
 434 | 		y=y0+i;
 435 | 		if(y>=image.height())
 436 | 			break;
 437 | 		for(int j=0;j<width;j++)
 438 | 		{
 439 | 			x=x0+j;
 440 | 			if(x>=image.width())
 441 | 				break;
 442 | 			for(int k=0;k<NChannels;k++)
 443 | 				image.data()[(y*image.width()+x)*image.nchannels()+k]=pData[(i*imWidth+j)*nChannels+k];
 444 | 		}
 445 | 	}
 446 | }
 447 | 
 448 | 
 449 | //------------------------------------------------------------------------------------------
 450 | // resize the image
 451 | //------------------------------------------------------------------------------------------
 452 | template <class T>
 453 | bool Image<T>::imresize(double ratio)
 454 | {
 455 | 	if(pData==NULL)
 456 | 		return false;
 457 | 
 458 | 	T* pDstData;
 459 | 	int DstWidth,DstHeight;
 460 | 	DstWidth=(double)imWidth*ratio;
 461 | 	DstHeight=(double)imHeight*ratio;
 462 | 	pDstData=new T[DstWidth*DstHeight*nChannels];
 463 | 
 464 | 	ImageProcessing::ResizeImage(pData,pDstData,imWidth,imHeight,nChannels,ratio);
 465 | 
 466 | 	delete []pData;
 467 | 	pData=pDstData;
 468 | 	imWidth=DstWidth;
 469 | 	imHeight=DstHeight;
 470 | 	computeDimension();
 471 | 	return true;
 472 | }
 473 | 
 474 | template <class T>
 475 | template <class T1>
 476 | void Image<T>::imresize(Image<T1>& result,double ratio)
 477 | {
 478 | 	int DstWidth,DstHeight;
 479 | 	DstWidth=(double)imWidth*ratio;
 480 | 	DstHeight=(double)imHeight*ratio;
 481 | 	if(result.width()!=DstWidth || result.height()!=DstHeight || result.nchannels()!=nChannels)
 482 | 		result.allocate(DstWidth,DstHeight,nChannels);
 483 | 	ImageProcessing::ResizeImage(pData,result.data(),imWidth,imHeight,nChannels,ratio);
 484 | }
 485 | 
 486 | template <class T>
 487 | void Image<T>::imresize(int dstWidth,int dstHeight)
 488 | {
 489 | 	DImage foo(dstWidth,dstHeight,nChannels);
 490 | 	ImageProcessing::ResizeImage(pData,foo.data(),imWidth,imHeight,nChannels,dstWidth,dstHeight);
 491 | 	copyData(foo);
 492 | }
 493 | 
 494 | //------------------------------------------------------------------------------------------
 495 | // function to load the image
 496 | //------------------------------------------------------------------------------------------
 497 | #ifndef _MATLAB
 498 | template <class T>
 499 | bool Image<T>::imread(const QString &filename)
 500 | {
 501 | 	clear();
 502 | 	if(ImageIO::loadImage(filename,pData,imWidth,imHeight,nChannels))
 503 | 	{
 504 | 		computeDimension();
 505 | 		return true;
 506 | 	}
 507 | 	return false;
 508 | }
 509 | 
 510 | template <class T>
 511 | void Image<T>::imread(const QImage& image)
 512 | {
 513 | 	clear();
 514 | 	ImageIO::loadImage(image,pData,imWidth,imHeight,nChannels);
 515 | 	computeDimension();
 516 | }
 517 | 
 518 | //------------------------------------------------------------------------------------------
 519 | // function to write the image
 520 | //------------------------------------------------------------------------------------------
 521 | template <class T>
 522 | bool Image<T>::imwrite(const QString& filename,int quality) const
 523 | {
 524 | 	ImageIO::ImageType type;
 525 | 	if(IsDerivativeImage)
 526 | 		type=ImageIO::derivative;
 527 | 	else
 528 | 		type=ImageIO::standard;
 529 | 
 530 | 	return ImageIO::writeImage(filename,(const T*&)pData,imWidth,imHeight,nChannels,type,quality);
 531 | }
 532 | 
 533 | template <class T>
 534 | bool Image<T>::imwrite(const QString &filename, ImageIO::ImageType imagetype, int quality) const
 535 | {
 536 | 	return ImageIO::writeImage(filename,(const T*&)pData,imWidth,imHeight,nChannels,imagetype,quality);
 537 | }
 538 | #endif
 539 | 
 540 | //------------------------------------------------------------------------------------------
 541 | // function to get x-derivative of the image
 542 | //------------------------------------------------------------------------------------------
 543 | template <class T>
 544 | template <class T1>
 545 | void Image<T>::dx(Image<T1>& result,bool IsAdvancedFilter) const
 546 | {
 547 | 	if(matchDimension(result)==false)
 548 | 		result.allocate(imWidth,imHeight,nChannels);
 549 | 	result.reset();
 550 | 	result.setDerivative();
 551 | 	T1*& data=result.data();
 552 | 	int i,j,k,offset;
 553 | 	if(IsAdvancedFilter==false)
 554 | 		for(i=0;i<imHeight;i++)
 555 | 			for(j=0;j<imWidth-1;j++)
 556 | 			{
 557 | 				offset=i*imWidth+j;
 558 | 				for(k=0;k<nChannels;k++)
 559 | 					data[offset*nChannels+k]=(T1)pData[(offset+1)*nChannels+k]-pData[offset*nChannels+k];
 560 | 			}
 561 | 	else
 562 | 	{
 563 | 		double xFilter[5]={1,-8,0,8,-1};
 564 | 		for(i=0;i<5;i++)
 565 | 			xFilter[i]/=12;
 566 | 		ImageProcessing::hfiltering(pData,data,imWidth,imHeight,nChannels,xFilter,2);
 567 | 	}
 568 | }
 569 | 
 570 | template <class T>
 571 | template <class T1>
 572 | Image<T1> Image<T>::dx(bool IsAdvancedFilter) const
 573 | {
 574 | 	Image<T1> result;
 575 | 	dx<T1>(result,IsAdvancedFilter);
 576 | 	return result;
 577 | }
 578 | 
 579 | //------------------------------------------------------------------------------------------
 580 | // function to get y-derivative of the image
 581 | //------------------------------------------------------------------------------------------
 582 | template <class T>
 583 | template <class T1>
 584 | void Image<T>::dy(Image<T1>& result,bool IsAdvancedFilter) const
 585 | {
 586 | 	if(matchDimension(result)==false)
 587 | 		result.allocate(imWidth,imHeight,nChannels);
 588 | 	result.setDerivative();
 589 | 	T1*& data=result.data();
 590 | 	int i,j,k,offset;
 591 | 	if(IsAdvancedFilter==false)
 592 | 		for(i=0;i<imHeight-1;i++)
 593 | 			for(j=0;j<imWidth;j++)
 594 | 			{
 595 | 				offset=i*imWidth+j;
 596 | 				for(k=0;k<nChannels;k++)
 597 | 					data[offset*nChannels+k]=(T1)pData[(offset+imWidth)*nChannels+k]-pData[offset*nChannels+k];
 598 | 			}
 599 | 	else
 600 | 	{
 601 | 		double yFilter[5]={1,-8,0,8,-1};
 602 | 		for(i=0;i<5;i++)
 603 | 			yFilter[i]/=12;
 604 | 		ImageProcessing::vfiltering(pData,data,imWidth,imHeight,nChannels,yFilter,2);
 605 | 	}
 606 | }
 607 | 
 608 | template <class T>
 609 | template <class T1>
 610 | Image<T1> Image<T>::dy(bool IsAdvancedFilter) const
 611 | {
 612 | 	Image<T1> result;
 613 | 	dy<T1>(result,IsAdvancedFilter);
 614 | 	return result;
 615 | }
 616 | 
 617 | //------------------------------------------------------------------------------------------
 618 | // function to do Gaussian smoothing
 619 | //------------------------------------------------------------------------------------------
 620 | template <class T>
 621 | template <class T1>
 622 | void Image<T>::GaussianSmoothing(Image<T1>& image,double sigma,int fsize) const 
 623 | {
 624 | 	Image<T1> foo;
 625 | 	// constructing the 1D gaussian filter
 626 | 	double* gFilter;
 627 | 	gFilter=new double[fsize*2+1];
 628 | 	double sum=0;
 629 | 	sigma=sigma*sigma*2;
 630 | 	for(int i=-fsize;i<=fsize;i++)
 631 | 	{
 632 | 		gFilter[i+fsize]=exp(-(double)(i*i)/sigma);
 633 | 		sum+=gFilter[i+fsize];
 634 | 	}
 635 | 	for(int i=0;i<2*fsize+1;i++)
 636 | 		gFilter[i]/=sum;
 637 | 
 638 | 	// apply filtering
 639 | 	imfilter_hv(image,gFilter,fsize,gFilter,fsize);
 640 | 
 641 | 	delete gFilter;
 642 | }
 643 | 
 644 | //------------------------------------------------------------------------------------------
 645 | // function to smooth the image using a simple 3x3 filter
 646 | // the filter is [1 factor 1]/(factor+2), applied horizontally and vertically
 647 | //------------------------------------------------------------------------------------------
 648 | template <class T>
 649 | template <class T1>
 650 | void Image<T>::smoothing(Image<T1>& image,double factor)
 651 | {
 652 | 	// build 
 653 | 	double filter2D[9]={1,0,1,0, 0, 0,1, 0,1};
 654 | 	filter2D[1]=filter2D[3]=filter2D[5]=filter2D[7]=factor;
 655 | 	filter2D[4]=factor*factor;
 656 | 	for(int i=0;i<9;i++)
 657 | 		filter2D[i]/=(factor+2)*(factor+2);
 658 | 
 659 | 	if(matchDimension(image)==false)
 660 | 		image.allocate(imWidth,imHeight,nChannels);
 661 | 	imfilter<T1>(image,filter2D,1);
 662 | }
 663 | 
 664 | template <class T>
 665 | template <class T1>
 666 | Image<T1> Image<T>::smoothing(double factor)
 667 | {
 668 | 	Image<T1> result;
 669 | 	smoothing(result,factor);
 670 | 	return result;
 671 | }
 672 | 
 673 | template <class T>
 674 | void Image<T>::smoothing(double factor)
 675 | {
 676 | 	Image<T> result(imWidth,imHeight,nChannels);
 677 | 	smoothing(result,factor);
 678 | 	copyData(result);
 679 | }
 680 | 
 681 | //------------------------------------------------------------------------------------------
 682 | //	 function of image filtering
 683 | //------------------------------------------------------------------------------------------
 684 | template <class T>
 685 | template <class T1>
 686 | void Image<T>::imfilter(Image<T1>& image,double* filter,int fsize) const
 687 | {
 688 | 	if(matchDimension(image)==false)
 689 | 		image.allocate(imWidth,imHeight,nChannels);
 690 | 	ImageProcessing::filtering(pData,image.data(),imWidth,imHeight,nChannels,filter,fsize);
 691 | }
 692 | 
 693 | template <class T>
 694 | template <class T1>
 695 | Image<T1> Image<T>::imfilter(double *filter, int fsize)
 696 | {
 697 | 	Image<T1> result;
 698 | 	imfilter(result,filter,fsize);
 699 | 	return result;
 700 | }
 701 | 
 702 | template <class T>
 703 | template <class T1>
 704 | void Image<T>::imfilter_h(Image<T1>& image,double* filter,int fsize) const
 705 | {
 706 | 	if(matchDimension(image)==false)
 707 | 		image.allocate(imWidth,imHeight,nChannels);
 708 | 	ImageProcessing::hfiltering(pData,image.data(),imWidth,imHeight,nChannels,filter,fsize);
 709 | }
 710 | 
 711 | template <class T>
 712 | template <class T1>
 713 | void Image<T>::imfilter_v(Image<T1>& image,double* filter,int fsize) const
 714 | {
 715 | 	if(matchDimension(image)==false)
 716 | 		image.allocate(imWidth,imHeight,nChannels);
 717 | 	ImageProcessing::vfiltering(pData,image.data(),imWidth,imHeight,nChannels,filter,fsize);
 718 | }
 719 | 
 720 | 
 721 | template <class T>
 722 | template <class T1>
 723 | void Image<T>::imfilter_hv(Image<T1> &image, double *hfilter, int hfsize, double *vfilter, int vfsize) const
 724 | {
 725 | 	if(matchDimension(image)==false)
 726 | 		image.allocate(imWidth,imHeight,nChannels);
 727 | 	T1* pTempBuffer;
 728 | 	pTempBuffer=new T1[nElements];
 729 | 	ImageProcessing::hfiltering(pData,pTempBuffer,imWidth,imHeight,nChannels,hfilter,hfsize);
 730 | 	ImageProcessing::vfiltering(pTempBuffer,image.data(),imWidth,imHeight,nChannels,vfilter,vfsize);
 731 |     delete pTempBuffer;
 732 | }
 733 | 
 734 | //------------------------------------------------------------------------------------------
 735 | //	 function for desaturation
 736 | //------------------------------------------------------------------------------------------
 737 | template <class T>
 738 | template <class T1>
 739 | void Image<T>::desaturate(Image<T1> &image) const
 740 | {
 741 | 	if(nChannels!=3)
 742 | 	{
 743 | 		collapse(image);
 744 | 		return;
 745 | 	}
 746 | 	if(!(image.width()==imWidth && image.height()==imHeight && image.nChannels==1))
 747 | 		image.allocate(imWidth,imHeight,1);
 748 | 	T1* data=image.data();
 749 | 	int offset;
 750 | 	for(int i=0;i<nPixels;i++)
 751 | 	{
 752 | 		offset=i*3;
 753 | 		data[i]=(double)pData[offset]*.299+pData[offset+1]*.587+pData[offset+2]*.114;
 754 | 	}
 755 | }
 756 | 
 757 | template <class T>
 758 | template <class T1>
 759 | void Image<T>::collapse(Image<T1> &image) const
 760 | {
 761 | 	if(!(image.width()==imWidth && image.height()==imHeight && image.nChannels==1))
 762 | 		image.allocate(imWidth,imHeight,1);
 763 | 	T1* data=image.data();
 764 | 	int offset;
 765 | 	double temp;
 766 | 	for(int i=0;i<nPixels;i++)
 767 | 	{
 768 | 		offset=i*nChannels;
 769 | 		temp=0;
 770 | 		for(int j=0;j<nChannels;j++)
 771 | 			temp+=pData[offset+j];
 772 | 		data[i]=temp/nChannels;
 773 | 	}
 774 | }
 775 | 
 776 | //------------------------------------------------------------------------------------------
 777 | //  function to concatenate two images
 778 | //------------------------------------------------------------------------------------------
 779 | template <class T>
 780 | template <class T1,class T2>
 781 | void Image<T>::concatenate(Image<T1> &destImage, const Image<T2> &addImage) const
 782 | {
 783 | 	if(addImage.width()!=imWidth || addImage.height()!=imHeight)
 784 | 	{
 785 | 		destImage.copy(*this);
 786 | 		return;
 787 | 	}
 788 | 	int extNChannels=nChannels+addImage.nchannels();
 789 | 	if(destImage.width()!=imWidth || destImage.height()!=imHeight || destImage.nchannels()!=extNChannels)
 790 | 		destImage.allocate(imWidth,imHeight,extNChannels);
 791 | 	int offset;
 792 | 	T1*& pDestData=destImage.data();
 793 | 	const T2*& pAddData=addImage.data();
 794 | 	for(int i=0;i<imHeight;i++)
 795 | 		for(int j=0;j<imWidth;j++)
 796 | 		{
 797 | 			offset=i*imWidth+j;
 798 | 			for(int k=0;k<nChannels;k++)
 799 | 				pDestData[offset*extNChannels+k]=pData[offset*nChannels+k];
 800 | 			for(int k=nChannels;k<extNChannels;k++)
 801 | 				pDestData[offset*extNChannels+k]=pAddData[offset*addImage.nchannels()+k-nChannels];
 802 | 		}
 803 | }
 804 | 
 805 | template <class T>
 806 | template <class T1>
 807 | Image<T> Image<T>::concatenate(const Image<T1> &addImage) const
 808 | {
 809 | 	Image<T> destImage;
 810 | 	concatenate(destImage,addImage);
 811 | 	return destImage;
 812 | }
 813 | 
 814 | //------------------------------------------------------------------------------------------
 815 | // function to separate the image into two
 816 | //------------------------------------------------------------------------------------------
 817 | template <class T>
 818 | template <class T1,class T2>
 819 | void Image<T>::separate(unsigned int firstNChannels, Image<T1> &image1, Image<T2> &image2) const
 820 | {
 821 | 	image1.IsDerivativeImage=IsDerivativeImage;
 822 | 	image2.IsDerivativeImage=IsDerivativeImage;
 823 | 
 824 | 	if(firstNChannels>=nChannels)
 825 | 	{
 826 | 		image1=*this;
 827 | 		image2.allocate(imWidth,imHeight,0);
 828 | 		return;
 829 | 	}
 830 | 	if(firstNChannels==0)
 831 | 	{
 832 | 		image1.allocate(imWidth,imHeight,0);
 833 | 		image2=*this;
 834 | 		return;
 835 | 	}
 836 | 	int secondNChannels=nChannels-firstNChannels;
 837 | 	if(image1.width()!=imWidth || image1.height()!=imHeight || image1.nchannels()!=firstNChannels)
 838 | 		image1.allocate(imWidth,imHeight,firstNChannels);
 839 | 	if(image2.width()!=imWidth || image2.height()!=imHeight || image2.nchannels()!=secondNChannels)
 840 | 		image2.allocate(imWidth,imHeight,secondNChannels);
 841 | 
 842 | 	for(int i=0;i<imHeight;i++)
 843 | 		for(int j=0;j<imWidth;j++)
 844 | 		{
 845 | 			int offset=i*imWidth+j;
 846 | 			for(int k=0;k<firstNChannels;k++)
 847 | 				image1.pData[offset*firstNChannels+k]=pData[offset*nChannels+k];
 848 | 			for(int k=firstNChannels;k<nChannels;k++)
 849 | 				image2.pData[offset*secondNChannels+k-firstNChannels]=pData[offset*nChannels+k];
 850 | 		}
 851 | }
 852 | 
 853 | //------------------------------------------------------------------------------------------
 854 | // function to sample a square patch of the image around (x,y)
 855 | //------------------------------------------------------------------------------------------
 856 | template <class T>
 857 | template <class T1>
 858 | void Image<T>::getPatch(Image<T1>& patch,double x,double y,int wsize) const
 859 | {
 860 | 	int wlength=wsize*2+1;
 861 | 	if(patch.width()!=wlength || patch.height()!=wlength || patch.nchannels()!=nChannels)
 862 | 		patch.allocate(wlength,wlength,nChannels);
 863 | 	else
 864 | 		patch.reset();
 865 | 	ImageProcessing::getPatch(pData,patch.data(),imWidth,imHeight,nChannels,x,y,wsize);
 866 | }
 867 | 
 868 | //------------------------------------------------------------------------------------------
 869 | // function to crop an image
 870 | //------------------------------------------------------------------------------------------
 871 | template <class T>
 872 | template <class T1>
 873 | void Image<T>::crop(Image<T1>& patch,int Left,int Top,int Width,int Height) const
 874 | {
 875 | 	if(patch.width()!=Width || patch.height()!=Height || patch.nchannels()!=nChannels)
 876 | 		patch.allocate(Width,Height,nChannels);
 877 | 	// make sure that the cropping is valid
 878 | 	if(Left<0 || Top<0 || Left>=imWidth || Top>=imHeight)
 879 | 	{
 880 | 		cout<<"The cropping coordinate is outside the image boundary!"<<endl;
 881 | 		return;
 882 | 	}
 883 | 	if(Width<0 || Height<0 || Width+Left>imWidth || Height+Top>imHeight)
 884 | 	{
 885 | 		cout<<"The patch to crop is invalid!"<<endl;
 886 | 		return;
 887 | 	}
 888 | 	ImageProcessing::cropImage(pData,imWidth,imHeight,nChannels,patch.data(),Left,Top,Width,Height);
 889 | }
 890 | 
 891 | //------------------------------------------------------------------------------------------
 892 | // functions to store the element-wise product of the given images in the current image
 893 | //------------------------------------------------------------------------------------------
 894 | template <class T>
 895 | template <class T1,class T2,class T3>
 896 | void Image<T>::Multiply(const Image<T1>& image1,const Image<T2>& image2,const Image<T3>& image3)
 897 | {
 898 | 	if(image1.matchDimension(image2)==false || image2.matchDimension(image3)==false)
 899 | 	{
 900 | 		cout<<"Error in image dimensions--function Image<T>::Multiply()!"<<endl;
 901 | 		return;
 902 | 	}
 903 | 	if(matchDimension(image1)==false)
 904 | 		allocate(image1);
 905 | 
 906 | 	const T1*& pData1=image1.data();
 907 | 	const T2*& pData2=image2.data();
 908 | 	const T3*& pData3=image3.data();
 909 | 
 910 | 	for(int i=0;i<nElements;i++)
 911 | 		pData[i]=pData1[i]*pData2[i]*pData3[i];
 912 | }
 913 | 
 914 | template <class T>
 915 | template <class T1,class T2>
 916 | void Image<T>::Multiply(const Image<T1>& image1,const Image<T2>& image2)
 917 | {
 918 | 	if(image1.matchDimension(image2)==false)
 919 | 	{
 920 | 		cout<<"Error in image dimensions--function Image<T>::Multiply()!"<<endl;
 921 | 		return;
 922 | 	}
 923 | 	if(matchDimension(image1)==false)
 924 | 		allocate(image1);
 925 | 
 926 | 	const T1*& pData1=image1.data();
 927 | 	const T2*& pData2=image2.data();
 928 | 
 929 | 	for(int i=0;i<nElements;i++)
 930 | 		pData[i]=pData1[i]*pData2[i];
 931 | }
 932 | 
 933 | template <class T>
 934 | template <class T1>
 935 | void Image<T>::Multiplywith(const Image<T1> &image1)
 936 | {
 937 | 	if(matchDimension(image1)==false)
 938 | 	{
 939 | 		cout<<"Error in image dimensions--function Image<T>::Multiplywith()!"<<endl;
 940 | 		return;
 941 | 	}
 942 | 	const T1*& pData1=image1.data();
 943 | 	for(int i=0;i<nElements;i++)
 944 | 		pData[i]*=pData1[i];
 945 | }
 946 | 
 947 | template <class T>
 948 | void Image<T>::Multiplywith(double value)
 949 | {
 950 | 	for(int i=0;i<nElements;i++)
 951 | 		pData[i]*=value;
 952 | }
 953 | 
 954 | //------------------------------------------------------------------------------------------
 955 | // functions to add images element-wise, storing the result in the current image
 956 | //------------------------------------------------------------------------------------------
 957 | template <class T>
 958 | template <class T1,class T2>
 959 | void Image<T>::Add(const Image<T1>& image1,const Image<T2>& image2)
 960 | {
 961 | 	if(image1.matchDimension(image2)==false)
 962 | 	{
 963 | 		cout<<"Error in image dimensions--function Image<T>::Add()!"<<endl;
 964 | 		return;
 965 | 	}
 966 | 	if(matchDimension(image1)==false)
 967 | 		allocate(image1);
 968 | 
 969 | 	const T1*& pData1=image1.data();
 970 | 	const T2*& pData2=image2.data();
 971 | 	for(int i=0;i<nElements;i++)
 972 | 		pData[i]=pData1[i]+pData2[i];	
 973 | }
 974 | 
 975 | template <class T>
 976 | template <class T1,class T2>
 977 | void Image<T>::Add(const Image<T1>& image1,const Image<T2>& image2,double ratio)
 978 | {
 979 | 	if(image1.matchDimension(image2)==false)
 980 | 	{
 981 | 		cout<<"Error in image dimensions--function Image<T>::Add()!"<<endl;
 982 | 		return;
 983 | 	}
 984 | 	if(matchDimension(image1)==false)
 985 | 		allocate(image1);
 986 | 
 987 | 	const T1*& pData1=image1.data();
 988 | 	const T2*& pData2=image2.data();
 989 | 	for(int i=0;i<nElements;i++)
 990 | 		pData[i]=pData1[i]+pData2[i]*ratio;	
 991 | }
 992 | 
 993 | template <class T>
 994 | template <class T1>
 995 | void Image<T>::Add(const Image<T1>& image1,const double ratio)
 996 | {
 997 | 	if(matchDimension(image1)==false)
 998 | 	{
 999 | 		cout<<"Error in image dimensions--function Image<T>::Add()!"<<endl;
1000 | 		return;
1001 | 	}
1002 | 	const T1*& pData1=image1.data();
1003 | 	for(int i=0;i<nElements;i++)
1004 | 		pData[i]+=pData1[i]*ratio;	
1005 | }
1006 | 
1007 | template <class T>
1008 | void Image<T>::Add(const T value)
1009 | {
1010 | 	for(int i=0;i<nElements;i++)
1011 | 		pData[i]+=value;
1012 | }
1013 | 
1014 | //------------------------------------------------------------------------------------------
1015 | // function to subtract image2 from image1
1016 | //------------------------------------------------------------------------------------------
1017 | template <class T>
1018 | template <class T1,class T2>
1019 | void Image<T>::Subtract(const Image<T1> &image1, const Image<T2> &image2)
1020 | {
1021 | 	if(image1.matchDimension(image2)==false)
1022 | 	{
1023 | 		cout<<"Error in image dimensions--function Image<T>::Add()!"<<endl;
1024 | 		return;
1025 | 	}
1026 | 	if(matchDimension(image1)==false)
1027 | 		allocate(image1);
1028 | 
1029 | 	const T1*& pData1=image1.data();
1030 | 	const T2*& pData2=image2.data();
1031 | 	for(int i=0;i<nElements;i++)
1032 | 		pData[i]=pData1[i]-pData2[i];
1033 | }
1034 | 
1035 | //------------------------------------------------------------------------------------------
1036 | // normalize an image
1037 | //------------------------------------------------------------------------------------------
1038 | template <class T>
1039 | void Image<T>::normalize(Image<T>& image)
1040 | {
1041 | 	if(image.width()!=imWidth || image.height()!=imHeight || image.nchannels()!=nChannels)
1042 | 		image.allocate(imWidth,imHeight,nChannels);
1043 | 	T Max,Min;
1044 | 	Max=Min=pData[0];
1045 | 	for(int i=0;i<nElements;i++)
1046 | 	{
1047 | 		Max=qMax(Max,pData[i]);
1048 | 		Min=qMin(Min,pData[i]);
1049 | 	}
1050 | 	if(Max==Min)
1051 | 		return;
1052 | 	double ratio=1/(Max-Min);
1053 | 	if(IsFloat()==false)
1054 | 		ratio*=255;
1055 | 	T* data=image.data();
1056 | 	for(int i=0;i<nElements;i++)
1057 | 		data[i]=(double)(pData[i]-Min)*ratio;
1058 | }
1059 | 
1060 | template <class T>
1061 | double Image<T>::norm2() const
1062 | {
1063 | 	double result=0;
1064 | 	for(int i=0;i<nElements;i++)
1065 | 		result+=pData[i]*pData[i];
1066 | 	return result;
1067 | }
1068 | 
1069 | template <class T>
1070 | template <class T1>
1071 | double Image<T>::innerproduct(Image<T1> &image) const
1072 | {
1073 | 	double result=0;
1074 | 	const T1* pData1=image.data();
1075 | 	for(int i=0;i<nElements;i++)
1076 | 		result+=pData[i]*pData1[i];
1077 | 	return result;
1078 | }
1079 | 
1080 | #ifdef _MATLAB
1081 | 
1082 | template <class T>
1083 | template <class T1>
1084 | void Image<T>::LoadMatlabImage(const mxArray *image)
1085 | {
1086 | 	int nDim = mxGetNumberOfDimensions(image);
1087 | 	const int* imDim = mxGetDimensions(image);
1088 | 	if(nDim==2)
1089 | 		allocate(imDim[1],imDim[0]);
1090 | 	else if(nDim==3)
1091 | 		allocate(imDim[1],imDim[0],imDim[2]);
1092 | 	else
1093 | 		mexErrMsgTxt("The image doesn't have the appropriate dimension!");
1094 | 	T1* pMatlabPlane=(T1*)mxGetData(image);
1095 | 	bool IsMatlabFloat;
1096 | 	if(typeid(T1)==typeid(float) || typeid(T1)==typeid(double) || typeid(T1)==typeid(long double))
1097 | 		IsMatlabFloat=true;
1098 | 	else
1099 | 		IsMatlabFloat=false;
1100 | 	bool isfloat=IsFloat();
1101 | 	if(isfloat==IsMatlabFloat)
1102 | 	{
1103 | 		ConvertFromMatlab<T1>(pMatlabPlane,imWidth,imHeight,nChannels);
1104 | 		return;
1105 | 	}
1106 | 	int offset=0;
1107 | 	if(isfloat==true)
1108 | 		for(int i=0;i<imHeight;i++)
1109 | 			for(int j=0;j<imWidth;j++)
1110 | 				for(int k=0;k<nChannels;k++)
1111 | 					pData[offset++]=(double)pMatlabPlane[k*nPixels+j*imHeight+i]/255;
1112 | 	else
1113 | 		for(int i=0;i<imHeight;i++)
1114 | 			for(int j=0;j<imWidth;j++)
1115 | 				for(int k=0;k<nChannels;k++)
1116 | 					pData[offset++]=(double)pMatlabPlane[k*nPixels+j*imHeight+i]*255;
1117 | }
1118 | 
1119 | template <class T>
1120 | template <class T1>
1121 | void Image<T>::ConvertFromMatlab(const T1 *pMatlabPlane, int _width, int _height, int _nchannels)
1122 | {
1123 | 	if(imWidth!=_width || imHeight!=_height || nChannels!=_nchannels)
1124 | 		allocate(_width,_height,_nchannels);
1125 | 	int offset=0;
1126 | 	for(int i=0;i<imHeight;i++)
1127 | 		for(int j=0;j<imWidth;j++)
1128 | 			for(int k=0;k<nChannels;k++)
1129 | 				pData[offset++]=pMatlabPlane[k*nPixels+j*imHeight+i];
1130 | }
1131 | 
1132 | // convert image data to matlab matrix
1133 | template <class T>
1134 | template <class T1>
1135 | void Image<T>::ConvertToMatlab(T1 *pMatlabPlane)
1136 | {
1137 | 	int offset=0;
1138 | 	for(int i=0;i<imHeight;i++)
1139 | 		for(int j=0;j<imWidth;j++)
1140 | 			for(int k=0;k<nChannels;k++)
1141 | 				pMatlabPlane[k*nPixels+j*imHeight+i]=pData[offset++];
1142 | }
1143 | 
1144 | template <class T>
1145 | void Image<T>::OutputToMatlab(mxArray *&matrix)
1146 | {
1147 | 	int dims[3];
1148 | 	dims[0]=imHeight;
1149 | 	dims[1]=imWidth;
1150 | 	dims[2]=nChannels;
1151 | 	if(nChannels==1)
1152 | 		matrix=mxCreateNumericArray(2, dims,mxDOUBLE_CLASS, mxREAL);
1153 | 	else
1154 | 		matrix=mxCreateNumericArray(3, dims,mxDOUBLE_CLASS, mxREAL);
1155 | 	ConvertToMatlab<double>((double*)mxGetData(matrix));
1156 | }
1157 | 
1158 | #endif
1159 | 
1160 | 
1161 | #endif
1162 | 


--------------------------------------------------------------------------------
/ImageIO.h:
--------------------------------------------------------------------------------
  1 | #ifndef _ImageIO_h
  2 | #define _ImageIO_h
  3 | 
  4 | #include <QVector>
  5 | #include <QImage>
  6 | #include <QString>
  7 | #include "math.h"
  8 | //-----------------------------------------------------------------------------------------
  9 | // this class is a wrapper to use QImage to load image into image planes
 10 | //-----------------------------------------------------------------------------------------
 11 | 
 12 | class ImageIO
 13 | {
 14 | public:
 15 | 	enum ImageType{standard, derivative, normalized};
 16 | 	ImageIO(void);
 17 | 	~ImageIO(void);
 18 | public:
 19 | 	template <class T>
 20 | 	static void loadImage(const QImage& image,T*& pImagePlane,int& width,int& height,int& nchannels);
 21 | 	template <class T>
 22 | 	static bool loadImage(const QString& filename,T*& pImagePlane,int& width,int& height,int& nchannels);
 23 | 
 24 | 	template <class T>
 25 | 	static unsigned char convertPixel(const T& value,bool IsFloat,ImageType type,T& _Max,T& _Min);
 26 | 
 27 | 	template <class T>
 28 | 	static bool writeImage(const QString& filename, const T*& pImagePlane,int width,int height,int nchannels,ImageType type=standard,int quality=-1);
 29 | };
 30 | 
 31 | template <class T>
 32 | void ImageIO::loadImage(const QImage& image, T*& pImagePlane,int& width,int& height,int& nchannels)
 33 | {
 34 | 	// get the image information
 35 | 	width=image.width();
 36 | 	height=image.height();
 37 | 	nchannels=3;
 38 | 	pImagePlane=new T[width*height*nchannels];
 39 | 
 40 | 	// check whether the type is float point
 41 | 	bool IsFloat=false;
 42 | 	if(typeid(T)==typeid(double) || typeid(T)==typeid(float) || typeid(T)==typeid(long double))
 43 | 		IsFloat=true;
 44 | 
 45 | 	const unsigned char* plinebuffer;
 46 | 	for(int i=0;i<height;i++)
 47 | 	{
 48 | 		plinebuffer=image.scanLine(i);
 49 | 		for(int j=0;j<width;j++)
 50 | 		{
 51 | 			if(IsFloat)
 52 | 			{
 53 | 				pImagePlane[(i*width+j)*3]=(T)plinebuffer[j*4]/255;
 54 | 				pImagePlane[(i*width+j)*3+1]=(T)plinebuffer[j*4+1]/255;
 55 | 				pImagePlane[(i*width+j)*3+2]=(T)plinebuffer[j*4+2]/255;
 56 | 			}
 57 | 			else
 58 | 			{
 59 | 				pImagePlane[(i*width+j)*3]=plinebuffer[j*4];
 60 | 				pImagePlane[(i*width+j)*3+1]=plinebuffer[j*4+1];
 61 | 				pImagePlane[(i*width+j)*3+2]=plinebuffer[j*4+2];
 62 | 			}
 63 | 		}
 64 | 	}
 65 | }
 66 | 
 67 | template <class T>
 68 | bool ImageIO::loadImage(const QString&filename, T*& pImagePlane,int& width,int& height,int& nchannels)
 69 | {
 70 | 	QImage image;
 71 | 	if(image.load(filename)==false)
 72 | 		return false;
 73 | 	if(image.format()!=QImage::Format_RGB32)
 74 | 	{
 75 | 		QImage temp=image.convertToFormat(QImage::Format_RGB32);
 76 | 		image=temp;
 77 | 	}
 78 | 	loadImage(image,pImagePlane,width,height,nchannels);
 79 | 	return true;
 80 | }
 81 | 
 82 | template <class T>
 83 | bool ImageIO::writeImage(const QString& filename, const T*& pImagePlane,int width,int height,int nchannels,ImageType type,int quality)
 84 | {
 85 | 	int nPixels=width*height,nElements;
 86 | 	nElements=nPixels*nchannels;
 87 | 	unsigned char* pTempBuffer;
 88 | 	pTempBuffer=new unsigned char[nPixels*4];
 89 | 	memset(pTempBuffer,0,nPixels*4);
 90 | 
 91 | 	// check whether the type is float point
 92 | 	bool IsFloat=false;
 93 | 	if(typeid(T)==typeid(double) || typeid(T)==typeid(float) || typeid(T)==typeid(long double))
 94 | 		IsFloat=true;
 95 | 
 96 | 	T _Max=0,_Min=0;
 97 | 	switch(type){
 98 | 		case standard:
 99 | 			break;
100 | 		case derivative:
101 | 			_Max=0;
102 | 			for(int i=0;i<nPixels;i++)
103 | 			{
104 | 				if(IsFloat)
105 | 					_Max=__max(_Max,fabs((double)pImagePlane[i]));
106 | 				else
107 | 					_Max=__max(_Max,abs(pImagePlane[i]));
108 | 			}
109 | 			break;
110 | 		case normalized:
111 | 			_Min=_Max=pImagePlane[0];
112 | 			for(int i=1;i<nElements;i++)
113 | 			{
114 | 				_Min=__min(_Min,pImagePlane[i]);
115 | 				_Max=__max(_Max,pImagePlane[i]);
116 | 			}
117 | 			break;
118 | 	}
119 | 
120 | 	for(int i=0;i<nPixels;i++)
121 | 	{
122 | 		if(nchannels>=3)
123 | 		{
124 | 			pTempBuffer[i*4]=convertPixel(pImagePlane[i*nchannels],IsFloat,type,_Max,_Min);
125 | 			pTempBuffer[i*4+1]=convertPixel(pImagePlane[i*nchannels+1],IsFloat,type,_Max,_Min);
126 | 			pTempBuffer[i*4+2]=convertPixel(pImagePlane[i*nchannels+2],IsFloat,type,_Max,_Min);
127 | 		}
128 | 		else 
129 | 			for (int j=0;j<3;j++)
130 | 				pTempBuffer[i*4+j]=convertPixel(pImagePlane[i*nchannels],IsFloat,type,_Max,_Min);
131 | 		pTempBuffer[i*4+3]=255;
132 | 	}
133 | 	QImage *pQImage=new QImage(pTempBuffer,width,height,QImage::Format_RGB32);
134 | 	bool result= pQImage->save(filename,0,quality);
135 | 	delete pQImage;
136 | 	delete pTempBuffer;
137 | 	return result;
138 | }
139 | 
140 | template <class T>
141 | unsigned char ImageIO::convertPixel(const T& value,bool IsFloat,ImageType type,T& _Max,T& _Min)
142 | {
143 | 	switch(type){
144 | 		case standard:
145 | 			if(IsFloat)
146 | 				return __max(__min(value*255,255),0);
147 | 			else
148 | 				return __max(__min(value,255),0);
149 | 			break;
150 | 		case derivative:
151 | 			return (double)((double)value/_Max+1)/2*255;
152 | 			break;
153 | 		case normalized:
154 | 			return (double)(value-_Min)/(_Max-_Min)*255;
155 | 			break;
156 | 	}
157 | 	return 0;
158 | }
159 | 
160 | #endif


--------------------------------------------------------------------------------
/ImageProcessing.h:
--------------------------------------------------------------------------------
  1 | #ifndef _ImageProcessing_h
  2 | #define _ImageProcessing_h
  3 | 
  4 | #include "math.h"
  5 | #include "stdio.h"
  6 | #include "stdlib.h"
  7 | #include <typeinfo>
  8 | //----------------------------------------------------------------------------------
  9 | // class to handle basic image processing functions
 10 | // this is a collection of template functions. These template functions are
 11 | // used in other image classes such as BiImage, IntImage and FImage 
 12 | //----------------------------------------------------------------------------------
 13 | 
 14 | class ImageProcessing
 15 | {
 16 | public:
 17 | 	ImageProcessing(void);
 18 | 	~ImageProcessing(void);
 19 | public:
 20 | 	// basic functions
 21 | 	template <class T>
 22 | 	static inline T EnforceRange(const T& x,const int& MaxValue) {return __min(__max(x,0),MaxValue-1);};
 23 | 
 24 | 	//---------------------------------------------------------------------------------
 25 | 	// function to interpolate the image plane
 26 | 	//---------------------------------------------------------------------------------
 27 | 	template <class T1,class T2> 
 28 | 	static inline void BilinearInterpolate(const T1* pImage,int width,int height,int nChannels,double x,double y,T2* result);
 29 | 
 30 | 	template <class T1,class T2>
 31 | 	static void ResizeImage(const T1* pSrcImage,T2* pDstImage,int SrcWidth,int SrcHeight,int nChannels,double Ratio);
 32 | 
 33 | 	template <class T1,class T2>
 34 | 	static void ResizeImage(const T1* pSrcImage,T2* pDstImage,int SrcWidth,int SrcHeight,int nChannels,int DstWidth,int DstHeight);
 35 | 
 36 | 	//---------------------------------------------------------------------------------
 37 | 	// functions for 1D filtering
 38 | 	//---------------------------------------------------------------------------------
 39 | 	template <class T1,class T2>
 40 | 	static void hfiltering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,double* pfilter1D,int fsize);
 41 | 
 42 | 	template <class T1,class T2>
 43 | 	static void vfiltering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,double* pfilter1D,int fsize);
 44 | 
 45 | 	//---------------------------------------------------------------------------------
 46 | 	// functions for 2D filtering
 47 | 	//---------------------------------------------------------------------------------
 48 | 	template <class T1,class T2>
 49 | 	static void filtering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,double* pfilter2D,int fsize);
 50 | 
 51 | 	//---------------------------------------------------------------------------------
 52 | 	// functions for sample a patch from the image
 53 | 	//---------------------------------------------------------------------------------
 54 | 	template <class T1,class T2>
 55 | 	static void getPatch(const T1* pSrcImgae,T2* pPatch,int width,int height,int nChannels,double x,double y,int wsize);
 56 | 
 57 | 	//---------------------------------------------------------------------------------
 58 | 	// function to warp image
 59 | 	//---------------------------------------------------------------------------------
 60 | 	template <class T1,class T2>
 61 | 	static void warpImage(T1* pWarpIm2,const T1* pIm1,const T1* pIm2,const T2* pVx,const T2* pVy,int width,int height,int nChannels);
 62 | 
 63 | 	//---------------------------------------------------------------------------------
 64 | 	// function to crop an image
 65 | 	//---------------------------------------------------------------------------------
 66 | 	template <class T1,class T2>
 67 | 	static void cropImage(const T1* pSrcImage,int SrcWidth,int SrcHeight,int nChannels,T2* pDstImage,int Left,int Top,int DstWidth,int DstHeight);
 68 | 	//---------------------------------------------------------------------------------
 69 | 
 70 | 	//---------------------------------------------------------------------------------
 71 | 	// function to generate a 2D Gaussian 
 72 | 	//---------------------------------------------------------------------------------
 73 | 	template <class T>
 74 | 	static void generate2DGaussian(T*& pImage,int wsize,double sigma=-1);
 75 | };
 76 | 
 77 | //--------------------------------------------------------------------------------------------------
  78 | // function to interpolate a multi-channel image plane at (x,y)
 79 | // --------------------------------------------------------------------------------------------------
 80 | template <class T1,class T2>
 81 | inline void ImageProcessing::BilinearInterpolate(const T1* pImage,int width,int height,int nChannels,double x,double y,T2* result)
 82 | {
 83 | 	int xx,yy,m,n,u,v,l,offset;
 84 | 	xx=x;
 85 | 	yy=y;
 86 | 	double dx,dy,s;
 87 | 	dx=__max(__min(x-xx,1),0);
 88 | 	dy=__max(__min(y-yy,1),0);
 89 | 
 90 | 	memset(result,0,sizeof(T2)*nChannels);
 91 | 
 92 | 	for(m=0;m<=1;m++)
 93 | 		for(n=0;n<=1;n++)
 94 | 		{
 95 | 			u=EnforceRange(xx+m,width);
 96 | 			v=EnforceRange(yy+n,height);
 97 | 			offset=(v*width+u)*nChannels;
 98 | 			s=fabs(1-m-dx)*fabs(1-n-dy);
 99 | 			for(l=0;l<nChannels;l++)
100 | 				result[l]+=pImage[offset+l]*s;
101 | 		}
102 | }
103 | 
104 | //------------------------------------------------------------------------------------------------------------
 105 | // this is the most general function for resizing an image with an arbitrary number of channels
106 | // bilinear interpolation is used for now. It might be replaced by other (bicubic) interpolation methods 
107 | //------------------------------------------------------------------------------------------------------------
108 | template <class T1,class T2>
109 | void ImageProcessing::ResizeImage(const T1* pSrcImage,T2* pDstImage,int SrcWidth,int SrcHeight,int nChannels,double Ratio)
110 | {
111 | 	int DstWidth,DstHeight;
112 | 	DstWidth=(double)SrcWidth*Ratio;
113 | 	DstHeight=(double)SrcHeight*Ratio;
114 | 	memset(pDstImage,sizeof(T2)*DstWidth*DstHeight*nChannels,0);
115 | 	
116 | 	double x,y;
117 | 
118 | 	for(int i=0;i<DstHeight;i++)
119 | 		for(int j=0;j<DstWidth;j++)
120 | 		{
121 | 			x=(double)(j+1)/Ratio-1;
122 | 			y=(double)(i+1)/Ratio-1;
123 | 
124 | 			// bilinear interpolation
125 | 			BilinearInterpolate(pSrcImage,SrcWidth,SrcHeight,nChannels,x,y,pDstImage+(i*DstWidth+j)*nChannels);
126 | 		}
127 | }
128 | 
129 | template <class T1,class T2>
130 | void ImageProcessing::ResizeImage(const T1 *pSrcImage, T2 *pDstImage, int SrcWidth, int SrcHeight, int nChannels, int DstWidth, int DstHeight)
131 | {
132 | 	double xRatio=(double)DstWidth/SrcWidth;
133 | 	double yRatio=(double)DstHeight/SrcHeight;
134 | 	memset(pDstImage,sizeof(T2)*DstWidth*DstHeight*nChannels,0);
135 | 
136 | 	double x,y;
137 | 
138 | 	for(int i=0;i<DstHeight;i++)
139 | 		for(int j=0;j<DstWidth;j++)
140 | 		{
141 | 			x=(double)(j+1)/xRatio-1;
142 | 			y=(double)(i+1)/yRatio-1;
143 | 
144 | 			// bilinear interpolation
145 | 			BilinearInterpolate(pSrcImage,SrcWidth,SrcHeight,nChannels,x,y,pDstImage+(i*DstWidth+j)*nChannels);
146 | 		}
147 | }
148 | 
149 | //------------------------------------------------------------------------------------------------------------
150 | //  horizontal direction filtering
151 | //------------------------------------------------------------------------------------------------------------
152 | template <class T1,class T2>
153 | void ImageProcessing::hfiltering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,double* pfilter1D,int fsize)
154 | {
155 | 	memset(pDstImage,0,sizeof(T2)*width*height*nChannels);
156 | 	T2* pBuffer;
157 | 	double w;
158 | 	int i,j,l,k,offset,jj;
159 | 	for(i=0;i<height;i++)
160 | 		for(j=0;j<width;j++)
161 | 		{
162 | 			offset=i*width*nChannels;
163 | 			pBuffer=pDstImage+offset+j*nChannels;
164 | 			for(l=-fsize;l<=fsize;l++)
165 | 			{
166 | 				w=pfilter1D[l+fsize];
167 | 				jj=EnforceRange(j+l,width);
168 | 				for(k=0;k<nChannels;k++)
169 | 					pBuffer[k]+=pSrcImage[offset+jj*nChannels+k]*w;
170 | 			}
171 | 		}
172 | }
173 | 
174 | //------------------------------------------------------------------------------------------------------------
175 | // vertical direction filtering
176 | //------------------------------------------------------------------------------------------------------------
177 | template <class T1,class T2>
178 | void ImageProcessing::vfiltering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,double* pfilter1D,int fsize)
179 | {
180 | 	memset(pDstImage,0,sizeof(T2)*width*height*nChannels);
181 | 	T2* pBuffer;
182 | 	double w;
183 | 	int i,j,l,k,offset,ii;
184 | 	for(i=0;i<height;i++)
185 | 		for(j=0;j<width;j++)
186 | 		{
187 | 			pBuffer=pDstImage+(i*width+j)*nChannels;
188 | 			for(l=-fsize;l<=fsize;l++)
189 | 			{
190 | 				w=pfilter1D[l+fsize];
191 | 				ii=EnforceRange(i+l,height);
192 | 				for(k=0;k<nChannels;k++)
193 | 					pBuffer[k]+=pSrcImage[(ii*width+j)*nChannels+k]*w;
194 | 			}
195 | 		}
196 | }
197 | 
198 | //------------------------------------------------------------------------------------------------------------
199 | // 2d filtering
200 | //------------------------------------------------------------------------------------------------------------
201 | template <class T1,class T2>
202 | void ImageProcessing::filtering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,double* pfilter2D,int fsize)
203 | {
204 | 	double w;
205 | 	int i,j,u,v,k,ii,jj,wsize,offset;
206 | 	wsize=fsize*2+1;
207 | 	double* pBuffer=new double[nChannels];
208 | 	for(i=0;i<height;i++)
209 | 		for(j=0;j<width;j++)
210 | 		{
211 | 			for(k=0;k<nChannels;k++)
212 | 				pBuffer[k]=0;
213 | 			for(u=-fsize;u<=fsize;u++)
214 | 				for(v=-fsize;v<=fsize;v++)
215 | 				{
216 | 					w=pfilter2D[(u+fsize)*wsize+v+fsize];
217 | 					ii=EnforceRange(i+u,height);
218 | 					jj=EnforceRange(j+v,width);
219 | 					offset=(ii*width+jj)*nChannels;
220 | 					for(k=0;k<nChannels;k++)
221 | 						pBuffer[k]+=pSrcImage[offset+k]*w;
222 | 				}
223 | 			offset=(i*width+j)*nChannels;
224 | 			for(k=0;k<nChannels;k++)
225 | 				pDstImage[offset+k]=pBuffer[k];
226 | 		}
227 | 	delete pBuffer;
228 | }
229 | 
230 | //------------------------------------------------------------------------------------------------------------
231 | // function to sample a patch from the source image
232 | //------------------------------------------------------------------------------------------------------------
233 | template <class T1,class T2>
234 | void ImageProcessing::getPatch(const T1* pSrcImage,T2* pPatch,int width,int height,int nChannels,double x0,double y0,int wsize)
235 | {
236 | 	// suppose pPatch has been allocated and cleared before calling the function
237 | 	int wlength=wsize*2+1;
238 | 	double x,y;
239 | 	for(int i=-wsize;i<=wsize;i++)
240 | 		for(int j=-wsize;j<=wsize;j++)
241 | 		{
242 | 			y=y0+i;
243 | 			x=x0+j;
244 | 			if(x<0 || x>width-1 || y<0 || y>height-1)
245 | 				continue;
246 | 			BilinearInterpolate(pSrcImage,width,height,nChannels,x,y,pPatch+((i+wsize)*wlength+j+wsize)*nChannels);
247 | 		}
248 | }
249 | 
250 | //------------------------------------------------------------------------------------------------------------
251 | // function to warp an image with respect to flow field
 252 | // pWarpIm2 has to be allocated beforehand
253 | //------------------------------------------------------------------------------------------------------------
254 | template <class T1,class T2>
255 | void ImageProcessing::warpImage(T1 *pWarpIm2, const T1 *pIm1, const T1 *pIm2, const T2 *pVx, const T2 *pVy, int width, int height, int nChannels)
256 | {
257 | 	for(int i=0;i<height;i++)
258 | 		for(int j=0;j<width;j++)
259 | 		{
260 | 			int offset=i*width+j;
261 | 			double x,y;
262 | 			y=i+pVy[offset];
263 | 			x=j+pVx[offset];
264 | 			offset*=nChannels;
265 | 			if(x<0 || x>width-1 || y<0 || y>height-1)
266 | 			{
267 | 				for(int k=0;k<nChannels;k++)
268 | 					pWarpIm2[offset+k]=pIm1[offset+k];
269 | 				continue;
270 | 			}
271 | 			BilinearInterpolate(pIm2,width,height,nChannels,x,y,pWarpIm2+offset);
272 | 		}
273 | }
274 | 
275 | //------------------------------------------------------------------------------------------------------------
276 | // function to crop an image from the source
277 | // assume that pDstImage has been allocated
278 | // also Left and Top must be valid, DstWidth and DstHeight should ensure that the image lies
279 | // inside the image boundary
280 | //------------------------------------------------------------------------------------------------------------
281 | template <class T1,class T2>
282 | void ImageProcessing::cropImage(const T1 *pSrcImage, int SrcWidth, int SrcHeight, int nChannels, T2 *pDstImage, int Left, int Top, int DstWidth, int DstHeight)
283 | {
284 | 	if(typeid(T1)==typeid(T2))
285 | 	{
286 | 		for(int i=0;i<DstHeight;i++)
287 | 			memcpy(pDstImage+i*DstWidth*nChannels,pSrcImage+((i+Top)*SrcWidth+Left)*nChannels,sizeof(T1)*DstWidth*nChannels);
288 | 		return;
289 | 	}
290 | 	int offsetSrc,offsetDst;
291 | 	for(int i=0;i<DstHeight;i++)
292 | 		for(int j=0;j<DstWidth;j++)
293 | 		{
294 | 			offsetSrc=((i+Top)*SrcWidth+Left+j)*nChannels;
295 | 			offsetDst=(i*DstWidth+j)*nChannels;
296 | 			for(int k=0;k<nChannels;k++)
297 | 				pDstImage[offsetDst+k]=pSrcImage[offsetSrc+k];
298 | 		}
299 | }
300 | 
301 | //------------------------------------------------------------------------------------------------------------
302 | // function to generate a 2D Gaussian image
303 | // pImage must be allocated before calling the function
304 | //------------------------------------------------------------------------------------------------------------
305 | template <class T>
306 | void ImageProcessing::generate2DGaussian(T*& pImage, int wsize, double sigma)
307 | {
308 | 	if(sigma==-1)
309 | 		sigma=wsize;
310 | 	double alpha=1/(2*sigma*sigma);
311 | 	int winlength=wsize*2+1;
312 | 	if(pImage==NULL)
313 | 		pImage=new T[winlength*winlength];
314 | 	for(int i=-wsize;i<=wsize;i++)
315 | 		for(int j=-wsize;j<=wsize;j++)
316 | 			pImage[(i+wsize)*winlength+j+wsize]=exp(-(double)(i*i+j*j)*alpha);
317 | }
318 | #endif


--------------------------------------------------------------------------------
/OpticalFlow.h:
--------------------------------------------------------------------------------
 1 | #ifndef _OpticalFlow_h
 2 | #define _OpticalFlow_h
 3 | 
 4 | #include "Image.h"
 5 | 
 6 | class OpticalFlow
 7 | {
 8 | private:
 9 | 	static bool IsDisplay;
10 | public:
11 | 	OpticalFlow(void);
12 | 	~OpticalFlow(void);
13 | public:
14 | 	static void getDxs(DImage& imdx,DImage& imdy,DImage& imdt,const DImage& im1,const DImage& im2);
15 | 	static void SanityCheck(const DImage& imdx,const DImage& imdy,const DImage& imdt,double du,double dv);
16 | 	static void warpFL(DImage& warpIm2,const DImage& Im1,const DImage& Im2,const DImage& vx,const DImage& vy);
17 | 	static void genConstFlow(DImage& flow,double value,int width,int height);
18 | 	static void genInImageMask(DImage& mask,const DImage& vx,const DImage& vy);
19 | 	static void SmoothFlowPDE(const DImage& Im1,const DImage& Im2, DImage& warpIm2,DImage& vx,DImage& vy,
20 | 														 double alpha,int nOuterFPIterations,int nInnerFPIterations,int nCGIterations);
21 | 	static void Laplacian(DImage& output,const DImage& input,const DImage& weight);
22 | 	static void testLaplacian(int dim=3);
23 | 
24 | 	// function of coarse to fine optical flow
25 | 	static void Coarse2FineFlow(DImage& vx,DImage& vy,DImage &warpI2,const DImage& Im1,const DImage& Im2,double alpha,double ratio,int minWidth,
26 | 															int nOuterFPIterations,int nInnerFPIterations,int nCGIterations);
27 | 	// function to convert image to features
28 | 	static void im2feature(DImage& imfeature,const DImage& im);
29 | };
30 | 
31 | #endif


--------------------------------------------------------------------------------
/OpticalFlowCode.cpp:
--------------------------------------------------------------------------------
  1 | #include "OpticalFlow.h"
  2 | #include "ImageProcessing.h"
  3 | #include "GaussianPyramid.h"
  4 | #include <cstdlib> 
  5 | #include <iostream>
  6 | 
  7 | using namespace std;
  8 | 
  9 | bool OpticalFlow::IsDisplay=false;
 10 | 
 11 | OpticalFlow::OpticalFlow(void)
 12 | {
 13 | }
 14 | 
 15 | OpticalFlow::~OpticalFlow(void)
 16 | {
 17 | }
 18 | 
 19 | //--------------------------------------------------------------------------------------------------------
 20 | //  function to compute dx, dy and dt for motion estimation
 21 | //--------------------------------------------------------------------------------------------------------
 22 | void OpticalFlow::getDxs(DImage &imdx, DImage &imdy, DImage &imdt, const DImage &im1, const DImage &im2)
 23 | {
 24 | 	// Im1 and Im2 are the smoothed version of im1 and im2
 25 | 	DImage Im1,Im2;
 26 | 	double gfilter[5]={0.05,0.2,0.5,0.2,0.05};
 27 | 	im1.imfilter_hv(Im1,gfilter,2,gfilter,2);
 28 | 	im2.imfilter_hv(Im2,gfilter,2,gfilter,2);
 29 | 
 30 |     //Im1.copyData(im1);
 31 |     //Im2.copyData(im2);
 32 |     
 33 | 	Im2.dx(imdx,true);
 34 | 	Im2.dy(imdy,true);
 35 | 	imdt.Subtract(Im2,Im1);
 36 | 	imdx.setDerivative();
 37 | 	imdy.setDerivative();
 38 | 	imdt.setDerivative();
 39 | }
 40 | 
 41 | //--------------------------------------------------------------------------------------------------------
 42 | // function to do sanity check: imdx*du+imdy*dy+imdt=0
 43 | //--------------------------------------------------------------------------------------------------------
 44 | void OpticalFlow::SanityCheck(const DImage &imdx, const DImage &imdy, const DImage &imdt, double du, double dv)
 45 | {
 46 | 	if(imdx.matchDimension(imdy)==false || imdx.matchDimension(imdt)==false)
 47 | 	{
 48 | 		cout<<"The dimensions of the derivatives don't match!"<<endl;
 49 | 		return;
 50 | 	}
 51 | 	const double* pImDx,*pImDy,*pImDt;
 52 | 	pImDx=imdx.data();
 53 | 	pImDy=imdy.data();
 54 | 	pImDt=imdt.data();
 55 | 	double error=0;
 56 | 	for(int i=0;i<imdx.height();i++)
 57 | 		for(int j=0;j<imdx.width();j++)
 58 | 			for(int k=0;k<imdx.nchannels();k++)
 59 | 			{
 60 | 				int offset=(i*imdx.width()+j)*imdx.nchannels()+k;
 61 | 				double temp=pImDx[offset]*du+pImDy[offset]*dv+pImDt[offset];
 62 | 				error+=fabs(temp);
 63 | 			}
 64 | 	error/=imdx.nelements();
 65 | 	cout<<"The mean error of |dx*u+dy*v+dt| is "<<error<<endl;
 66 | }
 67 | 
 68 | //--------------------------------------------------------------------------------------------------------
 69 | // function to warp image based on the flow field
 70 | //--------------------------------------------------------------------------------------------------------
 71 | void OpticalFlow::warpFL(DImage &warpIm2, const DImage &Im1, const DImage &Im2, const DImage &vx, const DImage &vy)
 72 | {
 73 | 	if(warpIm2.matchDimension(Im2)==false)
 74 | 		warpIm2.allocate(Im2.width(),Im2.height(),Im2.nchannels());
 75 | 	ImageProcessing::warpImage(warpIm2.data(),Im1.data(),Im2.data(),vx.data(),vy.data(),Im2.width(),Im2.height(),Im2.nchannels());
 76 | }
 77 | 
 78 | //--------------------------------------------------------------------------------------------------------
 79 | // function to generate mask of the pixels that move inside the image boundary
 80 | //--------------------------------------------------------------------------------------------------------
 81 | void OpticalFlow::genInImageMask(DImage &mask, const DImage &vx, const DImage &vy)
 82 | {
 83 | 	int imWidth,imHeight;
 84 | 	imWidth=vx.width();
 85 | 	imHeight=vx.height();
 86 | 	if(mask.matchDimension(vx)==false)
 87 | 		mask.allocate(imWidth,imHeight);
 88 | 	const double *pVx,*pVy;
 89 | 	double *pMask;
 90 | 	pVx=vx.data();
 91 | 	pVy=vy.data();
 92 | 	mask.reset();
 93 | 	pMask=mask.data();
 94 | 	double x,y;
 95 | 	for(int i=0;i<imHeight;i++)
 96 | 		for(int j=0;j<imWidth;j++)
 97 | 		{
 98 | 			int offset=i*imWidth+j;
 99 | 			y=i+pVx[offset];
100 | 			x=j+pVy[offset];
101 | 			if(x<0  || x>imWidth-1 || y<0 || y>imHeight-1)
102 | 				continue;
103 | 			pMask[offset]=1;
104 | 		}
105 | }
106 | 
107 | //--------------------------------------------------------------------------------------------------------
108 | // function to compute optical flow field using two fixed point iterations
109 | // Input arguments:
110 | //     Im1, Im2:						frame 1 and frame 2
111 | //	warpIm2:						the warped frame 2 according to the current flow field u and v
112 | //	u,v:									the current flow field, NOTICE that they are also output arguments
113 | //	
114 | //--------------------------------------------------------------------------------------------------------
115 | void OpticalFlow::SmoothFlowPDE(const DImage &Im1, const DImage &Im2, DImage &warpIm2, DImage &u, DImage &v, 
116 | 																    double alpha, int nOuterFPIterations, int nInnerFPIterations, int nCGIterations)
117 | {
118 | 	DImage mask,imdx,imdy,imdt;
119 | 	int imWidth,imHeight,nChannels,nPixels;
120 | 	imWidth=Im1.width();
121 | 	imHeight=Im1.height();
122 | 	nChannels=Im1.nchannels();
123 | 	nPixels=imWidth*imHeight;
124 | 
125 | 	DImage du(imWidth,imHeight),dv(imWidth,imHeight);
126 | 	DImage uu(imWidth,imHeight),vv(imWidth,imHeight);
127 | 	DImage ux(imWidth,imHeight),uy(imWidth,imHeight);
128 | 	DImage vx(imWidth,imHeight),vy(imWidth,imHeight);
129 | 	DImage Phi_1st(imWidth,imHeight);
130 | 	DImage Psi_1st(imWidth,imHeight,nChannels);
131 | 
132 | 	DImage imdxy,imdx2,imdy2,imdtdx,imdtdy;
133 | 	DImage ImDxy,ImDx2,ImDy2,ImDtDx,ImDtDy;
134 | 	DImage A11,A12,A22,b1,b2;
135 | 	DImage foo1,foo2;
136 | 
137 | 	// variables for conjugate gradient
138 | 	DImage r1,r2,p1,p2,q1,q2;
139 | 	double* rou;
140 | 	rou=new double[nCGIterations];
141 | 
142 | 	double varepsilon_phi=pow(0.001,2);
143 | 	double varepsilon_psi=pow(0.001,2);
144 | 
145 | 	//--------------------------------------------------------------------------
146 | 	// the outer fixed point iteration
147 | 	//--------------------------------------------------------------------------
148 | 	for(int count=0;count<nOuterFPIterations;count++)
149 | 	{
150 | 		// compute the gradient
151 | 		getDxs(imdx,imdy,imdt,Im1,warpIm2);
152 | 
153 | 		// generate the mask to set the weight of the pxiels moving outside of the image boundary to be zero
154 | 		genInImageMask(mask,vx,vy);
155 | 
156 | 		// set the derivative of the flow field to be zero
157 | 		du.reset();
158 | 		dv.reset();
159 | 
160 | 		//--------------------------------------------------------------------------
161 | 		// the inner fixed point iteration
162 | 		//--------------------------------------------------------------------------
163 | 		for(int hh=0;hh<nInnerFPIterations;hh++)
164 | 		{
165 | 			// compute the derivatives of the current flow field
166 | 			if(hh==0)
167 | 			{
168 | 				uu.copyData(u);
169 | 				vv.copyData(v);
170 | 			}
171 | 			else
172 | 			{
173 | 				uu.Add(u,du);
174 | 				vv.Add(v,dv);
175 | 			}
176 | 			uu.dx(ux);
177 | 			uu.dy(uy);
178 | 			vv.dx(vx);
179 | 			vv.dy(vy);
180 | 
181 | 			// compute the weight of phi
182 | 			Phi_1st.reset();
183 | 			double* phiData=Phi_1st.data();
184 | 			double temp;
185 | 			const double *uxData,*uyData,*vxData,*vyData;
186 | 			uxData=ux.data();
187 | 			uyData=uy.data();
188 | 			vxData=vx.data();
189 | 			vyData=vy.data();
190 | 			for(int i=0;i<nPixels;i++)
191 | 			{
192 | 				temp=uxData[i]*uxData[i]+uyData[i]*uyData[i]+vxData[i]*vxData[i]+vyData[i]*vyData[i];
193 | 				phiData[i]=1/(2*sqrt(temp+varepsilon_phi));
194 | 			}
195 | 
196 | 			// compute the nonlinear term of psi
197 | 			Psi_1st.reset();
198 | 			double* psiData=Psi_1st.data();
199 | 			const double *imdxData,*imdyData,*imdtData;
200 | 			const double *duData,*dvData;
201 | 			imdxData=imdx.data();
202 | 			imdyData=imdy.data();
203 | 			imdtData=imdt.data();
204 | 			duData=du.data();
205 | 			dvData=dv.data();
206 | 		
207 | 			double _a  = 10000, _b = 0.1;
208 | 			if(nChannels==1)
209 | 			{
210 | 				for(int i=0;i<nPixels;i++)
211 | 				{
212 | 					temp=imdtData[i]+imdxData[i]*duData[i]+imdyData[i]*dvData[i];
213 | 					//if(temp*temp<0.04)
214 | 					psiData[i]=1/(2*sqrt(temp*temp+varepsilon_psi));
215 | 					//psiData[i] = _a*_b/(1+_a*temp*temp);
216 | 				}
217 | 			}
218 | 			else
219 | 			{
220 | 				for(int i=0;i<nPixels;i++)
221 | 					for(int k=0;k<nChannels;k++)
222 | 					{
223 | 						int offset=i*nChannels+k;
224 | 						temp=imdtData[offset]+imdxData[offset]*duData[i]+imdyData[offset]*dvData[i];
225 | 						//if(temp*temp<0.04)
226 | 						psiData[offset]=1/(2*sqrt(temp*temp+varepsilon_psi));
227 | 						//psiData[offset] =  _a*_b/(1+_a*temp*temp);
228 | 					}
229 | 			}
230 | 
231 | 			// prepare the components of the large linear system
232 | 			ImDxy.Multiply(Psi_1st,imdx,imdy);
233 | 			ImDx2.Multiply(Psi_1st,imdx,imdx);
234 | 			ImDy2.Multiply(Psi_1st,imdy,imdy);
235 | 			ImDtDx.Multiply(Psi_1st,imdx,imdt);
236 | 			ImDtDy.Multiply(Psi_1st,imdy,imdt);
237 | 
238 | 			if(nChannels>1)
239 | 			{
240 | 				ImDxy.collapse(imdxy);
241 | 				ImDx2.collapse(imdx2);
242 | 				ImDy2.collapse(imdy2);
243 | 				ImDtDx.collapse(imdtdx);
244 | 				ImDtDy.collapse(imdtdy);
245 | 			}
246 | 			else
247 | 			{
248 | 				imdxy.copyData(ImDxy);
249 | 				imdx2.copyData(ImDx2);
250 | 				imdy2.copyData(ImDy2);
251 | 				imdtdx.copyData(ImDtDx);
252 | 				imdtdy.copyData(ImDtDy);
253 | 			}
254 | 
255 | 			// filtering
256 | 			imdx2.smoothing(A11,3);
257 | 			imdxy.smoothing(A12,3);
258 | 			imdy2.smoothing(A22,3);
259 | 
260 | 			// add epsilon to A11 and A22
261 | 			A11.Add(alpha*0.1);
262 | 			A22.Add(alpha*0.1);
263 | 
264 | 			// form b
265 | 			imdtdx.smoothing(b1,3);
266 | 			imdtdy.smoothing(b2,3);
267 | 			// laplacian filtering of the current flow field
268 | 		    Laplacian(foo1,u,Phi_1st);
269 | 			Laplacian(foo2,v,Phi_1st);
270 | 			double *b1Data,*b2Data;
271 | 			const double *foo1Data,*foo2Data;
272 | 			b1Data=b1.data();
273 | 			b2Data=b2.data();
274 | 			foo1Data=foo1.data();
275 | 			foo2Data=foo2.data();
276 | 
277 | 			for(int i=0;i<nPixels;i++)
278 | 			{
279 | 				b1Data[i]=-b1Data[i]-alpha*foo1Data[i];
280 | 				b2Data[i]=-b2Data[i]-alpha*foo2Data[i];
281 | 			}
282 | 
283 | 			// for debug only, displaying the matrix coefficients
284 | 			//A11.imwrite("A11.bmp",ImageIO::normalized);
285 | 			//A12.imwrite("A12.bmp",ImageIO::normalized);
286 | 			//A22.imwrite("A22.bmp",ImageIO::normalized);
287 | 			//b1.imwrite("b1.bmp",ImageIO::normalized);
288 | 			//b2.imwrite("b2.bmp",ImageIO::normalized);
289 | 
290 | 			//-----------------------------------------------------------------------
291 | 			// conjugate gradient algorithm
292 | 			//-----------------------------------------------------------------------
293 | 			r1.copyData(b1);
294 | 			r2.copyData(b2);
295 | 			du.reset();
296 | 			dv.reset();
297 | 
298 | 			for(int k=0;k<nCGIterations;k++)
299 | 			{
300 | 				rou[k]=r1.norm2()+r2.norm2();
301 | 				//cout<<rou[k]<<endl;
302 | 				if(rou[k]<1E-10)
303 | 					break;
304 | 				if(k==0)
305 | 				{
306 | 					p1.copyData(r1);
307 | 					p2.copyData(r2);
308 | 				}
309 | 				else
310 | 				{
311 | 					double ratio=rou[k]/rou[k-1];
312 | 					p1.Add(r1,p1,ratio);
313 | 					p2.Add(r2,p2,ratio);
314 | 				}
315 | 				// go through the large linear system
316 | 				foo1.Multiply(A11,p1);
317 | 				foo2.Multiply(A12,p2);
318 | 				q1.Add(foo1,foo2);
319 | 				Laplacian(foo1,p1,Phi_1st);
320 | 				q1.Add(foo1,alpha);
321 | 
322 | 				foo1.Multiply(A12,p1);
323 | 				foo2.Multiply(A22,p2);
324 | 				q2.Add(foo1,foo2);
325 | 				Laplacian(foo2,p2,Phi_1st);
326 | 				q2.Add(foo2,alpha);
327 | 
328 | 				double beta;
329 | 				beta=rou[k]/(p1.innerproduct(q1)+p2.innerproduct(q2));
330 | 				
331 | 				du.Add(p1,beta);
332 | 				dv.Add(p2,beta);
333 | 
334 | 				r1.Add(q1,-beta);
335 | 				r2.Add(q2,-beta);
336 | 			}
337 | 			//-----------------------------------------------------------------------
338 | 			// end of conjugate gradient algorithm
339 | 			//-----------------------------------------------------------------------
340 | 		}// end of inner fixed point iteration
341 | 		
342 | 		// the following procedure is merely for debugging
343 | 		//cout<<"du "<<du.norm2()<<" dv "<<dv.norm2()<<endl;
344 | 		// update the flow field
345 | 		u.Add(du,1);
346 | 		v.Add(dv,1);
347 | 		warpFL(warpIm2,Im1,Im2,u,v);
348 | 	}// end of outer fixed point iteration
349 | 	
350 | 	
351 | 	delete rou;
352 | }
353 | 
354 | void OpticalFlow::Laplacian(DImage &output, const DImage &input, const DImage& weight)
355 | {
356 | 	if(output.matchDimension(input)==false)
357 | 		output.allocate(input);
358 | 	output.reset();
359 | 
360 | 	if(input.matchDimension(weight)==false)
361 | 	{
362 | 		cout<<"Error in image dimension matching OpticalFlow::Laplacian()!"<<endl;
363 | 		return;
364 | 	}
365 | 	
366 | 	const double *inputData=input.data(),*weightData=weight.data();
367 | 	int width=input.width(),height=input.height();
368 | 	DImage foo(width,height);
369 | 	double *fooData=foo.data(),*outputData=output.data();
370 | 
371 | 	// horizontal filtering
372 | 	for(int i=0;i<height;i++)
373 | 		for(int j=0;j<width-1;j++)
374 | 		{
375 | 			int offset=i*width+j;
376 | 			fooData[offset]=(inputData[offset+1]-inputData[offset])*weightData[offset];
377 | 		}
378 | 	for(int i=0;i<height;i++)
379 | 		for(int j=0;j<width;j++)
380 | 		{
381 | 			int offset=i*width+j;
382 | 			if(j<width-1)
383 | 				outputData[offset]-=fooData[offset];
384 | 			if(j>0)
385 | 				outputData[offset]+=fooData[offset-1];
386 | 		}
387 | 	foo.reset();
388 | 	// vertical filtering
389 | 	for(int i=0;i<height-1;i++)
390 | 		for(int j=0;j<width;j++)
391 | 		{
392 | 			int offset=i*width+j;
393 | 			fooData[offset]=(inputData[offset+width]-inputData[offset])*weightData[offset];
394 | 		}
395 | 	for(int i=0;i<height;i++)
396 | 		for(int j=0;j<width;j++)
397 | 		{
398 | 			int offset=i*width+j;
399 | 			if(i<height-1)
400 | 				outputData[offset]-=fooData[offset];
401 | 			if(i>0)
402 | 				outputData[offset]+=fooData[offset-width];
403 | 		}
404 | }
405 | 
406 | void OpticalFlow::testLaplacian(int dim)
407 | {
408 | 	// generate the random weight
409 | 	DImage weight(dim,dim);
410 | 	for(int i=0;i<dim;i++)
411 | 		for(int j=0;j<dim;j++)
412 | 			//weight.data()[i*dim+j]=(double)rand()/RAND_MAX+1;
413 | 			weight.data()[i*dim+j]=1;
414 | 	// go through the linear system;
415 | 	DImage sysMatrix(dim*dim,dim*dim);
416 | 	DImage u(dim,dim),du(dim,dim);
417 | 	for(int i=0;i<dim*dim;i++)
418 | 	{
419 | 		u.reset();
420 | 		u.data()[i]=1;
421 | 		Laplacian(du,u,weight);
422 | 		for(int j=0;j<dim*dim;j++)
423 | 			sysMatrix.data()[j*dim*dim+i]=du.data()[j];
424 | 	}
425 | 	// test whether the matrix is symmetric
426 | 	for(int i=0;i<dim*dim;i++)
427 | 	{
428 | 		for(int j=0;j<dim*dim;j++)
429 | 		{
430 | 			if(sysMatrix.data()[i*dim*dim+j]>=0)
431 | 				printf(" ");
432 | 			printf(" %1.0f ",sysMatrix.data()[i*dim*dim+j]);
433 | 		}
434 | 		printf("\n");
435 | 	}
436 | }
437 | 
438 | //--------------------------------------------------------------------------------------
439 | // function to perfomr coarse to fine optical flow estimation
440 | //--------------------------------------------------------------------------------------
441 | void OpticalFlow::Coarse2FineFlow(DImage &vx, DImage &vy, DImage &warpI2,const DImage &Im1, const DImage &Im2, double alpha, double ratio, int minWidth, 
442 | 																	 int nOuterFPIterations, int nInnerFPIterations, int nCGIterations)
443 | {
444 | 	// first build the pyramid of the two images
445 | 	GaussianPyramid GPyramid1;
446 | 	GaussianPyramid GPyramid2;
447 | 	if(IsDisplay)
448 | 		cout<<"Constructing pyramid...";
449 | 	GPyramid1.ConstructPyramid(Im1,ratio,minWidth);
450 | 	GPyramid2.ConstructPyramid(Im2,ratio,minWidth);
451 | 	if(IsDisplay)
452 | 		cout<<"done!"<<endl;
453 | 	
454 | 	// now iterate from the top level to the bottom
455 | 	DImage Image1,Image2,WarpImage2;
456 | 
457 | 	for(int k=GPyramid1.nlevels()-1;k>=0;k--)
458 | 	{
459 | 		if(IsDisplay)
460 | 			cout<<"Pyramid level "<<k;
461 | 		int width=GPyramid1.Image(k).width();
462 | 		int height=GPyramid1.Image(k).height();
463 | 		im2feature(Image1,GPyramid1.Image(k));
464 | 		im2feature(Image2,GPyramid2.Image(k));
465 | 
466 | 		if(k==GPyramid1.nlevels()-1) // if at the top level
467 | 		{
468 | 			vx.allocate(width,height);
469 | 			vy.allocate(width,height);
470 | 			//warpI2.copyData(Image2);
471 | 			WarpImage2.copyData(Image2);
472 | 		}
473 | 		else
474 | 		{
475 | 
476 | 			vx.imresize(width,height);
477 | 			vx.Multiplywith(1/ratio);
478 | 			vy.imresize(width,height);
479 | 			vy.Multiplywith(1/ratio);
480 | 			//warpFL(warpI2,GPyramid1.Image(k),GPyramid2.Image(k),vx,vy);
481 | 			warpFL(WarpImage2,Image1,Image2,vx,vy);
482 | 		}
483 | 		//SmoothFlowPDE(GPyramid1.Image(k),GPyramid2.Image(k),warpI2,vx,vy,alpha,nOuterFPIterations,nInnerFPIterations,nCGIterations);
484 | 		//SmoothFlowPDE(Image1,Image2,WarpImage2,vx,vy,alpha*pow((1/ratio),k),nOuterFPIterations,nInnerFPIterations,nCGIterations);
485 | 		SmoothFlowPDE(Image1,Image2,WarpImage2,vx,vy,alpha,nOuterFPIterations,nInnerFPIterations,nCGIterations);
486 | 		if(IsDisplay)
487 | 			cout<<endl;
488 | 	}
489 | 	warpFL(warpI2,Im1,Im2,vx,vy);
490 | }
491 | 
492 | //---------------------------------------------------------------------------------------
493 | // function to convert image to feature image
494 | //---------------------------------------------------------------------------------------
495 | void OpticalFlow::im2feature(DImage &imfeature, const DImage &im)
496 | {
497 | 	int width=im.width();
498 | 	int height=im.height();
499 | 	int nchannels=im.nchannels();
500 | 	if(nchannels==1)
501 | 	{
502 | 		imfeature.allocate(im.width(),im.height(),3);
503 | 		DImage imdx,imdy;
504 | 		im.dx(imdx,true);
505 | 		im.dy(imdy,true);
506 | 		double* data=imfeature.data();
507 | 		for(int i=0;i<height;i++)
508 | 			for(int j=0;j<width;j++)
509 | 			{
510 | 				int offset=i*width+j;
511 | 				data[offset*3]=im.data()[offset];
512 | 				data[offset*3+1]=imdx.data()[offset];
513 | 				data[offset*3+2]=imdy.data()[offset];
514 | 			}
515 | 	}
516 | 	else if(nchannels==3)
517 | 	{
518 | 		DImage grayImage;
519 | 		im.desaturate(grayImage);
520 | 
521 | 		imfeature.allocate(im.width(),im.height(),5);
522 | 		DImage imdx,imdy;
523 | 		grayImage.dx(imdx,true);
524 | 		grayImage.dy(imdy,true);
525 | 		double* data=imfeature.data();
526 | 		for(int i=0;i<height;i++)
527 | 			for(int j=0;j<width;j++)
528 | 			{
529 | 				int offset=i*width+j;
530 | 				data[offset*5]=grayImage.data()[offset];
531 | 				data[offset*5+1]=imdx.data()[offset];
532 | 				data[offset*5+2]=imdy.data()[offset];
533 | 				data[offset*5+3]=im.data()[offset*3+1]-im.data()[offset*3];
534 | 				data[offset*5+4]=im.data()[offset*3+1]-im.data()[offset*3+2];
535 | 			}
536 | 	}
537 | 	else
538 | 		imfeature.copyData(im);
539 | }
540 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
 1 | # liuflow: a wrapper around C.Liu's optical flow
 2 | 
Note: this bit of code is a simple wrapper around the optical-flow
algorithm developed/published by C. Liu:
 5 | 
 6 | C. Liu. Beyond Pixels: Exploring New Representations and Applications
 7 | for Motion Analysis. Doctoral Thesis. Massachusetts Institute of 
 8 | Technology. May 2009.
 9 | 
10 | More at: http://people.csail.mit.edu/celiu/OpticalFlow/
11 | 


--------------------------------------------------------------------------------
/img1.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/clementfarabet/lua---liuflow/0c5d1064c848085eb7a65b39e98f07c0b918908f/img1.jpg


--------------------------------------------------------------------------------
/img2.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/clementfarabet/lua---liuflow/0c5d1064c848085eb7a65b39e98f07c0b918908f/img2.jpg


--------------------------------------------------------------------------------
/init.lua:
--------------------------------------------------------------------------------
  1 | -- 
-- Note: this bit of code is a simple wrapper around the optical-flow
-- algorithm developed/published by C. Liu:
  4 | --
  5 | -- C. Liu. Beyond Pixels: Exploring New Representations and Applications
  6 | -- for Motion Analysis. Doctoral Thesis. Massachusetts Institute of 
  7 | -- Technology. May 2009.
  8 | --
  9 | -- More at: http://people.csail.mit.edu/celiu/OpticalFlow/
 10 | --
 11 | -- Wrapper: Clement Farabet.
 12 | -- 
 13 | 
 14 | -- load C lib
 15 | require 'libliuflow'
 16 | 
-- help text handed to dok.unpack by liuflow.infer
local infer_help_desc =
[[Computes the optical flow of a pair of images, and returns
the norm and the direction fields, plus a warped version of the second
image, according to the flow field.

The flow field is computed using CG, as described in
"Exploring New Representations and Applications for Motion Analysis",
by C. Liu (Doctoral Thesis).
More at http://people.csail.mit.edu/celiu/OpticalFlow/

The input images must be a NxHxW tensor, where N is the number
of channels (colors).]]
 29 | 
 30 | ------------------------------------------------------------
 31 | -- Liu's optical flow algorithm.
 32 | --
 33 | -- C. Liu. Beyond Pixels: Exploring New Representations and Applications
 34 | -- for Motion Analysis. Doctoral Thesis. Massachusetts Institute of 
 35 | -- Technology. May 2009.
 36 | --
 37 | -- To load: require 'liuflow'
 38 | --
 39 | -- @release 2010 Clement Farabet
 40 | ------------------------------------------------------------
 41 | liuflow = {}
 42 | 
 43 | ------------------------------------------------------------
 44 | -- Computes the optical flow of a pair of images, and returns
 45 | -- the norm and the direction fields, plus a warped version of the second
 46 | -- image, according to the flow field.
 47 | --
 48 | -- The flow field is computed using CG, as described in
 49 | -- "Exploring New Representations and Applications for Motion Analysis",
 50 | -- by C. Liu (Doctoral Thesis).
 51 | -- More at http://people.csail.mit.edu/celiu/OpticalFlow/
 52 | --
 53 | -- The input images must be a NxHxW tensor, where N is the number
 54 | -- of channels (colors).
 55 | --
 56 | -- @usage opticalFlow.infer() -- prints online help
 57 | --
 58 | -- @param pair  a pair of images (2 NxHxW tensor) [type = table]
 59 |    -- @param image1  the first image (NxHxW tensor) [type = torch.Tensor]
 60 | -- @param image2  the second image (NxHxW tensor) [type = torch.Tensor]
 61 | -- @param alpha  regularization weight [default = 0.01] [type = number]
 62 | -- @param ratio  downsample ratio [default = 0.75] [type = number]
 63 | -- @param minWidth  width of the coarsest level [default = 30] [type = number]
 64 | -- @param nOuterFPIterations  number of outer fixed-point iterations [default = 15] [type = number]
 65 | -- @param nInnerFPIterations  number of inner fixed-point iterations [default = 1] [type = number]
 66 | -- @param nCGIterations  number of CG iterations [default = 20] [type = number]
 67 | ------------------------------------------------------------
 68 | liuflow.infer = function(...)
 69 |            -- check args
 70 |            local args, pair, img1, img2, alpha, ratio, minWidth, 
 71 |            nOuterFPIterations, nInnerFPIterations, nCGIterations = dok.unpack(
 72 |               {...},
 73 |               'opticalFlow.infer',
 74 |               infer_help_desc,
 75 |               {arg='pair', type='table', help='a pair of images (2 NxHxW tensor)'},
 76 |               {arg='image1', type='torch.Tensor', help='the first image (NxHxW tensor)'},
 77 |               {arg='image2', type='torch.Tensor', help='the second image (NxHxW tensor)'},
 78 |               {arg='alpha', type='number', help='regularization weight', default=0.01},
 79 |               {arg='ratio', type='number', help='downsample ratio', default=0.75},
 80 |               {arg='minWidth', type='number', help='width of the coarsest level', default=30},
 81 |               {arg='nOuterFPIterations', type='number', help='number of outer fixed-point iterations', default=15},
 82 |               {arg='nInnerFPIterations', type='number', help='number of inner fixed-point iterations', default=1},
 83 |               {arg='nCGIterations', type='number', help='number of CG iterations', default=20}
 84 |            )
 85 |            
 86 |            -- pair ?
 87 |            if pair then 
 88 |               img1 = pair[1]
 89 |               img2 = pair[2]
 90 |            end
 91 | 
 92 |            -- check dims
 93 |            if img1:nDimension() ~= 3 then
 94 |               error('image should be a NxHxW tensor')
 95 |            end
 96 | 
 97 |            -- compute flow
 98 |            local flow_x, flow_y, warp = libliuflow.infer(img1, img2,
 99 |                                                          alpha, ratio, minWidth,
100 |                                                          nOuterFPIterations, nInnerFPIterations,
101 |                                                          nCGIterations)
102 | 
103 |    	     local flow_norm  = liuflow.computeNorm(flow_x,flow_y)
104 | 	        local flow_angle = liuflow.computeAngle(flow_x,flow_y)
105 | 
106 |            -- return results
107 |            return flow_norm, flow_angle, warp, flow_x, flow_y
108 |         end
109 | 
-- warper: applies a flow field to an image through libliuflow.warp
liuflow.warp = function(...)
   local help_text = 'warps an image according to a flow field:\n'
      ..'if flow was computed from img1->img2, then warp(img2,vx,vy) will compute\n'
      ..'a reconstruction of img1'

   local args, source, flow_x, flow_y = dok.unpack(
      {...},
      'opticalFlow.warp',
      help_text,
      {arg='image', type='torch.Tensor', help='input image (NxHxW tensor)', req=true},
      {arg='flow_x', type='torch.Tensor', help='x component of flow field', req=true},
      {arg='flow_y', type='torch.Tensor', help='y component of flow field', req=true}
   )

   -- only NxHxW images are accepted
   local is_3d = (source:nDimension() == 3)
   if not is_3d then
      xerror('image should be a NxHxW tensor',nil,args.usage)
   end

   return libliuflow.warp(source, flow_x, flow_y)
end
127 | 
128 | ------------------------------------------------------------
129 | -- Computes the optical flow on some example images
130 | --
131 | -- @see                  opticalFlow.infer
132 | ------------------------------------------------------------
liuflow.testme = function()
   require 'image'

   -- the two sample frames installed next to the package
   local function load_sample(name)
      return image.load(paths.concat(paths.install_lua_path, 'liuflow/' .. name)):float()
   end
   local frame1 = load_sample('img1.jpg')
   local frame2 = load_sample('img2.jpg')

   -- both frames are scaled to half the size of the first one
   local half_w = frame1:size(3)/2
   local half_h = frame1:size(2)/2
   local small1 = image.scale(frame1, half_w, half_h)
   local small2 = image.scale(frame2, half_w, half_h)

   print('computing optical on ' .. small1:size(3) .. 'x' .. small1:size(2) .. ' image')

   local norm, angle, warped = liuflow.infer{ pair={small1,small2},
                                              alpha=0.005,
                                              ratio=0.6,
                                              minWidth=50,
                                              nOuterFPIterations=6,
                                              nInnerFPIterations=1,
                                              nCGIterations=40 }

   -- quantized copies of the norm and angle fields for the second flow picture
   local norm_q = norm:clone():div(norm:max()):mul(6):floor():div(8)
   local angle_q = angle:clone():div(360/16):floor():mul(360/16)

   local panels = {small1, liuflow.field2rgb(norm,angle),
                   small1, (small2-small1):abs(),
                   small2, liuflow.field2rgb(norm_q,angle_q),
                   warped, (warped-small1):abs()}
   local captions = {'input 1', 'flow field', 'input 1',
                     'input 1 - input 2',
                     'input 2', 'quantized flow field',
                     'warped(input 2)',
                     'input 1 - warped(input 2)'}

   image.display{image=panels,
                 zoom=1,
                 min=0, max=1,
                 nrow=4,
                 legends=captions,
                 legend="optical flow, method = C.Liu"}

   return norm, angle, warped
end
170 | 
171 | ------------------------------------------------------------
172 | -- computes norm (size) of flow field from flow_x and flow_y,
173 | --
174 | -- @usage liuflow.computeNorm() -- prints online help
175 | --
176 | -- @param flow_x  flow field (x), (WxH) [required] [type = torch.Tensor]
177 | -- @param flow_y  flow field (y), (WxH) [required] [type = torch.Tensor]
178 | ------------------------------------------------------------
179 | liuflow.computeNorm = function(...)
180 |                  -- parse arguments (dok.unpack is given the help text as well)
181 |                  local _, flow_x, flow_y = dok.unpack(
182 |                     {...},
183 |                     'opticalFlow.computeNorm',
184 |                     'computes norm (size) of flow field from flow_x and flow_y,\n',
185 |                     {arg='flow_x', type='torch.Tensor', help='flow field (x), (WxH)', req=true},
186 |                     {arg='flow_y', type='torch.Tensor', help='flow field (y), (WxH)', req=true}
187 |                  )
188 |                  -- element-wise sqrt(y*y + x*x); both inputs are cloned, so they stay untouched
189 |                  local result = flow_y:clone():cmul(flow_y):add(flow_x:clone():cmul(flow_x))
190 |                  result:sqrt()
191 |                  return result
192 |               end
193 | 
194 | ------------------------------------------------------------
195 | -- computes angle (direction) of flow field from flow_x and flow_y,
196 | --
197 | -- @usage liuflow.computeAngle() -- prints online help
198 | --
199 | -- @param flow_x  flow field (x), (WxH) [required] [type = torch.Tensor]
200 | -- @param flow_y  flow field (y), (WxH) [required] [type = torch.Tensor]
201 | ------------------------------------------------------------
202 | liuflow.computeAngle = function(...)
203 |                   -- parse arguments (dok.unpack is given the help text as well)
204 |                   local _, flow_x, flow_y = dok.unpack(
205 |                      {...},
206 |                      'opticalFlow.computeAngle',
207 |                      'computes angle (direction) of flow field from flow_x and flow_y,\n',
208 |                      {arg='flow_x', type='torch.Tensor', help='flow field (x), (WxH)', req=true},
209 |                      {arg='flow_y', type='torch.Tensor', help='flow field (y), (WxH)', req=true}
210 |                   )
211 |                   -- first-quadrant angle in degrees: atan(|y/x|) * 180/pi
212 |                   local degrees = flow_y:clone():cdiv(flow_x):abs():atan():mul(180/math.pi)
213 |                   -- unfold into the proper quadrant from the signs of x and y; a branch that
214 |                   -- returns nothing presumably keeps the precomputed value (the x>0, y>=0 case)
215 |                   local function unfold(h, x, y)
216 |                      if x == 0 then
217 |                         if y >= 0 then return 90 end
218 |                         if y <= 0 then return 270 end
219 |                      elseif x > 0 then
220 |                         if y < 0 then return 360 - h end
221 |                      elseif x < 0 then
222 |                         if y >= 0 then return 180 - h end
223 |                         if y < 0 then return 180 + h end
224 |                      end
225 |                   end
226 |                   degrees:map2(flow_x, flow_y, unfold)
227 |                   return degrees
228 |                end
229 | 
230 | ------------------------------------------------------------
231 | -- merges Norm and Angle flow fields into a single RGB image,
232 | -- where saturation=intensity, and hue=direction
233 | --
234 | -- @usage liuflow.field2rgb() -- prints online help
235 | --
236 | -- @param norm  flow field (norm), (WxH) [required] [type = torch.Tensor]
237 | -- @param angle  flow field (angle), (WxH) [required] [type = torch.Tensor]
238 | -- @param max  if not provided, norm:max() is used [type = number]
239 | -- @param legend  prints a legend on the image [type = boolean]
240 | ------------------------------------------------------------
241 | liuflow.field2rgb = function (...)
242 |                -- parse arguments (dok.unpack is given the help text as well)
243 |                local _, norm, angle, max, legend = dok.unpack(
244 |                   {...},
245 |                   'opticalFlow.field2rgb',
246 |                   'merges Norm and Angle flow fields into a single RGB image,\n'
247 |                      .. 'where saturation=intensity, and hue=direction',
248 |                   {arg='norm', type='torch.Tensor', help='flow field (norm), (WxH)', req=true},
249 |                   {arg='angle', type='torch.Tensor', help='flow field (angle), (WxH)', req=true},
250 |                   {arg='max', type='number', help='if not provided, norm:max() is used'},
251 |                   {arg='legend', type='boolean', help='prints a legend on the image', default=false}
252 |                )
253 | 
254 |                -- an explicit max switches on tanh squashing of the saturation;
255 |                -- the normalizer (taken before any slicing below) is floored at 1e-2
256 |                local squash = max and true or false
257 |                local scale = math.max(max or norm:max(), 1e-2)
258 | 
259 |                -- for 3D inputs only the first slice is used
260 |                if norm:nDimension() == 3 then norm = norm[1] end
261 |                if angle:nDimension() == 3 then angle = angle[1] end
262 | 
263 |                -- build the three HSL planes
264 |                local hsl = torch.Tensor(3, norm:size(1), norm:size(2))
265 |                local hue, sat, light = hsl:select(1,1), hsl:select(1,2), hsl:select(1,3)
266 |                -- hue = angle / 360
267 |                hue:copy(angle):div(360)
268 |                -- saturation = norm / scale (tanh-squashed when max was given)
269 |                sat:copy(norm):div(scale)
270 |                if squash then sat:tanh() end
271 |                -- lightness = 1 - saturation/2 (null flow = white)
272 |                light:copy(sat):mul(-0.5):add(1)
273 | 
274 |                -- convert HSL to RGB
275 |                local rgb = image.hsl2rgb(hsl)
276 | 
277 |                -- optional legend: scaled to hsl:size(2)/8 in both directions and copied
278 |                -- over the first entries of dimension 3 / last entries of dimension 2
279 |                if legend then
280 |                   -- the loaded legend picture is cached in the global _legend_
281 |                   _legend_ = _legend_
282 |                      or image.load(paths.concat(paths.install_lua_path, 'liuflow/legend.png'))
283 |                   local side = hsl:size(2)/8
284 |                   local thumb = image.scale(_legend_, side, side)
285 |                   local n = thumb:size(2)
286 |                   rgb:narrow(3,1,n):narrow(2,hsl:size(2)-n+1,n):copy(thumb)
287 |                end
288 | 
289 |                return rgb
290 |             end
291 | 
292 | ------------------------------------------------------------
293 | -- Renders an (x,y) displacement field as an RGB image: the field is
294 | -- converted to norm/angle and handed to liuflow.field2rgb (HSL coloring)
295 | --
296 | -- @usage liuflow.xy2rgb() -- prints online help
297 | --
298 | -- @param x  flow field (x), (WxH) [required] [type = torch.Tensor]
299 | -- @param y  flow field (y), (WxH) [required] [type = torch.Tensor]
300 | -- @param max  if not provided, norm:max() is used [type = number]
301 | ------------------------------------------------------------
302 | liuflow.xy2rgb = function (...)
303 |             -- check args (help strings describe x and y as displacements, not norm/angle)
304 |             local args, x, y, max = dok.unpack(
305 |                {...},
306 |                'opticalFlow.xy2rgb',
307 |                'merges x and y flow fields into a single RGB image,\n'
308 |                   .. 'where saturation=intensity, and hue=direction',
309 |                {arg='x', type='torch.Tensor', help='flow field (x), (WxH)', req=true},
310 |                {arg='y', type='torch.Tensor', help='flow field (y), (WxH)', req=true},
311 |                {arg='max', type='number', help='if not provided, norm:max() is used'}
312 |             )
313 |             local norm = liuflow.computeNorm(x,y)
314 |             local angle = liuflow.computeAngle(x,y)
315 |             return liuflow.field2rgb(norm,angle,max)
316 |          end
317 | 


--------------------------------------------------------------------------------
/legend.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/clementfarabet/lua---liuflow/0c5d1064c848085eb7a65b39e98f07c0b918908f/legend.png


--------------------------------------------------------------------------------
/liuflow.cpp:
--------------------------------------------------------------------------------
  1 | 
  2 | // To load this lib in LUA:
  3 | // require 'libliuflow'
  4 | 
  5 | #include <luaT.h>
  6 | #include <TH.h>
  7 | 
  8 | #include "project.h"
  9 | #include "Image.h"
 10 | #include "OpticalFlow.h"
 11 | #include <iostream>
 12 | 
 13 | using namespace std;
 14 | 
 15 | // conversion functions
 16 | static DImage *tensor_to_image(THFloatTensor *tensor) {
 17 |   // Copies a 3D float tensor, read as (channel, row, column), into a newly
 18 |   // allocated DImage(width, height, channels). The image is created with
 19 |   // new, so the caller is responsible for deleting it.
 20 |   const int channels = tensor->size[0];
 21 |   const int height = tensor->size[1];
 22 |   const int width = tensor->size[2];
 23 |   DImage *image = new DImage(width, height, channels);
 24 | 
 25 |   // The destination buffer is written sequentially: the channel index
 26 |   // varies fastest, then the column, then the row.
 27 |   double *out = image->data();
 28 |   for (int row = 0; row < height; ++row) {
 29 |     for (int col = 0; col < width; ++col) {
 30 |       for (int ch = 0; ch < channels; ++ch) {
 31 |         *out++ = THFloatTensor_get3d(tensor, ch, row, col);
 32 |       }
 33 |     }
 34 |   }
 35 | 
 36 |   return image;
 37 | }
 38 | 
 39 | static THFloatTensor *image_to_tensor(DImage *img) {
 40 |   // Builds a new (nchannels x height x width) float tensor from a DImage;
 41 |   // the image buffer is read sequentially, channel index varying fastest.
 42 |   THFloatTensor *result = THFloatTensor_newWithSize3d(img->nchannels(), img->height(), img->width());
 43 |   const long channels = result->size[0];
 44 |   const long height = result->size[1];
 45 |   const long width = result->size[2];
 46 | 
 47 |   double *in = img->data();
 48 |   for (long row = 0; row < height; ++row) {
 49 |     for (long col = 0; col < width; ++col) {
 50 |       for (long ch = 0; ch < channels; ++ch) {
 51 |         THFloatTensor_set3d(result, ch, row, col, *in++);
 52 |       }
 53 |     }
 54 |   }
 55 | 
 56 |   return result;
 57 | }
 58 | 
 59 | int optflow_lua(lua_State *L) {
 60 |   // Lua binding, exported as "infer" in the registration table.
 61 |   // Stack slots 1 and 2 must hold torch.FloatTensor images; slots 3..8 may
 62 |   // hold numbers overriding alpha, ratio, minWidth, nOuterFPIterations,
 63 |   // nInnerFPIterations and nCGIterations (in that order).
 64 |   // Returns three torch.FloatTensor values: vx, vy and the warped image.
 65 |   THFloatTensor *first = (THFloatTensor *)luaT_checkudata(L, 1, luaT_checktypename2id(L, "torch.FloatTensor"));
 66 |   THFloatTensor *second = (THFloatTensor *)luaT_checkudata(L, 2, luaT_checktypename2id(L, "torch.FloatTensor"));
 67 | 
 68 |   // each parameter falls back to its default unless a number sits at its
 69 |   // slot; integer parameters are converted from the Lua number implicitly
 70 |   double alpha = lua_isnumber(L, 3) ? lua_tonumber(L, 3) : 0.01;
 71 |   double ratio = lua_isnumber(L, 4) ? lua_tonumber(L, 4) : 0.75;
 72 |   int minWidth = lua_isnumber(L, 5) ? lua_tonumber(L, 5) : 30;
 73 |   int nOuterFPIterations = lua_isnumber(L, 6) ? lua_tonumber(L, 6) : 15;
 74 |   int nInnerFPIterations = lua_isnumber(L, 7) ? lua_tonumber(L, 7) : 1;
 75 |   int nCGIterations = lua_isnumber(L, 8) ? lua_tonumber(L, 8) : 40;
 76 | 
 77 |   // copy tensors to images (heap-allocated, released at the end)
 78 |   DImage *frame1 = tensor_to_image(first);
 79 |   DImage *frame2 = tensor_to_image(second);
 80 | 
 81 |   // run the solver; results are written to the three output images
 82 |   DImage flowX, flowY, warped;
 83 |   OpticalFlow::Coarse2FineFlow(flowX, flowY, warped,   // outputs
 84 |                                *frame1, *frame2,       // inputs
 85 |                                alpha, ratio, minWidth, // params
 86 |                                nOuterFPIterations, nInnerFPIterations, nCGIterations);
 87 | 
 88 |   // convert the results and push them in return order
 89 |   THFloatTensor *out_vx = image_to_tensor(&flowX);
 90 |   THFloatTensor *out_vy = image_to_tensor(&flowY);
 91 |   THFloatTensor *out_warp = image_to_tensor(&warped);
 92 |   luaT_pushudata(L, out_vx, luaT_checktypename2id(L, "torch.FloatTensor"));
 93 |   luaT_pushudata(L, out_vy, luaT_checktypename2id(L, "torch.FloatTensor"));
 94 |   luaT_pushudata(L, out_warp, luaT_checktypename2id(L, "torch.FloatTensor"));
 95 | 
 96 |   // release the input copies
 97 |   delete frame1;
 98 |   delete frame2;
 99 | 
100 |   // three values were pushed for the Lua caller
101 |   return 3;
102 | }
103 | 
104 | int warp_lua(lua_State *L) {
105 |   // Lua binding, exported as "warp": warps an image by a flow field.
106 |   // Stack slots 1..3 hold the input image, vx and vy; one tensor is returned.
107 |   // All data is accessed through the THFloatTensor API, so the arguments are
108 |   // checked (and the result pushed) as torch.FloatTensor, as in optflow_lua.
109 |   THFloatTensor *ten_inp = (THFloatTensor *)luaT_checkudata(L, 1, luaT_checktypename2id(L, "torch.FloatTensor"));
110 |   THFloatTensor *ten_vx = (THFloatTensor *)luaT_checkudata(L, 2, luaT_checktypename2id(L, "torch.FloatTensor"));
111 |   THFloatTensor *ten_vy = (THFloatTensor *)luaT_checkudata(L, 3, luaT_checktypename2id(L, "torch.FloatTensor"));
112 | 
113 |   // copy tensors to images (heap-allocated, released below)
114 |   DImage *input = tensor_to_image(ten_inp);
115 |   DImage *vx = tensor_to_image(ten_vx);
116 |   DImage *vy = tensor_to_image(ten_vy);
117 | 
118 |   // warp; the same input is passed for both image arguments of warpFL
119 |   DImage warpedInput;
120 |   OpticalFlow::warpFL(warpedInput,     // warped input
121 |                       *input, *input, *vx, *vy);
122 | 
123 |   // return result
124 |   THFloatTensor *ten_warp = image_to_tensor(&warpedInput);
125 |   luaT_pushudata(L, ten_warp, luaT_checktypename2id(L, "torch.FloatTensor"));
126 | 
127 |   // cleanup
128 |   delete input;
129 |   delete vx;
130 |   delete vy;
131 |   return 1;
132 | }
133 | 
134 | // Functions exported to Lua: each entry is {name seen from Lua, C function}
135 | static const struct luaL_reg liuflow [] = {
136 |   {"infer", optflow_lua},  // optical flow between two images
137 |   {"warp", warp_lua},  // warp an image with a given flow field
138 |   {NULL, NULL}  /* sentinel */
139 | };
140 | 
141 | extern "C" {  // C linkage, so the entry point keeps its unmangled name
142 |   int luaopen_libliuflow (lua_State *L) {  // called on require 'libliuflow'
143 |     luaL_openlib(L, "libliuflow", liuflow, 0);  // registers the function table under "libliuflow"
144 |     return 1; 
145 |   }
146 | }
147 | 


--------------------------------------------------------------------------------
/project.h:
--------------------------------------------------------------------------------
1 | 
2 | // global min/max macros; arguments are expanded textually and may be evaluated twice
3 | #define __min(x,y) ((x)<(y)?(x):(y))
4 | #define __max(x,y) ((x)>(y)?(x):(y))
5 | 


--------------------------------------------------------------------------------