├── .gitignore
├── LICENSE
├── README.md
├── demo.py
├── examples
    ├── car1.jpg
    ├── car2.jpg
    ├── car2Warped.jpg
    └── outFlow.png
├── pyflow.pyx
├── setup.py
└── src
    ├── Coarse2FineFlowWrapper.cpp
    ├── Coarse2FineFlowWrapper.h
    ├── GaussianPyramid.cpp
    ├── GaussianPyramid.h
    ├── Image.h
    ├── ImageIO.h
    ├── ImageProcessing.h
    ├── Matrix.h
    ├── NoiseModel.h
    ├── OpticalFlow.cpp
    ├── OpticalFlow.h
    ├── Stochastic.cpp
    ├── Stochastic.h
    ├── Vector.h
    └── project.h


/.gitignore:
--------------------------------------------------------------------------------
1 | build
2 | *.cpp
3 | **/*.npy
4 | *.so
5 | examples/car2Warped_new.jpg
6 | examples/outFlow_new.png
7 | *.pyc
8 | __init__.py


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
 1 | This is a Python wrapper around Ce Liu's optical flow code downloaded
 2 | from here: https://people.csail.mit.edu/celiu/OpticalFlow/. The following
 3 | license applies to the Python wrapper only.
 4 | 
 5 | --------------------------------------------------------------------------------
 6 | MIT License
 7 | 
 8 | Copyright (c) 2017 Deepak Pathak
 9 | 
10 | Permission is hereby granted, free of charge, to any person obtaining a copy
11 | of this software and associated documentation files (the "Software"), to deal
12 | in the Software without restriction, including without limitation the rights
13 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
14 | copies of the Software, and to permit persons to whom the Software is
15 | furnished to do so, subject to the following conditions:
16 | 
17 | The above copyright notice and this permission notice shall be included in all
18 | copies or substantial portions of the Software.
19 | 
20 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
21 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
22 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
23 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
24 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
25 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
26 | SOFTWARE.
27 | --------------------------------------------------------------------------------
28 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
 1 | ## Python Dense Optical Flow
 2 | 
 3 | **Python** wrapper for Ce Liu's [C++ implementation](https://people.csail.mit.edu/celiu/OpticalFlow/) of Coarse2Fine Optical Flow. This is a **super fast and accurate** optical flow method based on the Coarse2Fine warping method from Thomas Brox. This Python wrapper has minimal dependencies, and it also eliminates the need for the C++ OpenCV library. For real-time performance, one can additionally resize the images to a smaller size.
 4 | 
 5 | Run the following steps to download, install and demo the library:
 6 |   ```Shell
 7 |   git clone https://github.com/pathak22/pyflow.git
 8 |   cd pyflow/
 9 |   python setup.py build_ext -i
10 |   python demo.py    # -viz option to visualize output
11 |   ```
12 | 
13 | This wrapper code was developed as part of our [CVPR 2017 paper on Unsupervised Learning using unlabeled videos](http://cs.berkeley.edu/~pathak/unsupervised_video/). The GitHub repository for our CVPR 2017 paper is [here](https://github.com/pathak22/unsupervised-video).
14 | 


--------------------------------------------------------------------------------
/demo.py:
--------------------------------------------------------------------------------
 1 | # Author: Deepak Pathak (c) 2016
 2 | 
 3 | from __future__ import absolute_import
 4 | from __future__ import division
 5 | from __future__ import print_function
 6 | # from __future__ import unicode_literals
 7 | import numpy as np
 8 | from PIL import Image
 9 | import time
10 | import argparse
11 | import pyflow
12 | 
13 | parser = argparse.ArgumentParser(
14 |     description='Demo for python wrapper of Coarse2Fine Optical Flow')
15 | parser.add_argument(
16 |     '-viz', dest='viz', action='store_true',
17 |     help='Visualize (i.e. save) output of flow.')
18 | args = parser.parse_args()
19 | 
20 | im1 = np.array(Image.open('examples/car1.jpg'))
21 | im2 = np.array(Image.open('examples/car2.jpg'))
22 | im1 = im1.astype(float) / 255.
23 | im2 = im2.astype(float) / 255.
24 | 
25 | # Flow Options:
26 | alpha = 0.012
27 | ratio = 0.75
28 | minWidth = 20
29 | nOuterFPIterations = 7
30 | nInnerFPIterations = 1
31 | nSORIterations = 30
32 | colType = 0  # 0 or default:RGB, 1:GRAY (but pass gray image with shape (h,w,1))
33 | 
34 | s = time.time()
35 | u, v, im2W = pyflow.coarse2fine_flow(
36 |     im1, im2, alpha, ratio, minWidth, nOuterFPIterations, nInnerFPIterations,
37 |     nSORIterations, colType)
38 | e = time.time()
39 | print('Time Taken: %.2f seconds for image of size (%d, %d, %d)' % (
40 |     e - s, im1.shape[0], im1.shape[1], im1.shape[2]))
41 | flow = np.concatenate((u[..., None], v[..., None]), axis=2)
42 | np.save('examples/outFlow.npy', flow)
43 | 
44 | if args.viz:
45 |     import cv2
46 |     hsv = np.zeros(im1.shape, dtype=np.uint8)
47 |     hsv[:, :, 0] = 255
48 |     hsv[:, :, 1] = 255
49 |     mag, ang = cv2.cartToPolar(flow[..., 0], flow[..., 1])
50 |     hsv[..., 0] = ang * 180 / np.pi / 2
51 |     hsv[..., 2] = cv2.normalize(mag, None, 0, 255, cv2.NORM_MINMAX)
52 |     rgb = cv2.cvtColor(hsv, cv2.COLOR_HSV2BGR)
53 |     cv2.imwrite('examples/outFlow_new.png', rgb)
54 |     cv2.imwrite('examples/car2Warped_new.jpg', im2W[:, :, ::-1] * 255)
55 | 


--------------------------------------------------------------------------------
/examples/car1.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/pathak22/pyflow/8f8ab9e90845f1b819b3833f995f481cb5d92166/examples/car1.jpg


--------------------------------------------------------------------------------
/examples/car2.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/pathak22/pyflow/8f8ab9e90845f1b819b3833f995f481cb5d92166/examples/car2.jpg


--------------------------------------------------------------------------------
/examples/car2Warped.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/pathak22/pyflow/8f8ab9e90845f1b819b3833f995f481cb5d92166/examples/car2Warped.jpg


--------------------------------------------------------------------------------
/examples/outFlow.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/pathak22/pyflow/8f8ab9e90845f1b819b3833f995f481cb5d92166/examples/outFlow.png


--------------------------------------------------------------------------------
/pyflow.pyx:
--------------------------------------------------------------------------------
 1 | # distutils: language = c++
 2 | # distutils: sources = src/Coarse2FineFlowWrapper.cpp
 3 | from __future__ import absolute_import
 4 | from __future__ import division
 5 | from __future__ import print_function
 6 | # from __future__ import unicode_literals
 7 | import numpy as np
 8 | cimport numpy as np
 9 | # Author: Deepak Pathak (c) 2016
10 | 
11 | cdef extern from "src/Coarse2FineFlowWrapper.h":  # C++ entry point wrapped by coarse2fine_flow below
12 |     void Coarse2FineFlowWrapper(double * vx, double * vy, double * warpI2,  # result buffers, allocated by the caller
13 |                                   const double * Im1, const double * Im2,  # the two input images
14 |                                   double alpha, double ratio, int minWidth,
15 |                                   int nOuterFPIterations, int nInnerFPIterations,
16 |                                   int nSORIterations, int colType,
17 |                                   int h, int w, int c);  # dimensions taken from Im1.shape by the caller
18 | 
19 | def coarse2fine_flow(np.ndarray[double, ndim=3, mode="c"] Im1 not None,
20 |                         np.ndarray[double, ndim=3, mode="c"] Im2 not None,
21 |                         double alpha=1, double ratio=0.5, int minWidth=40,
22 |                         int nOuterFPIterations=3, int nInnerFPIterations=1,
23 |                         int nSORIterations=20, int colType=0):
24 |     """
25 |     Compute dense optical flow between Im1 and Im2 (C++ Coarse2Fine backend).
26 | 
27 |     Im1, Im2: C-contiguous float64 arrays, same shape (h,w,c), range [0,1].
28 |     alpha (1), ratio (0.5), minWidth (40), nOuterFPIterations (3),
29 |       nInnerFPIterations (1), nSORIterations (20): solver options, passed
30 |       through unchanged; defaults in parentheses.
31 |     colType: 0 or default:RGB, 1:GRAY (pass gray images as (h,w,1)).
32 |     Returns (vx, vy, warpI2): float64 arrays of shape (h,w), (h,w), (h,w,c).
33 |     Raises ValueError if Im1 and Im2 do not have the same shape.
34 |     """
35 |     cdef int h = Im1.shape[0]
36 |     cdef int w = Im1.shape[1]
37 |     cdef int c = Im1.shape[2]
38 |     # np.zeros defaults to float64 in C order, matching the buffer declarations.
39 |     cdef np.ndarray[double, ndim=2, mode="c"] vx = np.zeros((h, w))
40 |     cdef np.ndarray[double, ndim=2, mode="c"] vy = np.zeros((h, w))
41 |     cdef np.ndarray[double, ndim=3, mode="c"] warpI2 = np.zeros((h, w, c))
42 |     # The C++ wrapper copies h*w*c doubles from BOTH inputs using Im1's
43 |     # dimensions, so a smaller Im2 would be read out of bounds.
44 |     if Im2.shape[0] != h or Im2.shape[1] != w or Im2.shape[2] != c:
45 |         raise ValueError("Im1 and Im2 must have the same shape (h, w, c)")
46 |     Coarse2FineFlowWrapper(&vx[0, 0], &vy[0, 0], &warpI2[0, 0, 0],
47 |                             &Im1[0, 0, 0], &Im2[0, 0, 0],
48 |                             alpha, ratio, minWidth, nOuterFPIterations,
49 |                             nInnerFPIterations, nSORIterations, colType,
50 |                             h, w, c)
51 |     return vx, vy, warpI2
52 | 


--------------------------------------------------------------------------------
/setup.py:
--------------------------------------------------------------------------------
 1 | # Author: Deepak Pathak (c) 2016
 2 | 
 3 | from __future__ import absolute_import
 4 | from __future__ import division
 5 | from __future__ import print_function
 6 | # from __future__ import unicode_literals
 7 | from distutils.core import setup
 8 | from Cython.Build import cythonize
 9 | from distutils.extension import Extension
10 | from glob import glob
11 | 
12 | import numpy
13 | 
14 | sourcefiles = ['pyflow.pyx', ]
15 | sourcefiles.extend(glob("src/*.cpp"))
16 | extensions = [Extension("pyflow", sourcefiles, include_dirs=[numpy.get_include()])]
17 | setup(
18 |     name="pyflow",
19 |     version="1.0",
20 |     description="Python wrapper for the Coarse2Fine Optical Flow code.",
21 |     author="Deepak Pathak",
22 |     ext_modules=cythonize(extensions),
23 |     include_dirs=[numpy.get_include()]
24 | )
25 | 


--------------------------------------------------------------------------------
/src/Coarse2FineFlowWrapper.cpp:
--------------------------------------------------------------------------------
 1 | // This is a wrapper for Ce Liu's Coarse2Fine optical flow implementation.
 2 | // It converts the contiguous image array to the format needed by the optical
 3 | // flow code. Handling conversion in the wrapper makes the cythonization
 4 | // simpler.
 5 | // Author: Deepak Pathak (c) 2016
 6 | 
 7 | #include "Coarse2FineFlowWrapper.h"
 8 | #include "Image.h"
 9 | #include "OpticalFlow.h"
10 | using namespace std;
11 | 
12 | void Coarse2FineFlowWrapper(double * vx, double * vy, double * warpI2,
13 |                               const double * Im1, const double * Im2,
14 |                               double alpha, double ratio, int minWidth,
15 |                               int nOuterFPIterations, int nInnerFPIterations,
16 |                               int nSORIterations, int colType,
17 |                               int h, int w, int c) {
18 |   // Byte counts of one flow plane (h*w) and of one full image (h*w*c).
19 |   const size_t planeBytes = h * w * sizeof(double);
20 |   const size_t imageBytes = h * w * c * sizeof(double);
21 | 
22 |   // Stage both inputs in backend images; allocate() is passed (w, h, c).
23 |   DImage frame1, frame2;
24 |   frame1.allocate(w, h, c);
25 |   frame2.allocate(w, h, c);
26 |   memcpy(frame1.pData, Im1, imageBytes);
27 |   memcpy(frame2.pData, Im2, imageBytes);
28 |   frame1.setColorType(colType);
29 |   frame2.setColorType(colType);
30 | 
31 |   // Run the solver; the three result images are read back right after.
32 |   DImage flowX, flowY, warped2;
33 |   OpticalFlow::Coarse2FineFlow(flowX, flowY, warped2, frame1, frame2,
34 |                                 alpha, ratio, minWidth,
35 |                                 nOuterFPIterations, nInnerFPIterations,
36 |                                 nSORIterations);
37 | 
38 |   // Copy the results into the caller-provided contiguous buffers.
39 |   memcpy(vx, flowX.pData, planeBytes);
40 |   memcpy(vy, flowY.pData, planeBytes);
41 |   memcpy(warpI2, warped2.pData, imageBytes);
42 | 
43 |   // Release the temporaries explicitly: inputs first, then results.
44 |   frame1.clear();
45 |   frame2.clear();
46 |   flowX.clear();
47 |   flowY.clear();
48 |   warped2.clear();
49 | }
50 | 


--------------------------------------------------------------------------------
/src/Coarse2FineFlowWrapper.h:
--------------------------------------------------------------------------------
 1 | // This is a wrapper for Ce Liu's Coarse2Fine optical flow implementation.
 2 | // It converts the contiguous image array to the format needed by the optical
 3 | // flow code. Handling conversion in the wrapper makes the cythonization
 4 | // simpler.
 5 | // Author: Deepak Pathak (c) 2016
 6 | 
 7 | // override-include-guard
 8 | extern void Coarse2FineFlowWrapper(double * vx, double * vy, double * warpI2, // outputs, caller-allocated: h*w, h*w and h*w*c doubles
 9 |                               const double * Im1, const double * Im2, // inputs: h*w*c doubles are copied from each
10 |                               double alpha, double ratio, int minWidth, // forwarded to OpticalFlow::Coarse2FineFlow
11 |                               int nOuterFPIterations, int nInnerFPIterations,
12 |                               int nSORIterations, int colType, // colType is set on both input images
13 |                               int h, int w, int c); // image height, width and channel count
14 | 


--------------------------------------------------------------------------------
/src/GaussianPyramid.cpp:
--------------------------------------------------------------------------------
  1 | // Author: Ce Liu (c) Dec, 2009; celiu@mit.edu
  2 | // Modified By: Deepak Pathak (c) 2016; pathak@berkeley.edu
  3 | 
  4 | #include "GaussianPyramid.h"
  5 | #include "math.h"
  6 | 
  7 | // Creates an empty pyramid: no level array yet, and nlevels() reports 0 instead of an uninitialised value.
  8 | GaussianPyramid::GaussianPyramid(void) : ImPyramid(NULL), nLevels(0)
  9 | {
 10 | }
 11 | 
 12 | // Frees the level array; delete[] on a null pointer is a no-op, so no test is needed.
 13 | GaussianPyramid::~GaussianPyramid(void)
 14 | {
 15 | 	delete []ImPyramid;
 16 | }
 17 | 
 18 | //---------------------------------------------------------------------------------------
 19 | // function to construct the pyramid
 20 | // this is the slow way
 21 | //---------------------------------------------------------------------------------------
 22 | /*void GaussianPyramid::ConstructPyramid(const DImage &image, double ratio, int minWidth)
 23 | {
 24 | 	// the ratio cannot be arbitrary numbers
 25 | 	if(ratio>0.98 || ratio<0.4)
 26 | 		ratio=0.75;
 27 | 	// first decide how many levels
 28 | 	nLevels=log((double)minWidth/image.width())/log(ratio);
 29 | 	if(ImPyramid!=NULL)
 30 | 		delete []ImPyramid;
 31 | 	ImPyramid=new DImage[nLevels];
 32 | 	ImPyramid[0].copyData(image);
 33 | 	double baseSigma=(1/ratio-1);
 34 | 	for(int i=1;i<nLevels;i++)
 35 | 	{
 36 | 		DImage foo;
 37 | 		double sigma=baseSigma*i;
 38 | 		image.GaussianSmoothing(foo,sigma,sigma*2.5);
 39 | 		foo.imresize(ImPyramid[i],pow(ratio,i));
 40 | 	}
 41 | }//*/
 42 | 
 43 | //---------------------------------------------------------------------------------------
 44 | // Construct the pyramid (the fast way): level 0 copies the image, level i is a smoothed
 45 | // copy scaled by ratio^i. At least one level is always built.
 46 | //---------------------------------------------------------------------------------------
 47 | void GaussianPyramid::ConstructPyramid(const DImage &image, double ratio, int minWidth)
 48 | {
 49 | 	// the ratio cannot be arbitrary numbers
 50 | 	if(ratio>0.98 || ratio<0.4) ratio=0.75;
 51 | 	// First decide how many levels. The quotient is below 1 (or negative, -inf,
 52 | 	// NaN) when image.width()<=minWidth or the width is 0; as an int that gave a
 53 | 	// zero/negative array size and an out-of-bounds write to ImPyramid[0].
 54 | 	double levels=log((double)minWidth/image.width())/log(ratio);
 55 | 	nLevels=(levels>=1)?(int)levels:1;
 56 | 	delete []ImPyramid; // delete[] on NULL is a no-op
 57 | 	ImPyramid=new DImage[nLevels];
 58 | 	ImPyramid[0].copyData(image);
 59 | 	double baseSigma=(1/ratio-1);
 60 | 	int n=log(0.25)/log(ratio); // ratio^n is roughly 1/4
 61 | 	double nSigma=baseSigma*n;
 62 | 	for(int i=1;i<nLevels;i++)
 63 | 	{
 64 | 		DImage foo;
 65 | 		if(i<=n) // first n levels: smooth and resize the original image directly
 66 | 		{
 67 | 			image.GaussianSmoothing(foo,baseSigma*i,baseSigma*i*3);
 68 | 			foo.imresize(ImPyramid[i],pow(ratio,i));
 69 | 		}
 70 | 		else // deeper levels: start from the level n steps above instead
 71 | 		{
 72 | 			ImPyramid[i-n].GaussianSmoothing(foo,nSigma,nSigma*3);
 73 | 			double rate=(double)pow(ratio,i)*image.width()/foo.width();
 74 | 			foo.imresize(ImPyramid[i],rate);
 75 | 		}
 76 | 	}
 77 | }
 78 | 
 79 | // Builds the pyramid with an explicit level count (raised to 1 if smaller) instead of deriving it from a minimum width.
 80 | void GaussianPyramid::ConstructPyramidLevels(const DImage &image, double ratio, int _nLevels)
 81 | {
 82 | 	// the ratio cannot be arbitrary numbers
 83 | 	if(ratio>0.98 || ratio<0.4) ratio=0.75;
 84 | 	// ImPyramid[0] is always written below, so build at least one level (a count <1 used to overrun the array)
 85 | 	nLevels=(_nLevels<1)?1:_nLevels;
 86 | 	delete []ImPyramid; // delete[] on NULL is a no-op
 87 | 	ImPyramid=new DImage[nLevels];
 88 | 	ImPyramid[0].copyData(image);
 89 | 	double baseSigma=(1/ratio-1);
 90 | 	int n=log(0.25)/log(ratio); // ratio^n is roughly 1/4
 91 | 	double nSigma=baseSigma*n;
 92 | 	for(int i=1;i<nLevels;i++)
 93 | 	{
 94 | 		DImage foo;
 95 | 		if(i<=n) // first n levels: smooth and resize the original image directly
 96 | 		{
 97 | 			double sigma=baseSigma*i;
 98 | 			image.GaussianSmoothing(foo,sigma,sigma*3);
 99 | 			foo.imresize(ImPyramid[i],pow(ratio,i));
100 | 		}
101 | 		else // deeper levels: start from the level n steps above instead
102 | 		{
103 | 			ImPyramid[i-n].GaussianSmoothing(foo,nSigma,nSigma*3);
104 | 			double rate=(double)pow(ratio,i)*image.width()/foo.width();
105 | 			foo.imresize(ImPyramid[i],rate);
106 | 		}
107 | 	}
108 | }
109 | 
110 | void GaussianPyramid::displayTop(const char *filename)
111 | {
112 | 	// Disabled, so this is currently a no-op and filename is unused: ImPyramid[nLevels-1].imwrite(filename);
113 | }
114 | 


--------------------------------------------------------------------------------
/src/GaussianPyramid.h:
--------------------------------------------------------------------------------
 1 | // Author: Ce Liu (c) Dec, 2009; celiu@mit.edu
 2 | // Modified By: Deepak Pathak (c) 2016; pathak@berkeley.edu
 3 | 
 4 | #ifndef _GaussianPyramid_h
 5 | #define _GaussianPyramid_h
 6 | 
 7 | #include "Image.h"
 8 | 
 9 | class GaussianPyramid // multi-level image pyramid; NOTE(review): owns a raw array but declares no copy constructor/assignment, so copying an instance would double-delete
10 | {
11 | private:
12 | 	DImage* ImPyramid; // heap array of nLevels images, (re)allocated by the Construct* methods; index 0 receives a copy of the input image
13 | 	int nLevels; // number of entries in ImPyramid
14 | public:
15 | 	GaussianPyramid(void);
16 | 	~GaussianPyramid(void); // releases ImPyramid with delete[]
17 | 	void ConstructPyramid(const DImage& image,double ratio=0.8,int minWidth=30); // level count derived from minWidth, image width and ratio
18 | 	void ConstructPyramidLevels(const DImage& image,double ratio =0.8,int _nLevels = 2); // level count given explicitly
19 | 	void displayTop(const char* filename); // body is commented out in GaussianPyramid.cpp, so this does nothing
20 | 	inline int nlevels() const {return nLevels;};
21 | 	inline DImage& Image(int index) {return ImPyramid[index];}; // no bounds check on index
22 | };
23 | 
24 | #endif
25 | 


--------------------------------------------------------------------------------
/src/ImageIO.h:
--------------------------------------------------------------------------------
  1 | // Author: Ce Liu (c) Dec, 2009; celiu@mit.edu
  2 | // Modified By: Deepak Pathak (c) 2016; pathak@berkeley.edu
  3 | 
  4 | #ifndef _ImageIO_h
  5 | #define _ImageIO_h
  6 | 
  7 | // No need of OpenCV; python wrapper handles it
  8 | // #include "cv.h"
  9 | // #include "highgui.h"
 10 | // #include "opencv2/core/core.hpp"
 11 | // #include "opencv2/highgui/highgui.hpp"
 12 | 
 13 | class ImageIO // declarations only: the OpenCV- and Qt-based implementations further down this header are commented out
 14 | {
 15 | public:
 16 |     enum ImageType{standard, derivative, normalized}; // pixel scaling mode switched on by the commented-out saveImage below
 17 |     ImageIO(void);
 18 |     ~ImageIO(void);
 19 | public:
 20 |     template <class T> // NOTE(review): no active definition in this header; a call would presumably fail to link
 21 |     static bool loadImage(const char* filename,T*& pImagePlane,int& width,int& height, int& nchannels);
 22 |     template <class T> // NOTE(review): likewise declared only
 23 |     static bool saveImage(const char* filename,const T* pImagePlane,int width,int height, int nchannels,ImageType imtype = standard);
 24 | 
 25 | };
 26 | 
 27 | // template <class T>
 28 | // bool ImageIO::loadImage(const char *filename, T *&pImagePlane, int &width, int &height, int &nchannels)
 29 | // {
 30 | //  cv::Mat im = cv::imread(filename);
 31 | //  if(im.data == NULL) // if allocation fails
 32 | //      return false;
 33 | //  if(im.type()!= CV_8UC1 && im.type()!=CV_8UC3 && im.type()!=CV_8UC4) // we only support three types of image information for now
 34 | //      return false;
 35 | //  width = im.size().width;
 36 | //  height = im.size().height;
 37 | //  nchannels = im.channels();
 38 | //  pImagePlane = new T[width*height*nchannels];
 39 | //
 40 | //  if(typeid(T) == typeid(unsigned char))
 41 | //  {
 42 | //      for(int i = 0;i<height;i++)
 43 | //          memcpy(pImagePlane+i*im.step,im.data+i*im.step,width*nchannels);
 44 | //      return true;
 45 | //  }
 46 | //
 47 | //  // check whether the type is float point
 48 | //  bool IsFloat=false;
 49 | //  if(typeid(T)==typeid(double) || typeid(T)==typeid(float) || typeid(T)==typeid(long double))
 50 | //      IsFloat=true;
 51 | //
 52 | //  for(int i =0;i<height;i++)
 53 | //  {
 54 | //      int offset1 = i*width*nchannels;
 55 | //      int offset2 = i*im.step;
 56 | //      for(int j=0;j<im.step;j++)
 57 | //      {
 58 | //          if(IsFloat)
 59 | //              pImagePlane[offset1+j] = (T)im.data[offset2+j]/255;
 60 | //          else
 61 | //              pImagePlane[offset1+j] = im.data[offset2+j];
 62 | //      }
 63 | //  }
 64 | //  return true;
 65 | // }
 66 | 
 67 | // template <class T>
 68 | // bool ImageIO::saveImage(const char* filename,const T* pImagePlane,int width,int height, int nchannels,ImageType imtype)
 69 | // {
 70 | //  cv::Mat im;
 71 | //  switch(nchannels){
 72 | //      case 1:
 73 | //          im.create(height,width,CV_8UC1);
 74 | //          break;
 75 | //      case 3:
 76 | //          im.create(height,width,CV_8UC3);
 77 | //          break;
 78 | //      default:
 79 | //          return -1;
 80 | //  }
 81 | //  // check whether the type is float point
 82 | //  bool IsFloat=false;
 83 | //  if(typeid(T)==typeid(double) || typeid(T)==typeid(float) || typeid(T)==typeid(long double))
 84 | //      IsFloat=true;
 85 | //
 86 | //  T Max,Min;
 87 | //  int nElements = width*height*nchannels;
 88 | //  switch(imtype){
 89 | //      case standard:
 90 | //          break;
 91 | //      case derivative:
 92 | //          // find the max of the absolute value
 93 | //          Max = pImagePlane[0];
 94 | //          if(!IsFloat)
 95 | //              for(int i = 0;i<nElements;i++)
 96 | //                  Max = __max(Max,abs(pImagePlane[i]));
 97 | //          else
 98 | //              for(int i=0;i<nElements;i++)
 99 | //                  Max = __max(Max,fabs((double)pImagePlane[i]));
100 | //          Max*=2;
101 | //          break;
102 | //      case normalized:
103 | //          Max = Min = pImagePlane[0];
104 | //          for(int i = 0;i<nElements;i++)
105 | //          {
106 | //              Max = __max(Max,pImagePlane[i]);
107 | //              Min = __min(Min,pImagePlane[i]);
108 | //          }
109 | //          break;
110 | //  }
111 | //  if(typeid(T) == typeid(unsigned char) && imtype == standard)
112 | //  {
113 | //      for(int i = 0;i<height;i++)
114 | //          memcpy(im.data+i*im.step,pImagePlane+i*im.step,width*nchannels);
115 | //  }
116 | //  else
117 | //  {
118 | //      for(int i =0;i<height;i++)
119 | //      {
120 | //          int offset1 = i*width*nchannels;
121 | //          int offset2 = i*im.step;
122 | //          for(int j=0;j<im.step;j++)
123 | //          {
124 | //              switch(imtype){
125 | //                  case standard:
126 | //                      if(IsFloat)
127 | //                          im.data[offset2+j] = pImagePlane[offset1+j]*255;
128 | //                      else
129 | //                          im.data[offset2+j] = __max(__min(pImagePlane[offset1+j],255),0);
130 | //                      break;
131 | //                  case derivative:
132 | //
133 | //                      if(IsFloat)
134 | //                          im.data[offset2+j] = (double)(pImagePlane[offset1+j]/Max+0.5)*255;
135 | //                      else
136 | //                          im.data[offset2+j] = ((double)pImagePlane[offset1+j]/Max+0.5)*255;
137 | //                      break;
138 | //                  case normalized:
139 | //                      im.data[offset2+j] = (double)(pImagePlane[offset1+j]-Min)/(Max-Min)*255;
140 | //                      break;
141 | //              }
142 | //          }
143 | //      }
144 | //  }
145 | //  return cv::imwrite(filename,im);
146 | // }
147 | 
148 | 
149 | 
150 | /*
151 | #include <QVector>
152 | #include <QImage>
153 | #include <QString>
154 | #include "math.h"
155 | //-----------------------------------------------------------------------------------------
156 | // this class is a wrapper to use QImage to load image into image planes
157 | //-----------------------------------------------------------------------------------------
158 | 
159 | class ImageIO
160 | {
161 | public:
162 |     enum ImageType{standard, derivative, normalized};
163 |     ImageIO(void);
164 |     ~ImageIO(void);
165 | public:
166 |     template <class T>
167 |     static void loadImage(const QImage& image,T*& pImagePlane,int& width,int& height,int& nchannels);
168 |     template <class T>
169 |     static bool loadImage(const QString& filename,T*& pImagePlane,int& width,int& height,int& nchannels);
170 | 
171 |     template <class T>
172 |     static unsigned char convertPixel(const T& value,bool IsFloat,ImageType type,T& _Max,T& _Min);
173 | 
174 |     template <class T>
175 |     static bool writeImage(const QString& filename, const T*& pImagePlane,int width,int height,int nchannels,ImageType type=standard,int quality=-1);
176 | 
177 |     template <class T>
178 |     static bool writeImage(const QString& filename,const T* pImagePlane,int width,int height,int nchannels,T min, T max,int quality=-1);
179 | 
180 | };
181 | 
182 | template <class T>
183 | void ImageIO::loadImage(const QImage& image, T*& pImagePlane,int& width,int& height,int& nchannels)
184 | {
185 |     // get the image information
186 |     width=image.width();
187 |     height=image.height();
188 |     nchannels=3;
189 |     pImagePlane=new T[width*height*nchannels];
190 | 
191 |     // check whether the type is float point
192 |     bool IsFloat=false;
193 |     if(typeid(T)==typeid(double) || typeid(T)==typeid(float) || typeid(T)==typeid(long double))
194 |         IsFloat=true;
195 | 
196 |     const unsigned char* plinebuffer;
197 |     for(int i=0;i<height;i++)
198 |     {
199 |         plinebuffer=image.scanLine(i);
200 |         for(int j=0;j<width;j++)
201 |         {
202 |             if(IsFloat)
203 |             {
204 |                 pImagePlane[(i*width+j)*3]=(T)plinebuffer[j*4]/255;
205 |                 pImagePlane[(i*width+j)*3+1]=(T)plinebuffer[j*4+1]/255;
206 |                 pImagePlane[(i*width+j)*3+2]=(T)plinebuffer[j*4+2]/255;
207 |             }
208 |             else
209 |             {
210 |                 pImagePlane[(i*width+j)*3]=plinebuffer[j*4];
211 |                 pImagePlane[(i*width+j)*3+1]=plinebuffer[j*4+1];
212 |                 pImagePlane[(i*width+j)*3+2]=plinebuffer[j*4+2];
213 |             }
214 |         }
215 |     }
216 | }
217 | 
218 | template <class T>
219 | bool ImageIO::loadImage(const QString&filename, T*& pImagePlane,int& width,int& height,int& nchannels)
220 | {
221 |     QImage image;
222 |     if(image.load(filename)==false)
223 |         return false;
224 |     if(image.format()!=QImage::Format_RGB32)
225 |     {
226 |         QImage temp=image.convertToFormat(QImage::Format_RGB32);
227 |         image=temp;
228 |     }
229 |     loadImage(image,pImagePlane,width,height,nchannels);
230 |     return true;
231 | }
232 | 
233 | template <class T>
234 | bool ImageIO::writeImage(const QString& filename, const T*& pImagePlane,int width,int height,int nchannels,ImageType type,int quality)
235 | {
236 |     int nPixels=width*height,nElements;
237 |     nElements=nPixels*nchannels;
238 |     unsigned char* pTempBuffer;
239 |     pTempBuffer=new unsigned char[nPixels*4];
240 |     memset(pTempBuffer,0,nPixels*4);
241 | 
242 |     // check whether the type is float point
243 |     bool IsFloat=false;
244 |     if(typeid(T)==typeid(double) || typeid(T)==typeid(float) || typeid(T)==typeid(long double))
245 |         IsFloat=true;
246 | 
247 |     T _Max=0,_Min=0;
248 |     switch(type){
249 |         case standard:
250 |             break;
251 |         case derivative:
252 |             _Max=0;
253 |             for(int i=0;i<nPixels;i++)
254 |             {
255 |                 if(IsFloat)
256 |                     _Max=__max(_Max,fabs((double)pImagePlane[i]));
257 |                 else
258 |                     _Max=__max(_Max,abs(pImagePlane[i]));
259 |             }
260 |             break;
261 |         case normalized:
262 |             _Min=_Max=pImagePlane[0];
263 |             for(int i=1;i<nElements;i++)
264 |             {
265 |                 _Min=__min(_Min,pImagePlane[i]);
266 |                 _Max=__max(_Max,pImagePlane[i]);
267 |             }
268 |             break;
269 |     }
270 | 
271 |     for(int i=0;i<nPixels;i++)
272 |     {
273 |         if(nchannels>=3)
274 |         {
275 |             pTempBuffer[i*4]=convertPixel(pImagePlane[i*nchannels],IsFloat,type,_Max,_Min);
276 |             pTempBuffer[i*4+1]=convertPixel(pImagePlane[i*nchannels+1],IsFloat,type,_Max,_Min);
277 |             pTempBuffer[i*4+2]=convertPixel(pImagePlane[i*nchannels+2],IsFloat,type,_Max,_Min);
278 |         }
279 |         else
280 |             for (int j=0;j<3;j++)
281 |                 pTempBuffer[i*4+j]=convertPixel(pImagePlane[i*nchannels],IsFloat,type,_Max,_Min);
282 |         pTempBuffer[i*4+3]=255;
283 |     }
284 |     QImage *pQImage=new QImage(pTempBuffer,width,height,QImage::Format_RGB32);
285 |     bool result= pQImage->save(filename,0,quality);
286 |     delete pQImage;
287 |     delete pTempBuffer;
288 |     return result;
289 | }
290 | 
291 | template <class T>
292 | bool ImageIO::writeImage(const QString& filename, const T* pImagePlane,int width,int height,int nchannels,T min,T max,int quality)
293 | {
294 |     int nPixels=width*height,nElements;
295 |     nElements=nPixels*nchannels;
296 |     unsigned char* pTempBuffer;
297 |     pTempBuffer=new unsigned char[nPixels*4];
298 |     memset(pTempBuffer,0,nPixels*4);
299 | 
300 |     // check whether the type is float point
301 |     bool IsFloat=false;
302 |     if(typeid(T)==typeid(double) || typeid(T)==typeid(float) || typeid(T)==typeid(long double))
303 |         IsFloat=true;
304 | 
305 |     T _Max=max,_Min=min;
306 | 
307 |     for(int i=0;i<nPixels;i++)
308 |     {
309 |         if(nchannels>=3)
310 |         {
311 |             pTempBuffer[i*4]=convertPixel(pImagePlane[i*nchannels],IsFloat,normalized,_Max,_Min);
312 |             pTempBuffer[i*4+1]=convertPixel(pImagePlane[i*nchannels+1],IsFloat,normalized,_Max,_Min);
313 |             pTempBuffer[i*4+2]=convertPixel(pImagePlane[i*nchannels+2],IsFloat,normalized,_Max,_Min);
314 |         }
315 |         else
316 |             for (int j=0;j<3;j++)
317 |                 pTempBuffer[i*4+j]=convertPixel(pImagePlane[i*nchannels],IsFloat,normalized,_Max,_Min);
318 |         pTempBuffer[i*4+3]=255;
319 |     }
320 |     QImage *pQImage=new QImage(pTempBuffer,width,height,QImage::Format_RGB32);
321 |     bool result= pQImage->save(filename,0,quality);
322 |     delete pQImage;
323 |     delete pTempBuffer;
324 |     return result;
325 | }
326 | 
327 | template <class T>
328 | unsigned char ImageIO::convertPixel(const T& value,bool IsFloat,ImageType type,T& _Max,T& _Min)
329 | {
330 |     switch(type){
331 |         case standard:
332 |             if(IsFloat)
333 |                 return __max(__min(value*255,255),0);
334 |             else
335 |                 return __max(__min(value,255),0);
336 |             break;
337 |         case derivative:
338 |             return (double)((double)value/_Max+1)/2*255;
339 |             break;
340 |         case normalized:
341 |             return (double)(value-_Min)/(_Max-_Min)*255;
342 |             break;
343 |     }
344 |     return 0;
345 | }
346 | //*/
347 | #endif
348 | 


--------------------------------------------------------------------------------
/src/ImageProcessing.h:
--------------------------------------------------------------------------------
  1 | // Author: Ce Liu (c) Dec, 2009; celiu@mit.edu
  2 | // Modified By: Deepak Pathak (c) 2016; pathak@berkeley.edu
  3 | 
  4 | #ifndef _ImageProcessing_h
  5 | #define _ImageProcessing_h
  6 | 
  7 | #include "math.h"
  8 | #include "stdio.h"
  9 | #include "stdlib.h"
 10 | #include <typeinfo>
 11 | 
 12 | //----------------------------------------------------------------------------------
 13 | // class to handle basic image processing functions
 14 | // this is a collection of template functions. These template functions are
 15 | // used in other image classes such as BiImage, IntImage and FImage
 16 | //----------------------------------------------------------------------------------
 17 | 
 18 | class ImageProcessing
 19 | {
 20 | public:
 21 | 	ImageProcessing(void);
 22 | 	~ImageProcessing(void);
 23 | public:
 24 | 	// basic functions
 25 | 	template <class T>
 26 | 	static inline T EnforceRange(const T& x,const int& MaxValue) {return __min(__max(x,0),MaxValue-1);};
 27 | 
 28 | 	//---------------------------------------------------------------------------------
 29 | 	// function to interpolate the image plane
 30 | 	//---------------------------------------------------------------------------------
 31 | 	template <class T1,class T2>
 32 | 	static inline void BilinearInterpolate(const T1* pImage,int width,int height,int nChannels,double x,double y,T2* result);
 33 | 
 34 | 	template <class T1>
 35 | 	static inline T1 BilinearInterpolate(const T1* pImage,int width,int height,double x,double y);
 36 | 
 37 | 	// the transpose of bilinear interpolation
 38 | 	template <class T1,class T2>
 39 | 	static inline void BilinearInterpolate_transpose(const T1* pImage,int width,int height,int nChannels,double x,double y,T2* result);
 40 | 
 41 | 	template <class T1>
 42 | 	static inline T1 BilinearInterpolate_transpose(const T1* pImage,int width,int height,double x,double y);
 43 | 
 44 | 	template <class T1,class T2>
 45 | 	static void ResizeImage(const T1* pSrcImage,T2* pDstImage,int SrcWidth,int SrcHeight,int nChannels,double Ratio);
 46 | 
 47 | 	template <class T1,class T2>
 48 | 	static void ResizeImage(const T1* pSrcImage,T2* pDstImage,int SrcWidth,int SrcHeight,int nChannels,int DstWidth,int DstHeight);
 49 | 
 50 | 	//---------------------------------------------------------------------------------
 51 | 	// functions for 1D filtering
 52 | 	//---------------------------------------------------------------------------------
 53 | 	template <class T1,class T2>
 54 | 	static void hfiltering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const double* pfilter1D,int fsize);
 55 | 
 56 | 	template <class T1,class T2>
 57 | 	static void vfiltering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const double* pfilter1D,int fsize);
 58 | 
 59 | 	template <class T1,class T2>
 60 | 	static void hfiltering_transpose(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const double* pfilter1D,int fsize);
 61 | 
 62 | 	template <class T1,class T2>
 63 | 	static void vfiltering_transpose(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const double* pfilter1D,int fsize);
 64 | 
 65 | 	//---------------------------------------------------------------------------------
 66 | 	// functions for 2D filtering
 67 | 	//---------------------------------------------------------------------------------
 68 | 	template <class T1,class T2>
 69 | 	static void filtering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const double* pfilter2D,int fsize);
 70 | 
 71 | 	template <class T1,class T2>
 72 | 	static void filtering_transpose(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const double* pfilter2D,int fsize);
 73 | 
 74 | 	template <class T1,class T2>
 75 | 	static void Laplacian(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels);
 76 | 
 77 | 	//---------------------------------------------------------------------------------
 78 | 	// functions for sample a patch from the image
 79 | 	//---------------------------------------------------------------------------------
 80 | 	template <class T1,class T2>
 81 | 	static void getPatch(const T1* pSrcImgae,T2* pPatch,int width,int height,int nChannels,double x,double y,int wsize);
 82 | 
 83 | 	//---------------------------------------------------------------------------------
 84 | 	// function to warp image
 85 | 	//---------------------------------------------------------------------------------
 86 | 	template <class T1,class T2>
 87 | 	static void warpImage(T1* pWarpIm2,const T1* pIm1,const T1* pIm2,const T2* pVx,const T2* pVy,int width,int height,int nChannels);
 88 | 
 89 | 	template <class T1,class T2>
 90 | 	static void warpImageFlow(T1* pWarpIm2,const T1* pIm1,const T1* pIm2,const T2* pFlow,int width,int height,int nChannels);
 91 | 
 92 | 	template <class T1,class T2>
 93 | 	static void warpImage(T1* pWarpIm2,const T1* pIm2,const T2* pVx,const T2* pVy,int width,int height,int nChannels);
 94 | 
 95 | 	template <class T1,class T2>
 96 | 	static void warpImage_transpose(T1* pWarpIm2,const T1* pIm2,const T2* pVx,const T2* pVy,int width,int height,int nChannels);
 97 | 
 98 | 	template <class T1,class T2>
 99 | 	static void warpImage(T1* pWarpIm2,const T1* pIm2,const T2*flow,int width,int height,int nChannels);
100 | 
101 | 	template <class T1,class T2>
102 | 	static void warpImage_transpose(T1* pWarpIm2,const T1* pIm2,const T2* flow,int width,int height,int nChannels);
103 | 
104 | 	template <class T1,class T2,class T3>
105 | 	static void warpImage(T1 *pWarpIm2, T3* pMask,const T1 *pIm1, const T1 *pIm2, const T2 *pVx, const T2 *pVy, int width, int height, int nChannels);
106 | 
107 | 
108 | 	//---------------------------------------------------------------------------------
109 | 	// function to crop an image
110 | 	//---------------------------------------------------------------------------------
111 | 	template <class T1,class T2>
112 | 	static void cropImage(const T1* pSrcImage,int SrcWidth,int SrcHeight,int nChannels,T2* pDstImage,int Left,int Top,int DstWidth,int DstHeight);
113 | 	//---------------------------------------------------------------------------------
114 | 
115 | 	//---------------------------------------------------------------------------------
116 | 	// function to generate a 2D Gaussian
117 | 	//---------------------------------------------------------------------------------
118 | 	template <class T>
119 | 	static void generate2DGaussian(T*& pImage,int wsize,double sigma=-1);
120 | 
121 | 	template <class T>
122 | 	static void generate1DGaussian(T*& pImage,int wsize,double sigma=-1);
123 | 
124 | };
125 | 
126 | //--------------------------------------------------------------------------------------------------
127 | // function to interplate multi-channel image plane for (x,y)
128 | // --------------------------------------------------------------------------------------------------
129 | template <class T1,class T2>
130 | inline void ImageProcessing::BilinearInterpolate(const T1* pImage,int width,int height,int nChannels,double x,double y,T2* result)
131 | {
132 | 	int xx,yy,m,n,u,v,l,offset;
133 | 	xx=x;
134 | 	yy=y;
135 | 	double dx,dy,s;
136 | 	dx=__max(__min(x-xx,1),0);
137 | 	dy=__max(__min(y-yy,1),0);
138 | 
139 | 	for(m=0;m<=1;m++)
140 | 		for(n=0;n<=1;n++)
141 | 		{
142 | 			u=EnforceRange(xx+m,width);
143 | 			v=EnforceRange(yy+n,height);
144 | 			offset=(v*width+u)*nChannels;
145 | 			s=fabs(1-m-dx)*fabs(1-n-dy);
146 | 			for(l=0;l<nChannels;l++)
147 | 				result[l]+=pImage[offset+l]*s;
148 | 		}
149 | }
150 | 
151 | template <class T1>
152 | inline T1 ImageProcessing::BilinearInterpolate(const T1* pImage,int width,int height,double x,double y)
153 | {
154 | 	int xx,yy,m,n,u,v,l,offset;
155 | 	xx=x;
156 | 	yy=y;
157 | 	double dx,dy,s;
158 | 	dx=__max(__min(x-xx,1),0);
159 | 	dy=__max(__min(y-yy,1),0);
160 | 
161 | 	T1 result=0;
162 | 	for(m=0;m<=1;m++)
163 | 		for(n=0;n<=1;n++)
164 | 		{
165 | 			u=EnforceRange(xx+m,width);
166 | 			v=EnforceRange(yy+n,height);
167 | 			offset=v*width+u;
168 | 			s=fabs(1-m-dx)*fabs(1-n-dy);
169 | 			result+=pImage[offset]*s;
170 | 		}
171 | 	return result;
172 | }
173 | 
174 | 
175 | //--------------------------------------------------------------------------------------------------
176 | // function to interplate multi-channel image plane for (x,y)
177 | // --------------------------------------------------------------------------------------------------
178 | template <class T1,class T2>
179 | inline void ImageProcessing::BilinearInterpolate_transpose(const T1* pInput,int width,int height,int nChannels,double x,double y,T2* pDstImage)
180 | {
181 | 	int xx,yy,m,n,u,v,l,offset;
182 | 	xx=x;
183 | 	yy=y;
184 | 	double dx,dy,s;
185 | 	dx=__max(__min(x-xx,1),0);
186 | 	dy=__max(__min(y-yy,1),0);
187 | 
188 | 	for(m=0;m<=1;m++)
189 | 		for(n=0;n<=1;n++)
190 | 		{
191 | 			u=EnforceRange(xx+m,width);
192 | 			v=EnforceRange(yy+n,height);
193 | 			offset=(v*width+u)*nChannels;
194 | 			s=fabs(1-m-dx)*fabs(1-n-dy);
195 | 			for(l=0;l<nChannels;l++)
196 | 				pDstImage[offset+l] += pInput[l]*s;
197 | 		}
198 | }
199 | 
200 | //------------------------------------------------------------------------------------------------------------
201 | // this is the most general function for reszing an image with a varying nChannels
202 | // bilinear interpolation is used for now. It might be replaced by other (bicubic) interpolation methods
203 | //------------------------------------------------------------------------------------------------------------
204 | template <class T1,class T2>
205 | void ImageProcessing::ResizeImage(const T1* pSrcImage,T2* pDstImage,int SrcWidth,int SrcHeight,int nChannels,double Ratio)
206 | {
207 | 	int DstWidth,DstHeight;
208 | 	DstWidth=(double)SrcWidth*Ratio;
209 | 	DstHeight=(double)SrcHeight*Ratio;
210 | 	memset(pDstImage,0,sizeof(T2)*DstWidth*DstHeight*nChannels);
211 | 
212 | 	double x,y;
213 | 
214 | 	for(int i=0;i<DstHeight;i++)
215 | 		for(int j=0;j<DstWidth;j++)
216 | 		{
217 | 			x=(double)(j+1)/Ratio-1;
218 | 			y=(double)(i+1)/Ratio-1;
219 | 
220 | 			// bilinear interpolation
221 | 			BilinearInterpolate(pSrcImage,SrcWidth,SrcHeight,nChannels,x,y,pDstImage+(i*DstWidth+j)*nChannels);
222 | 		}
223 | }
224 | 
225 | template <class T1,class T2>
226 | void ImageProcessing::ResizeImage(const T1 *pSrcImage, T2 *pDstImage, int SrcWidth, int SrcHeight, int nChannels, int DstWidth, int DstHeight)
227 | {
228 | 	double xRatio=(double)DstWidth/SrcWidth;
229 | 	double yRatio=(double)DstHeight/SrcHeight;
230 | 	memset(pDstImage,sizeof(T2)*DstWidth*DstHeight*nChannels,0);
231 | 
232 | 	double x,y;
233 | 
234 | 	for(int i=0;i<DstHeight;i++)
235 | 		for(int j=0;j<DstWidth;j++)
236 | 		{
237 | 			x=(double)(j+1)/xRatio-1;
238 | 			y=(double)(i+1)/yRatio-1;
239 | 
240 | 			// bilinear interpolation
241 | 			BilinearInterpolate(pSrcImage,SrcWidth,SrcHeight,nChannels,x,y,pDstImage+(i*DstWidth+j)*nChannels);
242 | 		}
243 | }
244 | 
245 | //------------------------------------------------------------------------------------------------------------
246 | //  horizontal direction filtering
247 | //------------------------------------------------------------------------------------------------------------
248 | template <class T1,class T2>
249 | void ImageProcessing::hfiltering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const double* pfilter1D,int fsize)
250 | {
251 | 	memset(pDstImage,0,sizeof(T2)*width*height*nChannels);
252 | 	T2* pBuffer;
253 | 	double w;
254 | 	int i,j,l,k,offset,jj;
255 | 	for(i=0;i<height;i++)
256 | 		for(j=0;j<width;j++)
257 | 		{
258 | 			offset=i*width*nChannels;
259 | 			pBuffer=pDstImage+offset+j*nChannels;
260 | 			for(l=-fsize;l<=fsize;l++)
261 | 			{
262 | 				w=pfilter1D[l+fsize];
263 | 				jj=EnforceRange(j+l,width);
264 | 				for(k=0;k<nChannels;k++)
265 | 					pBuffer[k]+=pSrcImage[offset+jj*nChannels+k]*w;
266 | 			}
267 | 		}
268 | }
269 | 
270 | //------------------------------------------------------------------------------------------------------------
271 | //  horizontal direction filtering transpose
272 | //------------------------------------------------------------------------------------------------------------
273 | template <class T1,class T2>
274 | void ImageProcessing::hfiltering_transpose(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const double* pfilter1D,int fsize)
275 | {
276 | 	memset(pDstImage,0,sizeof(T2)*width*height*nChannels);
277 | 	const T1* pBuffer;
278 | 	double w;
279 | 	int i,j,l,k,offset,jj;
280 | 	for(i=0;i<height;i++)
281 | 		for(j=0;j<width;j++)
282 | 		{
283 | 			int offset0=i*width*nChannels;
284 | 			pBuffer=pSrcImage+(i*width+j)*nChannels;
285 | 			for(l=-fsize;l<=fsize;l++)
286 | 			{
287 | 				w=pfilter1D[l+fsize];
288 | 				jj=EnforceRange(j+l,width);
289 | 				offset = offset0 + jj*nChannels;
290 | 				for(k=0;k<nChannels;k++)
291 | 					pDstImage[offset+k] += pBuffer[k]*w;
292 | 			}
293 | 		}
294 | }
295 | //------------------------------------------------------------------------------------------------------------
296 | // fast filtering algorithm for laplacian
297 | //------------------------------------------------------------------------------------------------------------
298 | template <class T1,class T2>
299 | void ImageProcessing::Laplacian(const T1 *pSrcImage, T2 *pDstImage, int width, int height, int nChannels)
300 | {
301 | 	int LineWidth=width*nChannels;
302 | 	int nElements=width*height*nChannels;
303 | 	// first treat the corners
304 | 	for(int k=0;k<nChannels;k++)
305 | 	{
306 | 		pDstImage[k]=pSrcImage[k]*2-pSrcImage[nChannels+k]-pSrcImage[LineWidth+k];
307 | 		pDstImage[LineWidth-nChannels+k]=pSrcImage[LineWidth-nChannels+k]*2-pSrcImage[LineWidth-2*nChannels+k]-pSrcImage[2*LineWidth-nChannels+k];
308 | 		pDstImage[nElements-LineWidth+k]=pSrcImage[nElements-LineWidth+k]*2-pSrcImage[nElements-LineWidth+nChannels+k]-pSrcImage[nElements-2*LineWidth+k];
309 | 		pDstImage[nElements-nChannels+k]=pSrcImage[nElements-nChannels+k]*2-pSrcImage[nElements-2*nChannels+k]-pSrcImage[nElements-LineWidth-nChannels+k];
310 | 	}
311 | 	// then treat the borders
312 | 	for(int i=1;i<width-1;i++)
313 | 		for(int k=0;k<nChannels;k++)
314 | 		{
315 | 			pDstImage[i*nChannels+k]=pSrcImage[i*nChannels+k]*3-pSrcImage[(i-1)*nChannels+k]-pSrcImage[(i+1)*nChannels+k]-pSrcImage[i*nChannels+LineWidth+k];
316 | 			pDstImage[nElements-LineWidth+i*nChannels+k]=pSrcImage[nElements-LineWidth+i*nChannels+k]*3-pSrcImage[nElements-LineWidth+(i-1)*nChannels+k]-pSrcImage[nElements-LineWidth+(i+1)*nChannels+k]-pSrcImage[nElements-2*LineWidth+i*nChannels+k];
317 | 		}
318 | 	for(int i=1;i<height-1;i++)
319 | 		for(int k=0;k<nChannels;k++)
320 | 		{
321 | 			pDstImage[i*LineWidth+k]=pSrcImage[i*LineWidth+k]*3-pSrcImage[i*LineWidth+nChannels+k]-pSrcImage[(i-1)*LineWidth+k]-pSrcImage[(i+1)*LineWidth+k];
322 | 			pDstImage[(i+1)*LineWidth-nChannels+k]=pSrcImage[(i+1)*LineWidth-nChannels+k]*3-pSrcImage[(i+1)*LineWidth-2*nChannels+k]-pSrcImage[i*LineWidth-nChannels+k]-pSrcImage[(i+2)*LineWidth-nChannels+k];
323 | 		}
324 | 	// now the interior
325 | 	for(int i=1;i<height-1;i++)
326 | 		for(int j=1;j<width-1;j++)
327 | 		{
328 | 			int offset=(i*width+j)*nChannels;
329 | 			for(int k=0;k<nChannels;k++)
330 | 				pDstImage[offset+k]=pSrcImage[offset+k]*4-pSrcImage[offset+nChannels+k]-pSrcImage[offset-nChannels+k]-pSrcImage[offset-LineWidth+k]-pSrcImage[offset+LineWidth+k];
331 | 		}
332 | }
333 | 
334 | 
335 | //------------------------------------------------------------------------------------------------------------
336 | // vertical direction filtering
337 | //------------------------------------------------------------------------------------------------------------
338 | template <class T1,class T2>
339 | void ImageProcessing::vfiltering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const double* pfilter1D,int fsize)
340 | {
341 | 	memset(pDstImage,0,sizeof(T2)*width*height*nChannels);
342 | 	T2* pBuffer;
343 | 	double w;
344 | 	int i,j,l,k,offset,ii;
345 | 	for(i=0;i<height;i++)
346 | 		for(j=0;j<width;j++)
347 | 		{
348 | 			pBuffer=pDstImage+(i*width+j)*nChannels;
349 | 			for(l=-fsize;l<=fsize;l++)
350 | 			{
351 | 				w=pfilter1D[l+fsize];
352 | 				ii=EnforceRange(i+l,height);
353 | 				for(k=0;k<nChannels;k++)
354 | 					pBuffer[k]+=pSrcImage[(ii*width+j)*nChannels+k]*w;
355 | 			}
356 | 		}
357 | }
358 | 
359 | //------------------------------------------------------------------------------------------------------------
360 | // vertical direction filtering transpose
361 | //------------------------------------------------------------------------------------------------------------
362 | template <class T1,class T2>
363 | void ImageProcessing::vfiltering_transpose(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const double* pfilter1D,int fsize)
364 | {
365 | 	memset(pDstImage,0,sizeof(T2)*width*height*nChannels);
366 | 	const T1* pBuffer;
367 | 	double w;
368 | 	int i,j,l,k,offset,ii;
369 | 	for(i=0;i<height;i++)
370 | 		for(j=0;j<width;j++)
371 | 		{
372 | 			pBuffer=pSrcImage+(i*width+j)*nChannels;
373 | 			for(l=-fsize;l<=fsize;l++)
374 | 			{
375 | 				w=pfilter1D[l+fsize];
376 | 				ii=EnforceRange(i+l,height);
377 | 				offset = (ii*width+j)*nChannels;
378 | 				for(k=0;k<nChannels;k++)
379 | 					//pBuffer[k]+=pSrcImage[(ii*width+j)*nChannels+k]*w;
380 | 					pDstImage[offset+k] += pBuffer[k]*w;
381 | 			}
382 | 		}
383 | }
384 | 
385 | 
386 | //------------------------------------------------------------------------------------------------------------
387 | // 2d filtering
388 | //------------------------------------------------------------------------------------------------------------
389 | template <class T1,class T2>
390 | void ImageProcessing::filtering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const double* pfilter2D,int fsize)
391 | {
392 | 	double w;
393 | 	int i,j,u,v,k,ii,jj,wsize,offset;
394 | 	wsize=fsize*2+1;
395 | 	double* pBuffer=new double[nChannels];
396 | 	for(i=0;i<height;i++)
397 | 		for(j=0;j<width;j++)
398 | 		{
399 | 			for(k=0;k<nChannels;k++)
400 | 				pBuffer[k]=0;
401 | 			for(u=-fsize;u<=fsize;u++)
402 | 				for(v=-fsize;v<=fsize;v++)
403 | 				{
404 | 					w=pfilter2D[(u+fsize)*wsize+v+fsize];
405 | 					ii=EnforceRange(i+u,height);
406 | 					jj=EnforceRange(j+v,width);
407 | 					offset=(ii*width+jj)*nChannels;
408 | 					for(k=0;k<nChannels;k++)
409 | 						pBuffer[k]+=pSrcImage[offset+k]*w;
410 | 				}
411 | 			offset=(i*width+j)*nChannels;
412 | 			for(k=0;k<nChannels;k++)
413 | 				pDstImage[offset+k]=pBuffer[k];
414 | 		}
415 | 	delete pBuffer;
416 | }
417 | 
418 | //------------------------------------------------------------------------------------------------------------
419 | // 2d filtering transpose
420 | //------------------------------------------------------------------------------------------------------------
421 | template <class T1,class T2>
422 | void ImageProcessing::filtering_transpose(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const double* pfilter2D,int fsize)
423 | {
424 | 	double w;
425 | 	int i,j,u,v,k,ii,jj,wsize,offset;
426 | 	wsize=fsize*2+1;
427 | 	memset(pDstImage,0,sizeof(T2)*width*height*nChannels);
428 | 	for(i=0;i<height;i++)
429 | 		for(j=0;j<width;j++)
430 | 		{
431 | 			int offset0 = (i*width+j)*nChannels;
432 | 			for(u=-fsize;u<=fsize;u++)
433 | 				for(v=-fsize;v<=fsize;v++)
434 | 				{
435 | 					w=pfilter2D[(u+fsize)*wsize+v+fsize];
436 | 					ii=EnforceRange(i+u,height);
437 | 					jj=EnforceRange(j+v,width);
438 | 					int offset=(ii*width+jj)*nChannels;
439 | 					for(k=0;k<nChannels;k++)
440 | 						pDstImage[offset+k]+=pSrcImage[offset0+k]*w;
441 | 				}
442 | 		}
443 | }
444 | 
445 | 
446 | //------------------------------------------------------------------------------------------------------------
447 | // function to sample a patch from the source image
448 | //------------------------------------------------------------------------------------------------------------
449 | template <class T1,class T2>
450 | void ImageProcessing::getPatch(const T1* pSrcImage,T2* pPatch,int width,int height,int nChannels,double x0,double y0,int wsize)
451 | {
452 | 	// suppose pPatch has been allocated and cleared before calling the function
453 | 	int wlength=wsize*2+1;
454 | 	double x,y;
455 | 	for(int i=-wsize;i<=wsize;i++)
456 | 		for(int j=-wsize;j<=wsize;j++)
457 | 		{
458 | 			y=y0+i;
459 | 			x=x0+j;
460 | 			if(x<0 || x>width-1 || y<0 || y>height-1)
461 | 				continue;
462 | 			BilinearInterpolate(pSrcImage,width,height,nChannels,x,y,pPatch+((i+wsize)*wlength+j+wsize)*nChannels);
463 | 		}
464 | }
465 | 
466 | //------------------------------------------------------------------------------------------------------------
467 | // function to warp an image with respect to flow field
468 | // pWarpIm2 has to be allocated before hands
469 | //------------------------------------------------------------------------------------------------------------
470 | template <class T1,class T2>
471 | void ImageProcessing::warpImage(T1 *pWarpIm2, const T1 *pIm1, const T1 *pIm2, const T2 *pVx, const T2 *pVy, int width, int height, int nChannels)
472 | {
473 | 	memset(pWarpIm2,0,sizeof(T1)*width*height*nChannels);
474 | 	for(int i=0;i<height;i++)
475 | 		for(int j=0;j<width;j++)
476 | 		{
477 | 			int offset=i*width+j;
478 | 			double x,y;
479 | 			y=i+pVy[offset];
480 | 			x=j+pVx[offset];
481 | 			offset*=nChannels;
482 | 			if(x<0 || x>width-1 || y<0 || y>height-1)
483 | 			{
484 | 				for(int k=0;k<nChannels;k++)
485 | 					pWarpIm2[offset+k]=pIm1[offset+k];
486 | 				continue;
487 | 			}
488 | 			BilinearInterpolate(pIm2,width,height,nChannels,x,y,pWarpIm2+offset);
489 | 		}
490 | }
491 | 
492 | template <class T1,class T2>
493 | void ImageProcessing::warpImageFlow(T1 *pWarpIm2, const T1 *pIm1, const T1 *pIm2, const T2 *pFlow, int width, int height, int nChannels)
494 | {
495 | 	memset(pWarpIm2,0,sizeof(T1)*width*height*nChannels);
496 | 	for(int i=0;i<height;i++)
497 | 		for(int j=0;j<width;j++)
498 | 		{
499 | 			int offset=i*width+j;
500 | 			double x,y;
501 | 			y=i+pFlow[offset*2+1];
502 | 			x=j+pFlow[offset*2];
503 | 			offset*=nChannels;
504 | 			if(x<0 || x>width-1 || y<0 || y>height-1)
505 | 			{
506 | 				for(int k=0;k<nChannels;k++)
507 | 					pWarpIm2[offset+k]=pIm1[offset+k];
508 | 				continue;
509 | 			}
510 | 			BilinearInterpolate(pIm2,width,height,nChannels,x,y,pWarpIm2+offset);
511 | 		}
512 | }
513 | 
514 | template <class T1,class T2>
515 | void ImageProcessing::warpImage(T1 *pWarpIm2,const T1 *pIm2, const T2 *pVx, const T2 *pVy, int width, int height, int nChannels)
516 | {
517 | 	memset(pWarpIm2,0,sizeof(T1)*width*height*nChannels);
518 | 	for(int i=0;i<height;i++)
519 | 		for(int j=0;j<width;j++)
520 | 		{
521 | 			int offset=i*width+j;
522 | 			double x,y;
523 | 			y=i+pVy[offset];
524 | 			x=j+pVx[offset];
525 | 			offset*=nChannels;
526 | 			if(x<0 || x>width-1 || y<0 || y>height-1)
527 | 				continue;
528 | 			BilinearInterpolate(pIm2,width,height,nChannels,x,y,pWarpIm2+offset);
529 | 		}
530 | }
531 | 
532 | template <class T1,class T2>
533 | void ImageProcessing::warpImage_transpose(T1 *pWarpIm2,const T1 *pIm2, const T2 *pVx, const T2 *pVy, int width, int height, int nChannels)
534 | {
535 | 	memset(pWarpIm2,0,sizeof(T1)*width*height*nChannels);
536 | 	for(int i=0;i<height;i++)
537 | 		for(int j=0;j<width;j++)
538 | 		{
539 | 			int offset=i*width+j;
540 | 			double x,y;
541 | 			y=i+pVy[offset];
542 | 			x=j+pVx[offset];
543 | 			offset*=nChannels;
544 | 			if(x<0 || x>width-1 || y<0 || y>height-1)
545 | 				continue;
546 | 			//BilinearInterpolate(pIm2,width,height,nChannels,x,y,pWarpIm2+offset);
547 | 			BilinearInterpolate_transpose(pIm2+offset,width,height,nChannels,x,y,pWarpIm2);
548 | 		}
549 | }
550 | 
551 | //////////////////////////////////////////////////////////////////////////////////////
552 | // different format
553 | //////////////////////////////////////////////////////////////////////////////////////
554 | template <class T1,class T2>
555 | void ImageProcessing::warpImage(T1 *pWarpIm2,const T1 *pIm2, const T2 *flow, int width, int height, int nChannels)
556 | {
557 | 	memset(pWarpIm2,0,sizeof(T1)*width*height*nChannels);
558 | 	for(int i=0;i<height;i++)
559 | 		for(int j=0;j<width;j++)
560 | 		{
561 | 			int offset=i*width+j;
562 | 			double x,y;
563 | 			y=i+flow[offset*2+1];
564 | 			x=j+flow[offset*2];
565 | 			offset*=nChannels;
566 | 			if(x<0 || x>width-1 || y<0 || y>height-1)
567 | 				continue;
568 | 			BilinearInterpolate(pIm2,width,height,nChannels,x,y,pWarpIm2+offset);
569 | 		}
570 | }
571 | 
572 | template <class T1,class T2>
573 | void ImageProcessing::warpImage_transpose(T1 *pWarpIm2,const T1 *pIm2, const T2 *flow, int width, int height, int nChannels)
574 | {
575 | 	memset(pWarpIm2,0,sizeof(T1)*width*height*nChannels);
576 | 	for(int i=0;i<height;i++)
577 | 		for(int j=0;j<width;j++)
578 | 		{
579 | 			int offset=i*width+j;
580 | 			double x,y;
581 | 			y=i+flow[offset*2+1];
582 | 			x=j+flow[offset*2];
583 | 			offset*=nChannels;
584 | 			if(x<0 || x>width-1 || y<0 || y>height-1)
585 | 				continue;
586 | 			//BilinearInterpolate(pIm2,width,height,nChannels,x,y,pWarpIm2+offset);
587 | 			BilinearInterpolate_transpose(pIm2+offset,width,height,nChannels,x,y,pWarpIm2);
588 | 		}
589 | }
590 | 
591 | 
592 | template <class T1,class T2,class T3>
593 | void ImageProcessing::warpImage(T1 *pWarpIm2, T3* pMask,const T1 *pIm1, const T1 *pIm2, const T2 *pVx, const T2 *pVy, int width, int height, int nChannels)
594 | {
595 | 	memset(pWarpIm2,0,sizeof(T1)*width*height*nChannels);
596 | 	for(int i=0;i<height;i++)
597 | 		for(int j=0;j<width;j++)
598 | 		{
599 | 			int offset=i*width+j;
600 | 			double x,y;
601 | 			y=i+pVy[offset];
602 | 			x=j+pVx[offset];
603 | 			offset*=nChannels;
604 | 			if(x<0 || x>width-1 || y<0 || y>height-1)
605 | 			{
606 | 				for(int k=0;k<nChannels;k++)
607 | 					pWarpIm2[offset+k]=pIm1[offset+k];
608 | 				pMask[i*width+j]=0;
609 | 				continue;
610 | 			}
611 | 			pMask[i*width+j]=1;
612 | 			BilinearInterpolate(pIm2,width,height,nChannels,x,y,pWarpIm2+offset);
613 | 		}
614 | }
615 | 
616 | //------------------------------------------------------------------------------------------------------------
617 | // function to crop an image from the source
618 | // assume that pDstImage has been allocated
619 | // also Left and Top must be valid, DstWidth and DstHeight should ensure that the image lies
620 | // inside the image boundary
621 | //------------------------------------------------------------------------------------------------------------
622 | template <class T1,class T2>
623 | void ImageProcessing::cropImage(const T1 *pSrcImage, int SrcWidth, int SrcHeight, int nChannels, T2 *pDstImage, int Left, int Top, int DstWidth, int DstHeight)
624 | {
625 | 	if(typeid(T1)==typeid(T2))
626 | 	{
627 | 		for(int i=0;i<DstHeight;i++)
628 | 			memcpy(pDstImage+i*DstWidth*nChannels,pSrcImage+((i+Top)*SrcWidth+Left)*nChannels,sizeof(T1)*DstWidth*nChannels);
629 | 		return;
630 | 	}
631 | 	int offsetSrc,offsetDst;
632 | 	for(int i=0;i<DstHeight;i++)
633 | 		for(int j=0;j<DstWidth;j++)
634 | 		{
635 | 			offsetSrc=((i+Top)*SrcWidth+Left+j)*nChannels;
636 | 			offsetDst=(i*DstWidth+j)*nChannels;
637 | 			for(int k=0;k<nChannels;k++)
638 | 				pDstImage[offsetDst+k]=pSrcImage[offsetSrc+k];
639 | 		}
640 | }
641 | 
642 | //------------------------------------------------------------------------------------------------------------
643 | // function to generate a 2D Gaussian image
644 | // pImage must be allocated before calling the function
645 | //------------------------------------------------------------------------------------------------------------
646 | template <class T>
647 | void ImageProcessing::generate2DGaussian(T*& pImage, int wsize, double sigma)
648 | {
649 | 	if(sigma==-1)
650 | 		sigma=wsize/2;
651 | 	double alpha=1/(2*sigma*sigma);
652 | 	int winlength=wsize*2+1;
653 | 	if(pImage==NULL)
654 | 		pImage=new T[winlength*winlength];
655 | 	double total = 0;
656 | 	for(int i=-wsize;i<=wsize;i++)
657 | 		for(int j=-wsize;j<=wsize;j++)
658 | 		{
659 | 			pImage[(i+wsize)*winlength+j+wsize]=exp(-(double)(i*i+j*j)*alpha);
660 | 			total += pImage[(i+wsize)*winlength+j+wsize];
661 | 		}
662 | 	for(int i = 0;i<winlength*winlength;i++)
663 | 		pImage[i]/=total;
664 | }
665 | 
666 | //------------------------------------------------------------------------------------------------------------
667 | // function to generate a 1D Gaussian image
668 | // pImage must be allocated before calling the function
669 | //------------------------------------------------------------------------------------------------------------
670 | template <class T>
671 | void ImageProcessing::generate1DGaussian(T*& pImage, int wsize, double sigma)
672 | {
673 | 	if(sigma==-1)
674 | 		sigma=wsize/2;
675 | 	double alpha=1/(2*sigma*sigma);
676 | 	int winlength=wsize*2+1;
677 | 	if(pImage==NULL)
678 | 		pImage=new T[winlength];
679 | 	double total = 0;
680 | 	for(int i=-wsize;i<=wsize;i++)
681 | 	{
682 | 		pImage[i+wsize]=exp(-(double)(i*i)*alpha);
683 | 		total += pImage[i+wsize];
684 | 	}
685 | 	for(int i = 0;i<winlength;i++)
686 | 		pImage[i]/=total;
687 | }
688 | 
689 | #endif
690 | 


--------------------------------------------------------------------------------
/src/Matrix.h:
--------------------------------------------------------------------------------
  1 | // Author: Ce Liu (c) Dec, 2009; celiu@mit.edu
  2 | // Modified By: Deepak Pathak (c) 2016; pathak@berkeley.edu
  3 | 
  4 | #pragma once
  5 | 
  6 | #include "stdio.h"
  7 | #include "Vector.h"
  8 | #include "project.h"
  9 | #ifdef _QT
 10 | 	#include <QFile>
 11 | #endif
 12 | #include <iostream>
 13 | 
 14 | using namespace std;
 15 | 
 16 | template <class T=double>
 17 | class Matrix
 18 | {
 19 | private:
 20 | 	int nRow,nCol;
 21 | 	double* pData;
 22 | 	static bool IsDispInfo;
 23 | public:
 24 | 	Matrix(void);
 25 | 	Matrix(int _nrow,int _ncol,double* data=NULL);
 26 | 	Matrix(const Matrix<T>& matrix);
 27 | 	~Matrix(void);
 28 | 	void releaseData();
 29 | 	void copyData(const Matrix<T>& matrix);
 30 | 	void allocate(const Matrix<T>& matrix);
 31 | 	void allocate(int _nrow,int _ncol);
 32 | 	void reset();
 33 | 	bool dimMatch(const Matrix<T>& matrix) const;
 34 | 	bool dimcheck(const Matrix<T>& matrix) const;
 35 | 	void loadData(int _nrow,int _ncol,T* data);
 36 | 	static void enableDispInfo(bool dispInfo=false){IsDispInfo=dispInfo;};
 37 | 	// display the matrix
 38 | 	void printMatrix();
 39 | 	void identity(int ndim);
 40 | 
 41 | 	// function to access the member variables
 42 | 	inline int nrow() const{return nRow;};
 43 | 	inline int ncol() const{return nCol;};
 44 | 	inline double* data() {return pData;};
 45 | 	inline const double* data() const {return (const double*)pData;};
 46 | 	inline double operator [](int index) const{return pData[index];};
 47 | 	inline double& operator[](int index) {return pData[index];};
 48 | 	inline double data(int row,int col)const {return pData[row*nCol+col];};
 49 | 	inline double& data(int row,int col) {return pData[row*nCol+col];};
 50 | 	bool matchDimension(int _nrow,int _ncol) const {if(nRow==_nrow && nCol==_ncol) return true; else return false;};
 51 | 	bool matchDimension(const Matrix<T>& matrix) const {return matchDimension(matrix.nrow(),matrix.ncol());};
 52 | 
 53 | 	// functions to check dimensions
 54 | 	bool checkDimRight(const Vector<T>& vector) const;
 55 | 	bool checkDimRight(const Matrix<T>& matrix) const;
 56 | 	bool checkDimLeft(const Vector<T>& vector) const;
 57 | 	bool checkDimLeft(const Matrix<T>& matrix) const;
 58 | 
 59 | 	// functions for matrix computation
 60 | 	void Multiply(Vector<T>& result,const Vector<T>& vect) const;
 61 | 	void Multiply(Matrix<T>& result,const Matrix<T>& matrix) const;
 62 | 
 63 | 	void transpose(Matrix& result) const;
 64 | 	void fromVector(const Vector<T>& vect);
 65 | 	double norm2() const;
 66 | 	double sum() const
 67 | 	{
 68 | 		double total = 0;
 69 | 		for(int i = 0;i<nCol*nRom;i++)
 70 | 			total += pData[i];
 71 | 		return total;
 72 | 	}
 73 | 	// operators
 74 | 	Matrix& operator=(const Matrix<T>& matrix);
 75 | 
 76 | 	Matrix& operator+=(double val);
 77 | 	Matrix& operator-=(double val);
 78 | 	Matrix& operator*=(double val);
 79 | 	Matrix& operator/=(double val);
 80 | 
 81 | 	Matrix& operator+=(const Matrix<T>& matrix);
 82 | 	Matrix& operator-=(const Matrix<T>& matrix);
 83 | 	Matrix& operator*=(const Matrix<T>& matrix);
 84 | 	Matrix& operator/=(const Matrix<T>& matrix);
 85 | 
 86 | 	friend Vector<T> operator*(const Matrix<T>& matrix,const Vector<T>& vect);
 87 | 	friend Matrix<T> operator*(const Matrix<T>& matrix1,const Matrix<T>& matrix2);
 88 | 
 89 | 
 90 | 	// solve linear systems
 91 | 	void SolveLinearSystem(Vector<T>& result,const Vector<T>& b) const;
 92 | 	void ConjugateGradient(Vector<T>& result,const Vector<T>& b) const;
 93 | 
 94 | #ifdef _QT
 95 | 	bool writeMatrix(QFile& file) const;
 96 | 	bool readMatrix(QFile& file);
 97 | #endif
 98 | #ifdef _MATLAB
 99 | 	void readMatrix(const mxArray* prhs);
100 | 	void writeMatrix(mxArray*& prhs) const;
101 | #endif
102 | };
103 | 
104 | template<class T>
105 | bool Matrix<T>::IsDispInfo=false;
106 | 
107 | template<class T>
108 | Matrix<T>::Matrix(void)
109 | {
110 | 	nRow=nCol=0;
111 | 	pData=NULL;
112 | }
113 | 
114 | template<class T>
115 | Matrix<T>::Matrix(int nrow,int ncol,double* data)
116 | {
117 | 	nRow=nrow;
118 | 	nCol=ncol;
119 | 	pData=new T[nRow*nCol];
120 | 	if(data==NULL)
121 | 		memset(pData,0,sizeof(T)*nRow*nCol);
122 | 	else
123 | 		memcpy(pData,data,sizeof(T)*nRow*nCol);
124 | }
125 | 
126 | template<class T>
127 | Matrix<T>::Matrix(const Matrix<T>& matrix)
128 | {
129 | 	nRow=nCol=0;
130 | 	pData=NULL;
131 | 	copyData(matrix);
132 | }
133 | 
134 | template<class T>
135 | Matrix<T>::~Matrix(void)
136 | {
137 | 	releaseData();
138 | }
139 | 
140 | template<class T>
141 | void Matrix<T>::releaseData()
142 | {
143 | 	if(pData!=NULL)
144 | 		delete pData;
145 | 	pData=NULL;
146 | 	nRow=nCol=0;
147 | }
148 | 
149 | template<class T>
150 | void Matrix<T>::copyData(const Matrix<T> &matrix)
151 | {
152 | 	if(!dimMatch(matrix))
153 | 		allocate(matrix);
154 | 	memcpy(pData,matrix.pData,sizeof(T)*nRow*nCol);
155 | }
156 | 
157 | template<class T>
158 | bool Matrix<T>::dimMatch(const Matrix<T>& matrix) const
159 | {
160 | 	if(nCol==matrix.nCol && nRow==matrix.nRow)
161 | 		return true;
162 | 	else
163 | 		return false;
164 | }
165 | 
166 | template<class T>
167 | bool Matrix<T>::dimcheck(const Matrix<T>& matrix) const
168 | {
169 | 	if(!dimMatch(matrix))
170 | 	{
171 | 		cout<<"The dimensions of the matrices don't match!"<<endl;
172 | 		return false;
173 | 	}
174 | 	return true;
175 | }
176 | 
177 | template<class T>
178 | void Matrix<T>::reset()
179 | {
180 | 	if(pData!=NULL)
181 | 		memset(pData,0,sizeof(T)*nRow*nCol);
182 | }
183 | 
184 | template<class T>
185 | void Matrix<T>::allocate(int nrow,int ncol)
186 | {
187 | 	releaseData();
188 | 	nRow=nrow;
189 | 	nCol=ncol;
190 | 	if(nRow*nCol>0)
191 | 	{
192 | 		pData=new T[nRow*nCol];
193 | 		memset(pData,0,sizeof(T)*nRow*nCol);
194 | 	}
195 | }
196 | 
197 | template<class T>
198 | void Matrix<T>::allocate(const Matrix<T>& matrix)
199 | {
200 | 	allocate(matrix.nRow,matrix.nCol);
201 | }
202 | 
203 | template<class T>
204 | void Matrix<T>::loadData(int _nrow, int _ncol, T *data)
205 | {
206 | 	if(!matchDimension(_nrow,_ncol))
207 | 		allocate(_nrow,_ncol);
208 | 	memcpy(pData,data,sizeof(T)*nRow*nCol);
209 | }
210 | 
211 | template<class T>
212 | void Matrix<T>::printMatrix()
213 | {
214 | 	for(int i=0;i<nRow;i++)
215 | 	{
216 | 		for(int j=0;j<nCol;j++)
217 | 			cout<<pData[i*nCol+j]<<" ";
218 | 		cout<<endl;
219 | 	}
220 | }
221 | 
222 | template<class T>
223 | void Matrix<T>::identity(int ndim)
224 | {
225 | 	allocate(ndim,ndim);
226 | 	reset();
227 | 	for(int i=0;i<ndim;i++)
228 | 		pData[i*ndim+i]=1;
229 | }
230 | 
231 | //--------------------------------------------------------------------------------------------------
232 | // functions to check dimensionalities
233 | //--------------------------------------------------------------------------------------------------
234 | template<class T>
235 | bool Matrix<T>::checkDimRight(const Vector<T>& vect) const
236 | {
237 | 	if(nCol==vect.dim())
238 | 		return true;
239 | 	else
240 | 	{
241 | 		cout<<"The matrix and vector don't match in multiplication!"<<endl;
242 | 		return false;
243 | 	}
244 | }
245 | 
246 | template<class T>
247 | bool Matrix<T>::checkDimRight(const Matrix<T> &matrix) const
248 | {
249 | 	if(nCol==matrix.nrow())
250 | 		return true;
251 | 	else
252 | 	{
253 | 		cout<<"The matrix and matrix don't match in multiplication!"<<endl;
254 | 		return false;
255 | 	}
256 | }
257 | 
258 | template<class T>
259 | bool Matrix<T>::checkDimLeft(const Vector<T>& vect) const
260 | {
261 | 	if(nRow==vect.dim())
262 | 		return true;
263 | 	else
264 | 	{
265 | 		cout<<"The vector and matrix don't match in multiplication!"<<endl;
266 | 		return false;
267 | 	}
268 | }
269 | 
270 | template<class T>
271 | bool Matrix<T>::checkDimLeft(const Matrix<T> &matrix) const
272 | {
273 | 	if(nRow==matrix.ncol())
274 | 		return true;
275 | 	else
276 | 	{
277 | 		cout<<"The matrix and matrix don't match in multiplication!"<<endl;
278 | 		return false;
279 | 	}
280 | }
281 | 
282 | //--------------------------------------------------------------------------------------------------
283 | // functions for numerical computation
284 | //--------------------------------------------------------------------------------------------------
285 | template<class T>
286 | void Matrix<T>::Multiply(Vector<T> &result, const Vector<T>&vect) const
287 | {
288 | 	checkDimRight(vect);
289 | 	if(result.dim()!=nRow)
290 | 		result.allocate(nRow);
291 | 	for(int i=0;i<nRow;i++)
292 | 	{
293 | 		double temp=0;
294 | 		for(int j=0;j<nCol;j++)
295 | 			temp+=pData[i*nCol+j]*vect.data()[j];
296 | 		result.data()[i]=temp;
297 | 	}
298 | }
299 | 
300 | template<class T>
301 | void Matrix<T>::Multiply(Matrix<T> &result, const Matrix<T> &matrix) const
302 | {
303 | 	checkDimRight(matrix);
304 | 	if(!result.matchDimension(nRow,matrix.nCol))
305 | 		result.allocate(nRow,matrix.nCol);
306 | 	for(int i=0;i<nRow;i++)
307 | 		for(int j=0;j<matrix.nCol;j++)
308 | 		{
309 | 			double temp=0;
310 | 			for(int k=0;k<nCol;k++)
311 | 				temp+=pData[i*nCol+k]*matrix.pData[k*matrix.nCol+j];
312 | 			result.pData[i*matrix.nCol+j]=temp;
313 | 		}
314 | }
315 | 
316 | template<class T>
317 | void Matrix<T>::transpose(Matrix<T> &result) const
318 | {
319 | 	if(!result.matchDimension(nCol,nRow))
320 | 		result.allocate(nCol,nRow);
321 | 	for(int i=0;i<nCol;i++)
322 | 		for(int j=0;j<nRow;j++)
323 | 			result.pData[i*nRow+j]=pData[j*nCol+i];
324 | }
325 | 
326 | template<class T>
327 | void Matrix<T>::fromVector(const Vector<T>&vect)
328 | {
329 | 	if(!matchDimension(vect.dim(),1))
330 | 		allocate(vect.dim(),1);
331 | 	memcpy(pData,vect.data(),sizeof(double)*vect.dim());
332 | }
333 | 
334 | template<class T>
335 | double Matrix<T>::norm2() const
336 | {
337 | 	if(pData==NULL)
338 | 		return 0;
339 | 	double temp=0;
340 | 	for(int i=0;i<nCol*nRow;i++)
341 | 		temp+=pData[i]*pData[i];
342 | 	return temp;
343 | }
344 | 
345 | //--------------------------------------------------------------------------------------------------
346 | // operators
347 | //--------------------------------------------------------------------------------------------------
348 | template<class T>
349 | Matrix<T>& Matrix<T>::operator=(const Matrix<T>& matrix)
350 | {
351 | 	copyData(matrix);
352 | 	return *this;
353 | }
354 | 
355 | template<class T>
356 | Matrix<T>& Matrix<T>::operator +=(double val)
357 | {
358 | 	for(int i=0;i<nCol*nRow;i++)
359 | 		pData[i]+=val;
360 | 	return *this;
361 | }
362 | 
363 | template<class T>
364 | Matrix<T>& Matrix<T>::operator -=(double val)
365 | {
366 | 	for(int i=0;i<nCol*nRow;i++)
367 | 		pData[i]-=val;
368 | 	return *this;
369 | }
370 | 
371 | template<class T>
372 | Matrix<T>& Matrix<T>::operator *=(double val)
373 | {
374 | 	for(int i=0;i<nCol*nRow;i++)
375 | 		pData[i]*=val;
376 | 	return *this;
377 | }
378 | 
379 | template<class T>
380 | Matrix<T>& Matrix<T>::operator /=(double val)
381 | {
382 | 	for(int i=0;i<nCol*nRow;i++)
383 | 		pData[i]/=val;
384 | 	return *this;
385 | }
386 | 
387 | template<class T>
388 | Matrix<T>& Matrix<T>::operator +=(const Matrix<T> &matrix)
389 | {
390 | 	dimcheck(matrix);
391 | 	for(int i=0;i<nCol*nRow;i++)
392 | 		pData[i]+=matrix.pData[i];
393 | 	return *this;
394 | }
395 | 
396 | template<class T>
397 | Matrix<T>& Matrix<T>::operator -=(const Matrix<T> &matrix)
398 | {
399 | 	dimcheck(matrix);
400 | 	for(int i=0;i<nCol*nRow;i++)
401 | 		pData[i]-=matrix.pData[i];
402 | 	return *this;
403 | }
404 | 
405 | template<class T>
406 | Matrix<T>& Matrix<T>::operator *=(const Matrix<T> &matrix)
407 | {
408 | 	dimcheck(matrix);
409 | 	for(int i=0;i<nCol*nRow;i++)
410 | 		pData[i]*=matrix.pData[i];
411 | 	return *this;
412 | }
413 | 
414 | template<class T>
415 | Matrix<T>& Matrix<T>::operator /=(const Matrix<T> &matrix)
416 | {
417 | 	dimcheck(matrix);
418 | 	for(int i=0;i<nCol*nRow;i++)
419 | 		pData[i]/=matrix.pData[i];
420 | 	return *this;
421 | }
422 | 
423 | template<class T>
424 | Vector<T> operator*(const Matrix<T>& matrix,const Vector<T>& vect)
425 | {
426 | 	Vector<T> result;
427 | 	matrix.Multiply(result,vect);
428 | 	return result;
429 | }
430 | 
431 | template<class T>
432 | Matrix<T> operator*(const Matrix<T>& matrix1,const Matrix<T>& matrix2)
433 | {
434 | 	Matrix<T> result;
435 | 	matrix1.Multiply(result,matrix2);
436 | 	return result;
437 | }
438 | 
439 | //--------------------------------------------------------------------------------------------------
440 | // function for conjugate gradient method
441 | //--------------------------------------------------------------------------------------------------
442 | template<class T>
443 | void Matrix<T>::ConjugateGradient(Vector<T> &result, const Vector<T>&b) const
444 | {
445 | 	if(nCol!=nRow)
446 | 	{
447 | 		cout<<"Error: when solving Ax=b, A is not square!"<<endl;
448 | 		return;
449 | 	}
450 | 	checkDimRight(b);
451 | 	if(!result.matchDimension(b))
452 | 		result.allocate(b);
453 | 
454 | 	Vector<T> r(b),p,q;
455 | 	result.reset();
456 | 
457 | 	int nIterations=nRow*5;
458 | 	Vector<T> rou(nIterations);
459 | 	for(int k=0;k<nIterations;k++)
460 | 	{
461 | 		rou[k]=r.norm2();
462 | 		if(IsDispInfo)
463 | 			cout<<rou[k]<<endl;
464 | 
465 | 		if(rou[k]<1E-20)
466 | 			break;
467 | 		if(k==0)
468 | 			p=r;
469 | 		else
470 | 		{
471 | 			double ratio=rou[k]/rou[k-1];
472 | 			p=r+p*ratio;
473 | 		}
474 | 		Multiply(q,p);
475 | 		double alpha=rou[k]/innerproduct(p,q);
476 | 		result+=p*alpha;
477 | 		r-=q*alpha;
478 | 	}
479 | }
480 | 
481 | template<class T>
482 | void Matrix<T>::SolveLinearSystem(Vector<T> &result, const Vector<T>&b) const
483 | {
484 | 	if(nCol==nRow)
485 | 	{
486 | 		ConjugateGradient(result,b);
487 | 		return;
488 | 	}
489 | 	if(nRow<nCol)
490 | 	{
491 | 		cout<<"Not enough observations for parameter estimation!"<<endl;
492 | 		return;
493 | 	}
494 | 	Matrix<T> AT,ATA;
495 | 	transpose(AT);
496 | 	AT.Multiply(ATA,*this);
497 | 	Vector<T> ATb;
498 | 	AT.Multiply(ATb,b);
499 | 	ATA.ConjugateGradient(result,ATb);
500 | }
501 | 
502 | #ifdef _QT
503 | 
504 | template<class T>
505 | bool Matrix<T>::writeMatrix(QFile &file) const
506 | {
507 | 	file.write((char *)&nRow,sizeof(int));
508 | 	file.write((char *)&nCol,sizeof(int));
509 | 	if(file.write((char *)pData,sizeof(double)*nRow*nCol)!=sizeof(double)*nRow*nCol)
510 | 		return false;
511 | 	return true;
512 | }
513 | 
514 | template<class T>
515 | bool Matrix<T>::readMatrix(QFile &file)
516 | {
517 | 	releaseData();
518 | 	file.read((char *)&nRow,sizeof(int));
519 | 	file.read((char *)&nCol,sizeof(int));
520 | 	if(nRow*nCol>0)
521 | 	{
522 | 		allocate(nRow,nCol);
523 | 		if(file.read((char *)pData,sizeof(double)*nRow*nCol)!=sizeof(double)*nRow*nCol)
524 | 			return false;
525 | 	}
526 | 	return true;
527 | }
528 | #endif
529 | 
530 | #ifdef _MATLAB
531 | 
532 | template<class T>
533 | void Matrix<T>::readMatrix(const mxArray* prhs)
534 | {
535 | 	if(pData!=NULL)
536 | 		delete pData;
537 | 	int nElements = mxGetNumberOfDimensions(prhs);
538 | 	if(nElements>2)
539 | 		mexErrMsgTxt("A matrix is expected to be loaded!");
540 | 	const int* dims = mxGetDimensions(prhs);
541 | 	allocate(dims[0],dims[1]);
542 | 	double* data = (double*)mxGetData(prhs);
543 | 	for(int i =0; i<nRow; i++)
544 | 		for(int j =0; j<nCol; j++)
545 | 			pData[i*nCol+j] = data[j*nRow+i];
546 | }
547 | 
548 | template<class T>
549 | void Matrix<T>::writeMatrix(mxArray*& plhs) const
550 | {
551 | 	int dims[2];
552 | 	dims[0]=nRow;dims[1]=nCol;
553 | 	plhs=mxCreateNumericArray(2, dims,mxDOUBLE_CLASS, mxREAL);
554 | 	double* data = (double *)mxGetData(plhs);
555 | 	for(int i =0; i<nRow; i++)
556 | 		for(int j =0; j<nCol; j++)
557 | 			data[j*nRow+i] = pData[i*nCol+j];
558 | }
559 | #endif
560 | 


--------------------------------------------------------------------------------
/src/NoiseModel.h:
--------------------------------------------------------------------------------
  1 | // Author: Ce Liu (c) Dec, 2009; celiu@mit.edu
  2 | // Modified By: Deepak Pathak (c) 2016; pathak@berkeley.edu
  3 | 
  4 | #pragma once
  5 | 
  6 | #include "stdio.h"
  7 | #include "Vector.h"
  8 | #include <iostream>
  9 | 
 10 | #ifndef PI
 11 | #define PI 3.1415926535897932384626433832
 12 | #endif
 13 | 
 14 | using namespace std;
 15 | 
 16 | class GaussianMixture
 17 | {
 18 | public:
 19 | 	int nChannels;
 20 | 	double* alpha;
 21 | 	double* sigma;
 22 | 	double* beta;
 23 | 	double* sigma_square;
 24 | 	double* beta_square;
 25 | public:
 26 | 	GaussianMixture()
 27 | 	{
 28 | 		nChannels = 0;
 29 | 		alpha = sigma = beta = sigma_square = beta_square = NULL;
 30 | 	}
 31 | 	GaussianMixture(int _nChannels)
 32 | 	{
 33 | 		nChannels = _nChannels;
 34 | 		allocate();
 35 | 		for(int i = 0;i<nChannels;i++)
 36 | 		{
 37 | 			alpha[i] = 0.95;
 38 | 			sigma[i] = 0.05;
 39 | 			beta[i] = 0.5;
 40 | 		}
 41 | 		square();
 42 | 	}
 43 | 	GaussianMixture(const GaussianMixture& GM)
 44 | 	{
 45 | 		clear();
 46 | 		copy(GM);
 47 | 	}
 48 | 	void copy(const GaussianMixture& GM)
 49 | 	{
 50 | 		nChannels = GM.nChannels;
 51 | 		allocate();
 52 | 		for(int i  = 0;i<nChannels;i++)
 53 | 		{
 54 | 			alpha[i]  = GM.alpha[i];
 55 | 			sigma[i] = GM.sigma[i];
 56 | 			beta[i]    = GM.beta[i];
 57 | 		}
 58 | 		square();
 59 | 	}
 60 | 	void operator=(const GaussianMixture& GM)
 61 | 	{
 62 | 		clear();
 63 | 		copy(GM);
 64 | 	}
 65 | 	GaussianMixture shrink(int N)
 66 | 	{
 67 | 		GaussianMixture GM(N);
 68 | 		for(int i = 0;i<N;i++)
 69 | 		{
 70 | 			GM.alpha[i]  = alpha[i];
 71 | 			GM.sigma[i] = sigma[i];
 72 | 			GM.beta[i]    = beta[i];
 73 | 		}
 74 | 		GM.square();
 75 | 		return GM;
 76 | 	}
 77 | 	void allocate()
 78 | 	{
 79 | 		alpha = new double[nChannels];
 80 | 		sigma = new double[nChannels];
 81 | 		beta = new double[nChannels];
 82 | 		sigma_square = new double[nChannels];
 83 | 		beta_square = new double[nChannels];
 84 | 	}
 85 | 	void clear()
 86 | 	{
 87 | 		if(!alpha)
 88 | 			delete []alpha;
 89 | 		if(!sigma)
 90 | 			delete []sigma;
 91 | 		if(!beta)
 92 | 			delete []beta;
 93 | 		if(!sigma_square)
 94 | 			delete []sigma_square;
 95 | 		if(!beta_square)
 96 | 			delete []beta_square;
 97 | 		alpha = sigma = beta = sigma_square = beta_square = NULL;
 98 | 	}
 99 | 	void reset()
100 | 	{
101 | 		//for(int i = 0;i<nChannels;i++)
102 | 		//	alpha[i] = sigma[i] = beta[i] = sigma_square[i] = beta_square[i] = 0;
103 | 		for(int i = 0;i<nChannels;i++)
104 | 		{
105 | 			alpha[i] = 0.95;
106 | 			sigma[i] = 0.05;
107 | 			beta[i] = 0.5;
108 | 		}
109 | 		square();
110 | 	}
111 | 	void reset(int _nChannels)
112 | 	{
113 | 		clear();
114 | 		nChannels = _nChannels;
115 | 		allocate();
116 | 		reset();
117 | 	}
118 | 	double Gaussian(double x,int i,int k) const
119 | 	{
120 | 		if(i==0)
121 | 			 return exp(-x/(2*sigma_square[k]))/(2*PI*sigma[k]);
122 | 		else
123 | 			return exp(-x/(2*beta_square[k]))/(2*PI*beta[k]);
124 | 	}
125 | 	~GaussianMixture()
126 | 	{
127 | 		clear();
128 | 	}
129 | 	void square()
130 | 	{
131 | 		for(int i =0;i<nChannels;i++)
132 | 		{
133 | 			sigma_square[i] = sigma[i]*sigma[i];
134 | 			beta_square[i] = beta[i]*beta[i];
135 | 		}
136 | 	}
137 | 	void display()
138 | 	{
139 | 		for(int i = 0;i<nChannels;i++)
140 | 			cout<<"alpha: "<<alpha[i] << " sigma: "<<sigma[i]<<" beta: "<<beta[i]<<" sigma^2: "<<sigma_square[i]<<" beta^2: "<<beta_square[i]<<endl;
141 | 	}
142 | 	bool write(const char* filename)
143 | 	{
144 | 		ofstream myfile(filename,ios::out | ios::binary);
145 | 		if(myfile.is_open())
146 | 		{
147 | 			bool foo = write(myfile);
148 | 			myfile.close();
149 | 			return foo;
150 | 		}
151 | 		return false;
152 | 	}
153 | 	bool write(ofstream& myfile)
154 | 	{
155 | 		myfile.write((char *)&nChannels,sizeof(int));
156 | 		myfile.write((char *)alpha,sizeof(double)*nChannels);
157 | 		myfile.write((char *)sigma,sizeof(double)*nChannels);
158 | 		myfile.write((char *)beta,sizeof(double)*nChannels);
159 | 		return true;
160 | 	}
161 | 	bool read(const char* filename)
162 | 	{
163 | 		ifstream myfile(filename, ios::in | ios::binary);
164 | 		if(myfile.is_open())
165 | 		{
166 | 			bool foo = read(myfile);
167 | 			myfile.close();
168 | 			square();
169 | 			return foo;
170 | 		}
171 | 		return false;
172 | 	}
173 | 	bool read(ifstream& myfile)
174 | 	{
175 | 		myfile.read((char *)&nChannels,sizeof(int));
176 | 		allocate();
177 | 		myfile.read((char *)alpha,sizeof(double)*nChannels);
178 | 		myfile.read((char *)sigma,sizeof(double)*nChannels);
179 | 		myfile.read((char *)beta,sizeof(double)*nChannels);
180 | 		square();
181 | 		return true;
182 | 	}
183 | };
184 | 
185 | //class Laplacian
186 | //{
187 | //public:
188 | //	int nChannels;
189 | //	Vector<double> scale;
190 | //public:
191 | //	Laplacian()
192 | //	{
193 | //	}
194 | //	Laplacian(int _nChannels)
195 | //	{
196 | //		nChannels = _nChannels;
197 | //		scale.allocate(nChannels);
198 | //	}
199 | //	Laplacian(const Laplacian
200 | //
201 | //};
202 | 


--------------------------------------------------------------------------------
/src/OpticalFlow.cpp:
--------------------------------------------------------------------------------
   1 | // Author: Ce Liu (c) Dec, 2009; celiu@mit.edu
   2 | // Modified By: Deepak Pathak (c) 2016; pathak@berkeley.edu
   3 | 
   4 | #include "OpticalFlow.h"
   5 | #include "ImageProcessing.h"
   6 | #include "GaussianPyramid.h"
   7 | #include <cstdlib>
   8 | #include <iostream>
   9 | 
  10 | using namespace std;
  11 | 
  12 | #ifndef _MATLAB
  13 | 	bool OpticalFlow::IsDisplay=true;
  14 | #else
  15 | 	bool OpticalFlow::IsDisplay=false;
  16 | #endif
  17 | 
  18 | //OpticalFlow::InterpolationMethod OpticalFlow::interpolation = OpticalFlow::Bicubic;
  19 | OpticalFlow::InterpolationMethod OpticalFlow::interpolation = OpticalFlow::Bilinear;
  20 | OpticalFlow::NoiseModel OpticalFlow::noiseModel = OpticalFlow::Lap;
  21 | GaussianMixture OpticalFlow::GMPara;
  22 | Vector<double> OpticalFlow::LapPara;
  23 | 
  24 | 
  25 | OpticalFlow::OpticalFlow(void)
  26 | {
  27 | }
  28 | 
  29 | OpticalFlow::~OpticalFlow(void)
  30 | {
  31 | }
  32 | 
  33 | //--------------------------------------------------------------------------------------------------------
  34 | //  function to compute dx, dy and dt for motion estimation
  35 | //--------------------------------------------------------------------------------------------------------
  36 | void OpticalFlow::getDxs(DImage &imdx, DImage &imdy, DImage &imdt, const DImage &im1, const DImage &im2)
  37 | {
  38 | 	//double gfilter[5]={0.01,0.09,0.8,0.09,0.01};
  39 | 	double gfilter[5]={0.02,0.11,0.74,0.11,0.02};
  40 | 	//double gfilter[5]={0,0,1,0,0};
  41 | 	if(1)
  42 | 	{
  43 | 		//DImage foo,Im;
  44 | 		//Im.Add(im1,im2);
  45 | 		//Im.Multiplywith(0.5);
  46 | 		////foo.imfilter_hv(Im,gfilter,2,gfilter,2);
  47 | 		//Im.dx(imdx,true);
  48 | 		//Im.dy(imdy,true);
  49 | 		//imdt.Subtract(im2,im1);
  50 | 		DImage Im1,Im2,Im;
  51 | 
  52 | 		im1.imfilter_hv(Im1,gfilter,2,gfilter,2);
  53 | 		im2.imfilter_hv(Im2,gfilter,2,gfilter,2);
  54 | 		Im.copyData(Im1);
  55 | 		Im.Multiplywith(0.4);
  56 | 		Im.Add(Im2,0.6);
  57 | 		//Im.Multiplywith(0.5);
  58 | 		//Im1.copyData(im1);
  59 | 		//Im2.copyData(im2);
  60 | 
  61 | 		Im.dx(imdx,true);
  62 | 		Im.dy(imdy,true);
  63 | 		imdt.Subtract(Im2,Im1);
  64 | 	}
  65 | 	else
  66 | 	{
  67 | 		// Im1 and Im2 are the smoothed version of im1 and im2
  68 | 		DImage Im1,Im2;
  69 | 
  70 | 		im1.imfilter_hv(Im1,gfilter,2,gfilter,2);
  71 | 		im2.imfilter_hv(Im2,gfilter,2,gfilter,2);
  72 | 
  73 | 		//Im1.copyData(im1);
  74 | 		//Im2.copyData(im2);
  75 | 
  76 | 		Im2.dx(imdx,true);
  77 | 		Im2.dy(imdy,true);
  78 | 		imdt.Subtract(Im2,Im1);
  79 | 	}
  80 | 
  81 | 
  82 | 	imdx.setDerivative();
  83 | 	imdy.setDerivative();
  84 | 	imdt.setDerivative();
  85 | }
  86 | 
  87 | //--------------------------------------------------------------------------------------------------------
  88 | // function to do sanity check: imdx*du+imdy*dv+imdt=0
  89 | //--------------------------------------------------------------------------------------------------------
  90 | void OpticalFlow::SanityCheck(const DImage &imdx, const DImage &imdy, const DImage &imdt, double du, double dv)
  91 | {
  92 | 	if(imdx.matchDimension(imdy)==false || imdx.matchDimension(imdt)==false)
  93 | 	{
  94 | 		cout<<"The dimensions of the derivatives don't match!"<<endl;
  95 | 		return;
  96 | 	}
  97 | 	const _FlowPrecision* pImDx,*pImDy,*pImDt;
  98 | 	pImDx=imdx.data();
  99 | 	pImDy=imdy.data();
 100 | 	pImDt=imdt.data();
 101 | 	double error=0;
 102 | 	for(int i=0;i<imdx.height();i++)
 103 | 		for(int j=0;j<imdx.width();j++)
 104 | 			for(int k=0;k<imdx.nchannels();k++)
 105 | 			{
 106 | 				int offset=(i*imdx.width()+j)*imdx.nchannels()+k;
 107 | 				double temp=pImDx[offset]*du+pImDy[offset]*dv+pImDt[offset];
 108 | 				error+=fabs(temp);
 109 | 			}
 110 | 	error/=imdx.nelements();
 111 | 	cout<<"The mean error of |dx*u+dy*v+dt| is "<<error<<endl;
 112 | }
 113 | 
 114 | //--------------------------------------------------------------------------------------------------------
 115 | // function to warp image based on the flow field
 116 | //--------------------------------------------------------------------------------------------------------
 117 | void OpticalFlow::warpFL(DImage &warpIm2, const DImage &Im1, const DImage &Im2, const DImage &vx, const DImage &vy)
 118 | {
 119 | 	if(warpIm2.matchDimension(Im2)==false)
 120 | 		warpIm2.allocate(Im2.width(),Im2.height(),Im2.nchannels());
 121 | 	ImageProcessing::warpImage(warpIm2.data(),Im1.data(),Im2.data(),vx.data(),vy.data(),Im2.width(),Im2.height(),Im2.nchannels());
 122 | }
 123 | 
 124 | void OpticalFlow::warpFL(DImage &warpIm2, const DImage &Im1, const DImage &Im2, const DImage &Flow)
 125 | {
 126 | 	if(warpIm2.matchDimension(Im2)==false)
 127 | 		warpIm2.allocate(Im2.width(),Im2.height(),Im2.nchannels());
 128 | 	ImageProcessing::warpImageFlow(warpIm2.data(),Im1.data(),Im2.data(),Flow.data(),Im2.width(),Im2.height(),Im2.nchannels());
 129 | }
 130 | 
 131 | 
 132 | //--------------------------------------------------------------------------------------------------------
 133 | // function to generate mask of the pixels that move inside the image boundary
 134 | //--------------------------------------------------------------------------------------------------------
 135 | void OpticalFlow::genInImageMask(DImage &mask, const DImage &vx, const DImage &vy,int interval)
 136 | {
 137 | 	int imWidth,imHeight;
 138 | 	imWidth=vx.width();
 139 | 	imHeight=vx.height();
 140 | 	if(mask.matchDimension(vx)==false)
 141 | 		mask.allocate(imWidth,imHeight);
 142 | 	const _FlowPrecision *pVx,*pVy;
 143 | 	_FlowPrecision *pMask;
 144 | 	pVx=vx.data();
 145 | 	pVy=vy.data();
 146 | 	mask.reset();
 147 | 	pMask=mask.data();
 148 | 	double x,y;
 149 | 	for(int i=0;i<imHeight;i++)
 150 | 		for(int j=0;j<imWidth;j++)
 151 | 		{
 152 | 			int offset=i*imWidth+j;
 153 | 			y=i+pVx[offset];
 154 | 			x=j+pVy[offset];
 155 | 			if(x<interval  || x>imWidth-1-interval || y<interval || y>imHeight-1-interval)
 156 | 				continue;
 157 | 			pMask[offset]=1;
 158 | 		}
 159 | }
 160 | 
 161 | void OpticalFlow::genInImageMask(DImage &mask, const DImage &flow,int interval)
 162 | {
 163 | 	int imWidth,imHeight;
 164 | 	imWidth=flow.width();
 165 | 	imHeight=flow.height();
 166 | 	if(mask.matchDimension(flow.width(),flow.height(),1)==false)
 167 | 		mask.allocate(imWidth,imHeight);
 168 | 	else
 169 | 		mask.reset();
 170 | 
 171 | 	const _FlowPrecision *pFlow;
 172 | 	_FlowPrecision *pMask;
 173 | 	pFlow = flow.data();;
 174 | 	pMask=mask.data();
 175 | 	double x,y;
 176 | 	for(int i=0;i<imHeight;i++)
 177 | 		for(int j=0;j<imWidth;j++)
 178 | 		{
 179 | 			int offset=i*imWidth+j;
 180 | 			y=i+pFlow[offset*2+1];
 181 | 			x=j+pFlow[offset*2];
 182 | 			if(x<interval  || x>imWidth-1-interval || y<interval || y>imHeight-1-interval)
 183 | 				continue;
 184 | 			pMask[offset]=1;
 185 | 		}
 186 | }
 187 | 
 188 | //--------------------------------------------------------------------------------------------------------
 189 | // function to compute optical flow field using two fixed point iterations
 190 | // Input arguments:
 191 | //     Im1, Im2:						frame 1 and frame 2
 192 | //	warpIm2:						the warped frame 2 according to the current flow field u and v
 193 | //	u,v:									the current flow field, NOTICE that they are also output arguments
 194 | //
 195 | //--------------------------------------------------------------------------------------------------------
 196 | void OpticalFlow::SmoothFlowSOR(const DImage &Im1, const DImage &Im2, DImage &warpIm2, DImage &u, DImage &v,
 197 | 																    double alpha, int nOuterFPIterations, int nInnerFPIterations, int nSORIterations)
 198 | {
 199 | 	DImage mask,imdx,imdy,imdt;
 200 | 	int imWidth,imHeight,nChannels,nPixels;
 201 | 	imWidth=Im1.width();
 202 | 	imHeight=Im1.height();
 203 | 	nChannels=Im1.nchannels();
 204 | 	nPixels=imWidth*imHeight;
 205 | 
 206 | 	DImage du(imWidth,imHeight),dv(imWidth,imHeight);
 207 | 	DImage uu(imWidth,imHeight),vv(imWidth,imHeight);
 208 | 	DImage ux(imWidth,imHeight),uy(imWidth,imHeight);
 209 | 	DImage vx(imWidth,imHeight),vy(imWidth,imHeight);
 210 | 	DImage Phi_1st(imWidth,imHeight);
 211 | 	DImage Psi_1st(imWidth,imHeight,nChannels);
 212 | 
 213 | 	DImage imdxy,imdx2,imdy2,imdtdx,imdtdy;
 214 | 	DImage ImDxy,ImDx2,ImDy2,ImDtDx,ImDtDy;
 215 | 	DImage foo1,foo2;
 216 | 
 217 | 	double prob1,prob2,prob11,prob22;
 218 | 
 219 | 	double varepsilon_phi=pow(0.001,2);
 220 | 	double varepsilon_psi=pow(0.001,2);
 221 | 
 222 | 	//--------------------------------------------------------------------------
 223 | 	// the outer fixed point iteration
 224 | 	//--------------------------------------------------------------------------
 225 | 	for(int count=0;count<nOuterFPIterations;count++)
 226 | 	{
 227 | 		// compute the gradient
 228 | 		getDxs(imdx,imdy,imdt,Im1,warpIm2);
 229 | 
 230 | 		// generate the mask to set the weight of the pixels moving outside of the image boundary to be zero
 231 | 		genInImageMask(mask,u,v);
 232 | 
 233 | 		// set the derivative of the flow field to be zero
 234 | 		du.reset();
 235 | 		dv.reset();
 236 | 
 237 | 		//--------------------------------------------------------------------------
 238 | 		// the inner fixed point iteration
 239 | 		//--------------------------------------------------------------------------
 240 | 		for(int hh=0;hh<nInnerFPIterations;hh++)
 241 | 		{
 242 | 			// compute the derivatives of the current flow field
 243 | 			if(hh==0)
 244 | 			{
 245 | 				uu.copyData(u);
 246 | 				vv.copyData(v);
 247 | 			}
 248 | 			else
 249 | 			{
 250 | 				uu.Add(u,du);
 251 | 				vv.Add(v,dv);
 252 | 			}
 253 | 			uu.dx(ux);
 254 | 			uu.dy(uy);
 255 | 			vv.dx(vx);
 256 | 			vv.dy(vy);
 257 | 
 258 | 			// compute the weight of phi
 259 | 			Phi_1st.reset();
 260 | 			_FlowPrecision* phiData=Phi_1st.data();
 261 | 			double temp;
 262 | 			const _FlowPrecision *uxData,*uyData,*vxData,*vyData;
 263 | 			uxData=ux.data();
 264 | 			uyData=uy.data();
 265 | 			vxData=vx.data();
 266 | 			vyData=vy.data();
 267 | 			double power_alpha = 0.5;
 268 | 			for(int i=0;i<nPixels;i++)
 269 | 			{
 270 | 				temp=uxData[i]*uxData[i]+uyData[i]*uyData[i]+vxData[i]*vxData[i]+vyData[i]*vyData[i];
 271 | 				//phiData[i]=power_alpha*pow(temp+varepsilon_phi,power_alpha-1);
 272 | 				phiData[i] = 0.5/sqrt(temp+varepsilon_phi);
 273 | 				//phiData[i] = 1/(power_alpha+temp);
 274 | 			}
 275 | 
 276 | 			// compute the nonlinear term of psi
 277 | 			Psi_1st.reset();
 278 | 			_FlowPrecision* psiData=Psi_1st.data();
 279 | 			const _FlowPrecision *imdxData,*imdyData,*imdtData;
 280 | 			const _FlowPrecision *duData,*dvData;
 281 | 			imdxData=imdx.data();
 282 | 			imdyData=imdy.data();
 283 | 			imdtData=imdt.data();
 284 | 			duData=du.data();
 285 | 			dvData=dv.data();
 286 | 
 287 | 			double _a  = 10000, _b = 0.1;
 288 | 			if(nChannels==1)
 289 | 				for(int i=0;i<nPixels;i++)
 290 | 				{
 291 | 					temp=imdtData[i]+imdxData[i]*duData[i]+imdyData[i]*dvData[i];
 292 | 					//if(temp*temp<0.04)
 293 | 					// psiData[i]=1/(2*sqrt(temp*temp+varepsilon_psi));
 294 | 					//psiData[i] = _a*_b/(1+_a*temp*temp);
 295 | 
 296 | 					// the following code is for log Gaussian mixture probability model
 297 | 					temp *= temp;
 298 | 					switch(noiseModel)
 299 | 					{
 300 | 					case GMixture:
 301 | 						prob1 = GMPara.Gaussian(temp,0,0)*GMPara.alpha[0];
 302 | 						prob2 = GMPara.Gaussian(temp,1,0)*(1-GMPara.alpha[0]);
 303 | 						prob11 = prob1/(2*GMPara.sigma_square[0]);
 304 | 						prob22 = prob2/(2*GMPara.beta_square[0]);
 305 | 						psiData[i] = (prob11+prob22)/(prob1+prob2);
 306 | 						break;
 307 | 					case Lap:
 308 | 						if(LapPara[0]<1E-20)
 309 | 							continue;
 310 | 						//psiData[i]=1/(2*sqrt(temp+varepsilon_psi)*LapPara[0]);
 311 |                         psiData[i]=1/(2*sqrt(temp+varepsilon_psi));
 312 | 						break;
 313 | 					}
 314 | 				}
 315 | 			else
 316 | 				for(int i=0;i<nPixels;i++)
 317 | 					for(int k=0;k<nChannels;k++)
 318 | 					{
 319 | 						int offset=i*nChannels+k;
 320 | 						temp=imdtData[offset]+imdxData[offset]*duData[i]+imdyData[offset]*dvData[i];
 321 | 						//if(temp*temp<0.04)
 322 | 						 // psiData[offset]=1/(2*sqrt(temp*temp+varepsilon_psi));
 323 | 						//psiData[offset] =  _a*_b/(1+_a*temp*temp);
 324 | 						temp *= temp;
 325 | 						switch(noiseModel)
 326 | 						{
 327 | 						case GMixture:
 328 | 							prob1 = GMPara.Gaussian(temp,0,k)*GMPara.alpha[k];
 329 | 							prob2 = GMPara.Gaussian(temp,1,k)*(1-GMPara.alpha[k]);
 330 | 							prob11 = prob1/(2*GMPara.sigma_square[k]);
 331 | 							prob22 = prob2/(2*GMPara.beta_square[k]);
 332 | 							psiData[offset] = (prob11+prob22)/(prob1+prob2);
 333 | 							break;
 334 | 						case Lap:
 335 | 							if(LapPara[k]<1E-20)
 336 | 								continue;
 337 | 							//psiData[offset]=1/(2*sqrt(temp+varepsilon_psi)*LapPara[k]);
 338 |                             psiData[offset]=1/(2*sqrt(temp+varepsilon_psi));
 339 | 							break;
 340 | 						}
 341 | 					}
 342 | 			// prepare the components of the large linear system
 343 | 			ImDxy.Multiply(Psi_1st,imdx,imdy);
 344 | 			ImDx2.Multiply(Psi_1st,imdx,imdx);
 345 | 			ImDy2.Multiply(Psi_1st,imdy,imdy);
 346 | 			ImDtDx.Multiply(Psi_1st,imdx,imdt);
 347 | 			ImDtDy.Multiply(Psi_1st,imdy,imdt);
 348 | 
 349 | 			if(nChannels>1)
 350 | 			{
 351 | 				ImDxy.collapse(imdxy);
 352 | 				ImDx2.collapse(imdx2);
 353 | 				ImDy2.collapse(imdy2);
 354 | 				ImDtDx.collapse(imdtdx);
 355 | 				ImDtDy.collapse(imdtdy);
 356 | 			}
 357 | 			else
 358 | 			{
 359 | 				imdxy.copyData(ImDxy);
 360 | 				imdx2.copyData(ImDx2);
 361 | 				imdy2.copyData(ImDy2);
 362 | 				imdtdx.copyData(ImDtDx);
 363 | 				imdtdy.copyData(ImDtDy);
 364 | 			}
 365 | 			// laplacian filtering of the current flow field
 366 | 		    Laplacian(foo1,u,Phi_1st);
 367 | 			Laplacian(foo2,v,Phi_1st);
 368 | 
 369 | 			for(int i=0;i<nPixels;i++)
 370 | 			{
 371 | 				imdtdx.data()[i] = -imdtdx.data()[i]-alpha*foo1.data()[i];
 372 | 				imdtdy.data()[i] = -imdtdy.data()[i]-alpha*foo2.data()[i];
 373 | 			}
 374 | 
 375 | 			// here we start SOR
 376 | 
 377 | 			// set omega
 378 | 			double omega = 1.8;
 379 | 
 380 | 			du.reset();
 381 | 			dv.reset();
 382 | 
 383 | 			for(int k = 0; k<nSORIterations; k++)
 384 | 				for(int i = 0; i<imHeight; i++)
 385 | 					for(int j = 0; j<imWidth; j++)
 386 | 					{
 387 | 						int offset = i * imWidth+j;
 388 | 						double sigma1 = 0, sigma2 = 0, coeff = 0;
 389 |                         double _weight;
 390 | 
 391 | 
 392 | 						if(j>0)
 393 | 						{
 394 |                             _weight = phiData[offset-1];
 395 | 							sigma1  += _weight*du.data()[offset-1];
 396 | 							sigma2  += _weight*dv.data()[offset-1];
 397 | 							coeff   += _weight;
 398 | 						}
 399 | 						if(j<imWidth-1)
 400 | 						{
 401 |                             _weight = phiData[offset];
 402 | 							sigma1 += _weight*du.data()[offset+1];
 403 | 							sigma2 += _weight*dv.data()[offset+1];
 404 | 							coeff   += _weight;
 405 | 						}
 406 | 						if(i>0)
 407 | 						{
 408 |                             _weight = phiData[offset-imWidth];
 409 | 							sigma1 += _weight*du.data()[offset-imWidth];
 410 | 							sigma2 += _weight*dv.data()[offset-imWidth];
 411 | 							coeff   += _weight;
 412 | 						}
 413 | 						if(i<imHeight-1)
 414 | 						{
 415 |                             _weight = phiData[offset];
 416 | 							sigma1  += _weight*du.data()[offset+imWidth];
 417 | 							sigma2  += _weight*dv.data()[offset+imWidth];
 418 | 							coeff   += _weight;
 419 | 						}
 420 | 						sigma1 *= -alpha;
 421 | 						sigma2 *= -alpha;
 422 | 						coeff *= alpha;
 423 | 						 // compute du
 424 | 						sigma1 += imdxy.data()[offset]*dv.data()[offset];
 425 | 						du.data()[offset] = (1-omega)*du.data()[offset] + omega/(imdx2.data()[offset] + alpha*0.05 + coeff)*(imdtdx.data()[offset] - sigma1);
 426 | 						// compute dv
 427 | 						sigma2 += imdxy.data()[offset]*du.data()[offset];
 428 | 						dv.data()[offset] = (1-omega)*dv.data()[offset] + omega/(imdy2.data()[offset] + alpha*0.05 + coeff)*(imdtdy.data()[offset] - sigma2);
 429 | 					}
 430 | 		}
 431 | 		u.Add(du);
 432 | 		v.Add(dv);
 433 | 		if(interpolation == Bilinear)
 434 | 			warpFL(warpIm2,Im1,Im2,u,v);
 435 | 		else
 436 | 		{
 437 | 			Im2.warpImageBicubicRef(Im1,warpIm2,u,v);
 438 | 			warpIm2.threshold();
 439 | 		}
 440 | 
 441 | 		//Im2.warpImageBicubicRef(Im1,warpIm2,BicubicCoeff,u,v);
 442 | 
 443 | 		// estimate noise level
 444 | 		switch(noiseModel)
 445 | 		{
 446 | 		case GMixture:
 447 | 			estGaussianMixture(Im1,warpIm2,GMPara);
 448 | 			break;
 449 | 		case Lap:
 450 | 			estLaplacianNoise(Im1,warpIm2,LapPara);
 451 | 		}
 452 | 	}
 453 | 
 454 | }
 455 | 
 456 | 
 457 | 
 458 | //--------------------------------------------------------------------------------------------------------
 459 | // function to compute optical flow field using two fixed point iterations
 460 | // Input arguments:
 461 | //     Im1, Im2:						frame 1 and frame 2
 462 | //	warpIm2:						the warped frame 2 according to the current flow field u and v
 463 | //	u,v:									the current flow field, NOTICE that they are also output arguments
 464 | //
 465 | //--------------------------------------------------------------------------------------------------------
 466 | void OpticalFlow::SmoothFlowPDE(const DImage &Im1, const DImage &Im2, DImage &warpIm2, DImage &u, DImage &v,
 467 | 																    double alpha, int nOuterFPIterations, int nInnerFPIterations, int nCGIterations)
 468 | {
 469 | 	DImage mask,imdx,imdy,imdt;
 470 | 	int imWidth,imHeight,nChannels,nPixels;
 471 | 	imWidth=Im1.width();
 472 | 	imHeight=Im1.height();
 473 | 	nChannels=Im1.nchannels();
 474 | 	nPixels=imWidth*imHeight;
 475 | 
 476 | 	DImage du(imWidth,imHeight),dv(imWidth,imHeight);
 477 | 	DImage uu(imWidth,imHeight),vv(imWidth,imHeight);
 478 | 	DImage ux(imWidth,imHeight),uy(imWidth,imHeight);
 479 | 	DImage vx(imWidth,imHeight),vy(imWidth,imHeight);
 480 | 	DImage Phi_1st(imWidth,imHeight);
 481 | 	DImage Psi_1st(imWidth,imHeight,nChannels);
 482 | 
 483 | 	DImage imdxy,imdx2,imdy2,imdtdx,imdtdy;
 484 | 	DImage ImDxy,ImDx2,ImDy2,ImDtDx,ImDtDy;
 485 | 	DImage A11,A12,A22,b1,b2;
 486 | 	DImage foo1,foo2;
 487 | 
 488 | 	// compute bicubic interpolation coeff
 489 | 	//DImage BicubicCoeff;
 490 | 	//Im2.warpImageBicubicCoeff(BicubicCoeff);
 491 | 	double prob1,prob2,prob11,prob22;
 492 | 	// variables for conjugate gradient
 493 | 	DImage r1,r2,p1,p2,q1,q2;
 494 | 	double* rou;
 495 | 	rou=new double[nCGIterations];
 496 | 
 497 | 	double varepsilon_phi=pow(0.001,2);
 498 | 	double varepsilon_psi=pow(0.001,2);
 499 | 
 500 | 	//--------------------------------------------------------------------------
 501 | 	// the outer fixed point iteration
 502 | 	//--------------------------------------------------------------------------
 503 | 	for(int count=0;count<nOuterFPIterations;count++)
 504 | 	{
 505 | 		// compute the gradient
 506 | 		getDxs(imdx,imdy,imdt,Im1,warpIm2);
 507 | 
 508 | 		// generate the mask to set the weight of the pxiels moving outside of the image boundary to be zero
 509 | 		genInImageMask(mask,u,v);
 510 | 
 511 | 		// set the derivative of the flow field to be zero
 512 | 		du.reset();
 513 | 		dv.reset();
 514 | 
 515 | 		//--------------------------------------------------------------------------
 516 | 		// the inner fixed point iteration
 517 | 		//--------------------------------------------------------------------------
 518 | 		for(int hh=0;hh<nInnerFPIterations;hh++)
 519 | 		{
 520 | 			// compute the derivatives of the current flow field
 521 | 			if(hh==0)
 522 | 			{
 523 | 				uu.copyData(u);
 524 | 				vv.copyData(v);
 525 | 			}
 526 | 			else
 527 | 			{
 528 | 				uu.Add(u,du);
 529 | 				vv.Add(v,dv);
 530 | 			}
 531 | 			uu.dx(ux);
 532 | 			uu.dy(uy);
 533 | 			vv.dx(vx);
 534 | 			vv.dy(vy);
 535 | 
 536 | 			// compute the weight of phi
 537 | 			Phi_1st.reset();
 538 | 			_FlowPrecision* phiData=Phi_1st.data();
 539 | 			_FlowPrecision temp;
 540 | 			const _FlowPrecision *uxData,*uyData,*vxData,*vyData;
 541 | 			uxData=ux.data();
 542 | 			uyData=uy.data();
 543 | 			vxData=vx.data();
 544 | 			vyData=vy.data();
 545 | 			double power_alpha = 0.5;
 546 | 			for(int i=0;i<nPixels;i++)
 547 | 			{
 548 | 				temp=uxData[i]*uxData[i]+uyData[i]*uyData[i]+vxData[i]*vxData[i]+vyData[i]*vyData[i];
 549 | 				//phiData[i]=power_alpha*pow(temp+varepsilon_phi,power_alpha-1);
 550 | 				phiData[i] = 0.5/sqrt(temp+varepsilon_phi);
 551 | 				//phiData[i] = 1/(power_alpha+temp);
 552 | 			}
 553 | 
 554 | 			// compute the nonlinear term of psi
 555 | 			Psi_1st.reset();
 556 | 			_FlowPrecision* psiData=Psi_1st.data();
 557 | 			const _FlowPrecision *imdxData,*imdyData,*imdtData;
 558 | 			const _FlowPrecision *duData,*dvData;
 559 | 			imdxData=imdx.data();
 560 | 			imdyData=imdy.data();
 561 | 			imdtData=imdt.data();
 562 | 			duData=du.data();
 563 | 			dvData=dv.data();
 564 | 
 565 | 			double _a  = 10000, _b = 0.1;
 566 | 			if(nChannels==1)
 567 | 				for(int i=0;i<nPixels;i++)
 568 | 				{
 569 | 					temp=imdtData[i]+imdxData[i]*duData[i]+imdyData[i]*dvData[i];
 570 | 					//if(temp*temp<0.04)
 571 | 					// psiData[i]=1/(2*sqrt(temp*temp+varepsilon_psi));
 572 | 					//psiData[i] = _a*_b/(1+_a*temp*temp);
 573 | 
 574 | 					// the following code is for log Gaussian mixture probability model
 575 | 					temp *= temp;
 576 | 					switch(noiseModel)
 577 | 					{
 578 | 					case GMixture:
 579 | 						prob1 = GMPara.Gaussian(temp,0,0)*GMPara.alpha[0];
 580 | 						prob2 = GMPara.Gaussian(temp,1,0)*(1-GMPara.alpha[0]);
 581 | 						prob11 = prob1/(2*GMPara.sigma_square[0]);
 582 | 						prob22 = prob2/(2*GMPara.beta_square[0]);
 583 | 						psiData[i] = (prob11+prob22)/(prob1+prob2);
 584 | 						break;
 585 | 					case Lap:
 586 | 						if(LapPara[0]<1E-20)
 587 | 							continue;
 588 | 						psiData[i]=1/(2*sqrt(temp+varepsilon_psi)*LapPara[0]);
 589 | 						break;
 590 | 					}
 591 | 				}
 592 | 			else
 593 | 				for(int i=0;i<nPixels;i++)
 594 | 					for(int k=0;k<nChannels;k++)
 595 | 					{
 596 | 						int offset=i*nChannels+k;
 597 | 						temp=imdtData[offset]+imdxData[offset]*duData[i]+imdyData[offset]*dvData[i];
 598 | 						//if(temp*temp<0.04)
 599 | 						 // psiData[offset]=1/(2*sqrt(temp*temp+varepsilon_psi));
 600 | 						//psiData[offset] =  _a*_b/(1+_a*temp*temp);
 601 | 						temp *= temp;
 602 | 						switch(noiseModel)
 603 | 						{
 604 | 						case GMixture:
 605 | 							prob1 = GMPara.Gaussian(temp,0,k)*GMPara.alpha[k];
 606 | 							prob2 = GMPara.Gaussian(temp,1,k)*(1-GMPara.alpha[k]);
 607 | 							prob11 = prob1/(2*GMPara.sigma_square[k]);
 608 | 							prob22 = prob2/(2*GMPara.beta_square[k]);
 609 | 							psiData[offset] = (prob11+prob22)/(prob1+prob2);
 610 | 							break;
 611 | 						case Lap:
 612 | 							if(LapPara[k]<1E-20)
 613 | 								continue;
 614 | 							psiData[offset]=1/(2*sqrt(temp+varepsilon_psi)*LapPara[k]);
 615 | 							break;
 616 | 						}
 617 | 					}
 618 | 
 619 | 			// prepare the components of the large linear system
 620 | 			ImDxy.Multiply(Psi_1st,imdx,imdy);
 621 | 			ImDx2.Multiply(Psi_1st,imdx,imdx);
 622 | 			ImDy2.Multiply(Psi_1st,imdy,imdy);
 623 | 			ImDtDx.Multiply(Psi_1st,imdx,imdt);
 624 | 			ImDtDy.Multiply(Psi_1st,imdy,imdt);
 625 | 
 626 | 			if(nChannels>1)
 627 | 			{
 628 | 				ImDxy.collapse(imdxy);
 629 | 				ImDx2.collapse(imdx2);
 630 | 				ImDy2.collapse(imdy2);
 631 | 				ImDtDx.collapse(imdtdx);
 632 | 				ImDtDy.collapse(imdtdy);
 633 | 			}
 634 | 			else
 635 | 			{
 636 | 				imdxy.copyData(ImDxy);
 637 | 				imdx2.copyData(ImDx2);
 638 | 				imdy2.copyData(ImDy2);
 639 | 				imdtdx.copyData(ImDtDx);
 640 | 				imdtdy.copyData(ImDtDy);
 641 | 			}
 642 | 
 643 | 			// filtering
 644 | 			//imdx2.smoothing(A11,3);
 645 | 			//imdxy.smoothing(A12,3);
 646 | 			//imdy2.smoothing(A22,3);
 647 | 			A11.copyData(imdx2);
 648 | 			A12.copyData(imdxy);
 649 | 			A22.copyData(imdy2);
 650 | 
 651 | 			// add epsilon to A11 and A22
 652 | 			A11.Add(alpha*0.5);
 653 | 			A22.Add(alpha*0.5);
 654 | 
 655 | 			// form b
 656 | 			//imdtdx.smoothing(b1,3);
 657 | 			//imdtdy.smoothing(b2,3);
 658 | 			b1.copyData(imdtdx);
 659 | 			b2.copyData(imdtdy);
 660 | 
 661 | 			// laplacian filtering of the current flow field
 662 | 		    Laplacian(foo1,u,Phi_1st);
 663 | 			Laplacian(foo2,v,Phi_1st);
 664 | 			_FlowPrecision *b1Data,*b2Data;
 665 | 			const _FlowPrecision *foo1Data,*foo2Data;
 666 | 			b1Data=b1.data();
 667 | 			b2Data=b2.data();
 668 | 			foo1Data=foo1.data();
 669 | 			foo2Data=foo2.data();
 670 | 
 671 | 			for(int i=0;i<nPixels;i++)
 672 | 			{
 673 | 				b1Data[i]=-b1Data[i]-alpha*foo1Data[i];
 674 | 				b2Data[i]=-b2Data[i]-alpha*foo2Data[i];
 675 | 			}
 676 | 
 677 | 			// for debug only, displaying the matrix coefficients
 678 | 			//A11.imwrite("A11.bmp",ImageIO::normalized);
 679 | 			//A12.imwrite("A12.bmp",ImageIO::normalized);
 680 | 			//A22.imwrite("A22.bmp",ImageIO::normalized);
 681 | 			//b1.imwrite("b1.bmp",ImageIO::normalized);
 682 | 			//b2.imwrite("b2.bmp",ImageIO::normalized);
 683 | 
 684 | 			//-----------------------------------------------------------------------
 685 | 			// conjugate gradient algorithm
 686 | 			//-----------------------------------------------------------------------
 687 | 			r1.copyData(b1);
 688 | 			r2.copyData(b2);
 689 | 			du.reset();
 690 | 			dv.reset();
 691 | 
 692 | 			for(int k=0;k<nCGIterations;k++)
 693 | 			{
 694 | 				rou[k]=r1.norm2()+r2.norm2();
 695 | 				//cout<<rou[k]<<endl;
 696 | 				if(rou[k]<1E-10)
 697 | 					break;
 698 | 				if(k==0)
 699 | 				{
 700 | 					p1.copyData(r1);
 701 | 					p2.copyData(r2);
 702 | 				}
 703 | 				else
 704 | 				{
 705 | 					double ratio=rou[k]/rou[k-1];
 706 | 					p1.Add(r1,p1,ratio);
 707 | 					p2.Add(r2,p2,ratio);
 708 | 				}
 709 | 				// go through the large linear system
 710 | 				foo1.Multiply(A11,p1);
 711 | 				foo2.Multiply(A12,p2);
 712 | 				q1.Add(foo1,foo2);
 713 | 				Laplacian(foo1,p1,Phi_1st);
 714 | 				q1.Add(foo1,alpha);
 715 | 
 716 | 				foo1.Multiply(A12,p1);
 717 | 				foo2.Multiply(A22,p2);
 718 | 				q2.Add(foo1,foo2);
 719 | 				Laplacian(foo2,p2,Phi_1st);
 720 | 				q2.Add(foo2,alpha);
 721 | 
 722 | 				double beta;
 723 | 				beta=rou[k]/(p1.innerproduct(q1)+p2.innerproduct(q2));
 724 | 
 725 | 				du.Add(p1,beta);
 726 | 				dv.Add(p2,beta);
 727 | 
 728 | 				r1.Add(q1,-beta);
 729 | 				r2.Add(q2,-beta);
 730 | 			}
 731 | 			//-----------------------------------------------------------------------
 732 | 			// end of conjugate gradient algorithm
 733 | 			//-----------------------------------------------------------------------
 734 | 		}// end of inner fixed point iteration
 735 | 
 736 | 		// the following procedure is merely for debugging
 737 | 		//cout<<"du "<<du.norm2()<<" dv "<<dv.norm2()<<endl;
 738 | 		// update the flow field
 739 | 		u.Add(du,1);
 740 | 		v.Add(dv,1);
 741 | 		if(interpolation == Bilinear)
 742 | 			warpFL(warpIm2,Im1,Im2,u,v);
 743 | 		else
 744 | 		{
 745 | 			Im2.warpImageBicubicRef(Im1,warpIm2,u,v);
 746 | 			warpIm2.threshold();
 747 | 		}
 748 | 
 749 | 		//Im2.warpImageBicubicRef(Im1,warpIm2,BicubicCoeff,u,v);
 750 | 
 751 | 		// estimate noise level
 752 | 		switch(noiseModel)
 753 | 		{
 754 | 		case GMixture:
 755 | 			estGaussianMixture(Im1,warpIm2,GMPara);
 756 | 			break;
 757 | 		case Lap:
 758 | 			estLaplacianNoise(Im1,warpIm2,LapPara);
 759 | 		}
 760 | 
 761 | 	}// end of outer fixed point iteration
 762 | 	delete rou;
 763 | }
 764 | 
 765 | void OpticalFlow::estGaussianMixture(const DImage& Im1,const DImage& Im2,GaussianMixture& para,double prior)
 766 | {
 767 | 	int nIterations = 3, nChannels = Im1.nchannels();
 768 | 	DImage weight1(Im1),weight2(Im1);
 769 | 	double *total1,*total2;
 770 | 	total1 = new double[nChannels];
 771 | 	total2 = new double[nChannels];
 772 | 	for(int count = 0; count<nIterations; count++)
 773 | 	{
 774 | 		double temp;
 775 | 		memset(total1,0,sizeof(double)*nChannels);
 776 | 		memset(total2,0,sizeof(double)*nChannels);
 777 | 
 778 | 		// E step
 779 | 		for(int i = 0;i<weight1.npixels();i++)
 780 | 			for(int k=0;k<nChannels;k++)
 781 | 			{
 782 | 				int offset = i*weight1.nchannels()+k;
 783 | 				temp = Im1[offset]-Im2[offset];
 784 | 				temp *= temp;
 785 | 				weight1[offset] = para.Gaussian(temp,0,k)*para.alpha[k];
 786 | 				weight2[offset] = para.Gaussian(temp,1,k)*(1-para.alpha[k]);
 787 | 				temp = weight1[offset]+weight2[offset];
 788 | 				weight1[offset]/=temp;
 789 | 				weight2[offset]/=temp;
 790 | 				total1[k] += weight1[offset];
 791 | 				total2[k] += weight2[offset];
 792 | 			}
 793 | 
 794 | 		// M step
 795 | 		para.reset();
 796 | 
 797 | 
 798 | 		for(int i = 0;i<weight1.npixels();i++)
 799 | 			for(int k =0;k<nChannels;k++)
 800 | 			{
 801 | 				int offset = i*weight1.nchannels()+k;
 802 | 				temp = Im1[offset]-Im2[offset];
 803 | 				temp *= temp;
 804 | 				para.sigma[k]+= weight1[offset]*temp;
 805 | 				para.beta[k] += weight2[offset]*temp;
 806 | 			}
 807 | 
 808 | 		for(int k =0;k<nChannels;k++)
 809 | 		{
 810 | 			para.alpha[k] = total1[k]/(total1[k]+total2[k])*(1-prior)+0.95*prior; // regularize alpha
 811 | 			para.sigma[k] = sqrt(para.sigma[k]/total1[k]);
 812 | 			para.beta[k]   = sqrt(para.beta[k]/total2[k])*(1-prior)+0.3*prior; // regularize beta
 813 | 		}
 814 | 		para.square();
 815 | 		count = count;
 816 | 	}
 817 | }
 818 | 
 819 | void OpticalFlow::estLaplacianNoise(const DImage& Im1,const DImage& Im2,Vector<double>& para)
 820 | {
 821 | 	int nChannels = Im1.nchannels();
 822 | 	if(para.dim()!=nChannels)
 823 | 		para.allocate(nChannels);
 824 | 	else
 825 | 		para.reset();
 826 | 	double temp;
 827 | 	Vector<double> total(nChannels);
 828 | 	for(int k = 0;k<nChannels;k++)
 829 | 		total[k] = 0;
 830 | 
 831 | 	for(int i =0;i<Im1.npixels();i++)
 832 | 		for(int k = 0;k<nChannels;k++)
 833 | 		{
 834 | 			int offset = i*nChannels+k;
 835 | 			temp= fabs(Im1.data()[offset]-Im2.data()[offset]);
 836 | 			if(temp>0 && temp<1000000)
 837 | 			{
 838 | 				para[k] += temp;
 839 | 				total[k]++;
 840 | 			}
 841 | 		}
 842 | 	for(int k = 0;k<nChannels;k++)
 843 | 	{
 844 | 		if(total[k]==0)
 845 | 		{
 846 | 			cout<<"All the pixels are invalid in estimation Laplacian noise!!!"<<endl;
 847 | 			cout<<"Something severely wrong happened!!!"<<endl;
 848 | 			para[k] = 0.001;
 849 | 		}
 850 | 		else
 851 | 			para[k]/=total[k];
 852 | 	}
 853 | }
 854 | 
 855 | void OpticalFlow::Laplacian(DImage &output, const DImage &input, const DImage& weight)
 856 | {
 857 | 	if(output.matchDimension(input)==false)
 858 | 		output.allocate(input);
 859 | 	output.reset();
 860 | 
 861 | 	if(input.matchDimension(weight)==false)
 862 | 	{
 863 | 		cout<<"Error in image dimension matching OpticalFlow::Laplacian()!"<<endl;
 864 | 		return;
 865 | 	}
 866 | 
 867 | 	const _FlowPrecision *inputData=input.data(),*weightData=weight.data();
 868 | 	int width=input.width(),height=input.height();
 869 | 	DImage foo(width,height);
 870 | 	_FlowPrecision *fooData=foo.data(),*outputData=output.data();
 871 | 
 872 | 
 873 | 	// horizontal filtering
 874 | 	for(int i=0;i<height;i++)
 875 | 		for(int j=0;j<width-1;j++)
 876 | 		{
 877 | 			int offset=i*width+j;
 878 | 			fooData[offset]=(inputData[offset+1]-inputData[offset])*weightData[offset];
 879 | 		}
 880 | 	for(int i=0;i<height;i++)
 881 | 		for(int j=0;j<width;j++)
 882 | 		{
 883 | 			int offset=i*width+j;
 884 | 			if(j<width-1)
 885 | 				outputData[offset]-=fooData[offset];
 886 | 			if(j>0)
 887 | 				outputData[offset]+=fooData[offset-1];
 888 | 		}
 889 | 	foo.reset();
 890 | 	// vertical filtering
 891 | 	for(int i=0;i<height-1;i++)
 892 | 		for(int j=0;j<width;j++)
 893 | 		{
 894 | 			int offset=i*width+j;
 895 | 			fooData[offset]=(inputData[offset+width]-inputData[offset])*weightData[offset];
 896 | 		}
 897 | 	for(int i=0;i<height;i++)
 898 | 		for(int j=0;j<width;j++)
 899 | 		{
 900 | 			int offset=i*width+j;
 901 | 			if(i<height-1)
 902 | 				outputData[offset]-=fooData[offset];
 903 | 			if(i>0)
 904 | 				outputData[offset]+=fooData[offset-width];
 905 | 		}
 906 | }
 907 | 
 908 | void OpticalFlow::testLaplacian(int dim)
 909 | {
 910 | 	// generate the random weight
 911 | 	DImage weight(dim,dim);
 912 | 	for(int i=0;i<dim;i++)
 913 | 		for(int j=0;j<dim;j++)
 914 | 			//weight.data()[i*dim+j]=(double)rand()/RAND_MAX+1;
 915 | 			weight.data()[i*dim+j]=1;
 916 | 	// go through the linear system;
 917 | 	DImage sysMatrix(dim*dim,dim*dim);
 918 | 	DImage u(dim,dim),du(dim,dim);
 919 | 	for(int i=0;i<dim*dim;i++)
 920 | 	{
 921 | 		u.reset();
 922 | 		u.data()[i]=1;
 923 | 		Laplacian(du,u,weight);
 924 | 		for(int j=0;j<dim*dim;j++)
 925 | 			sysMatrix.data()[j*dim*dim+i]=du.data()[j];
 926 | 	}
 927 | 	// test whether the matrix is symmetric
 928 | 	for(int i=0;i<dim*dim;i++)
 929 | 	{
 930 | 		for(int j=0;j<dim*dim;j++)
 931 | 		{
 932 | 			if(sysMatrix.data()[i*dim*dim+j]>=0)
 933 | 				printf(" ");
 934 | 			printf(" %1.0f ",sysMatrix.data()[i*dim*dim+j]);
 935 | 		}
 936 | 		printf("\n");
 937 | 	}
 938 | }
 939 | 
 940 | //--------------------------------------------------------------------------------------
 941 | // function to perform coarse to fine optical flow estimation
 942 | //--------------------------------------------------------------------------------------
 943 | void OpticalFlow::Coarse2FineFlow(DImage &vx, DImage &vy, DImage &warpI2,const DImage &Im1, const DImage &Im2, double alpha, double ratio, int minWidth,
 944 | 																	 int nOuterFPIterations, int nInnerFPIterations, int nCGIterations)
 945 | {
 946 | 	// first build the pyramid of the two images
 947 | 	GaussianPyramid GPyramid1;
 948 | 	GaussianPyramid GPyramid2;
 949 | 	if(IsDisplay)
 950 | 		cout<<"Constructing pyramid...";
 951 | 	GPyramid1.ConstructPyramid(Im1,ratio,minWidth);
 952 | 	GPyramid2.ConstructPyramid(Im2,ratio,minWidth);
 953 | 	if(IsDisplay)
 954 | 		cout<<"done!"<<endl;
 955 | 
 956 | 	// now iterate from the top level to the bottom
 957 | 	DImage Image1,Image2,WarpImage2;
 958 | 	//GaussianMixture GMPara(Im1.nchannels()+2);
 959 | 
 960 | 	// initialize noise
 961 | 	switch(noiseModel){
 962 | 	case GMixture:
 963 | 		GMPara.reset(Im1.nchannels()+2);
 964 | 		break;
 965 | 	case Lap:
 966 | 		LapPara.allocate(Im1.nchannels()+2);
 967 | 		for(int i = 0;i<LapPara.dim();i++)
 968 | 			LapPara[i] = 0.02;
 969 | 		break;
 970 | 	}
 971 | 
 972 | 	for(int k=GPyramid1.nlevels()-1;k>=0;k--)
 973 | 	{
 974 | 		if(IsDisplay)
 975 | 			cout<<"Pyramid level "<<k;
 976 | 		int width=GPyramid1.Image(k).width();
 977 | 		int height=GPyramid1.Image(k).height();
 978 | 		im2feature(Image1,GPyramid1.Image(k));
 979 | 		im2feature(Image2,GPyramid2.Image(k));
 980 | 
 981 | 		if(k==GPyramid1.nlevels()-1) // if at the top level
 982 | 		{
 983 | 			vx.allocate(width,height);
 984 | 			vy.allocate(width,height);
 985 | 			//warpI2.copyData(Image2);
 986 | 			WarpImage2.copyData(Image2);
 987 | 		}
 988 | 		else
 989 | 		{
 990 | 
 991 | 			vx.imresize(width,height);
 992 | 			vx.Multiplywith(1/ratio);
 993 | 			vy.imresize(width,height);
 994 | 			vy.Multiplywith(1/ratio);
 995 | 			//warpFL(warpI2,GPyramid1.Image(k),GPyramid2.Image(k),vx,vy);
 996 | 			if(interpolation == Bilinear)
 997 | 				warpFL(WarpImage2,Image1,Image2,vx,vy);
 998 | 			else
 999 | 				Image2.warpImageBicubicRef(Image1,WarpImage2,vx,vy);
1000 | 		}
1001 | 		//SmoothFlowPDE(GPyramid1.Image(k),GPyramid2.Image(k),warpI2,vx,vy,alpha,nOuterFPIterations,nInnerFPIterations,nCGIterations);
1002 | 		//SmoothFlowPDE(Image1,Image2,WarpImage2,vx,vy,alpha*pow((1/ratio),k),nOuterFPIterations,nInnerFPIterations,nCGIterations,GMPara);
1003 | 
1004 | 		//SmoothFlowPDE(Image1,Image2,WarpImage2,vx,vy,alpha,nOuterFPIterations,nInnerFPIterations,nCGIterations);
1005 | 		SmoothFlowSOR(Image1,Image2,WarpImage2,vx,vy,alpha,nOuterFPIterations+k,nInnerFPIterations,nCGIterations+k*3);
1006 | 
1007 | 		//GMPara.display();
1008 | 		if(IsDisplay)
1009 | 			cout<<endl;
1010 | 	}
1011 | 	//warpFL(warpI2,Im1,Im2,vx,vy);
1012 | 	Im2.warpImageBicubicRef(Im1,warpI2,vx,vy);
1013 | 	warpI2.threshold();
1014 | }
1015 | 
1016 | void OpticalFlow::Coarse2FineFlowLevel(DImage &vx, DImage &vy, DImage &warpI2,const DImage &Im1, const DImage &Im2, double alpha, double ratio, int nLevels,
1017 | 																	 int nOuterFPIterations, int nInnerFPIterations, int nCGIterations)
1018 | {
1019 | 	// first build the pyramid of the two images
1020 | 	GaussianPyramid GPyramid1;
1021 | 	GaussianPyramid GPyramid2;
1022 | 	GaussianPyramid GFlow;
1023 | 	DImage flow;
1024 | 	AssembleFlow(vx,vy,flow);
1025 | 	if(IsDisplay)
1026 | 		cout<<"Constructing pyramid...";
1027 | 	GPyramid1.ConstructPyramidLevels(Im1,ratio,nLevels);
1028 | 	GPyramid2.ConstructPyramidLevels(Im2,ratio,nLevels);
1029 | 	GFlow.ConstructPyramidLevels(flow,ratio,nLevels);
1030 | 	flow= GFlow.Image(nLevels-1);
1031 | 	flow.Multiplywith(pow(ratio,nLevels-1));
1032 | 	DissembleFlow(flow,vx,vy);
1033 | 
1034 | 	if(IsDisplay)
1035 | 		cout<<"done!"<<endl;
1036 | 
1037 | 	// now iterate from the top level to the bottom
1038 | 	DImage Image1,Image2,WarpImage2;
1039 | 
1040 | 	// initialize noise
1041 | 	switch(noiseModel){
1042 | 	case GMixture:
1043 | 		GMPara.reset(Im1.nchannels()+2);
1044 | 		break;
1045 | 	case Lap:
1046 | 		LapPara.allocate(Im1.nchannels()+2);
1047 | 		for(int i = 0;i<LapPara.dim();i++)
1048 | 			LapPara[i] = 0.02;
1049 | 		break;
1050 | 	}
1051 | 
1052 | 
1053 | 	for(int k=GPyramid1.nlevels()-1;k>=0;k--)
1054 | 	{
1055 | 		if(IsDisplay)
1056 | 			cout<<"Pyramid level "<<k;
1057 | 		int width=GPyramid1.Image(k).width();
1058 | 		int height=GPyramid1.Image(k).height();
1059 | 		im2feature(Image1,GPyramid1.Image(k));
1060 | 		im2feature(Image2,GPyramid2.Image(k));
1061 | 
1062 | 		if(k<GPyramid1.nlevels()-1) // if at the top level
1063 | 		{
1064 | 			vx.imresize(width,height);
1065 | 			vx.Multiplywith(1/ratio);
1066 | 			vy.imresize(width,height);
1067 | 			vy.Multiplywith(1/ratio);
1068 | 		}
1069 | 		if(interpolation == Bilinear)
1070 | 			warpFL(WarpImage2,Image1,Image2,vx,vy);
1071 | 		else
1072 | 			Image2.warpImageBicubicRef(Image1,WarpImage2,vx,vy);
1073 | 		//SmoothFlowPDE(GPyramid1.Image(k),GPyramid2.Image(k),warpI2,vx,vy,alpha,nOuterFPIterations,nInnerFPIterations,nCGIterations);
1074 | 		//SmoothFlowPDE(Image1,Image2,WarpImage2,vx,vy,alpha*pow((1/ratio),k),nOuterFPIterations,nInnerFPIterations,nCGIterations,GMPara);
1075 | 
1076 | 		SmoothFlowPDE(Image1,Image2,WarpImage2,vx,vy,alpha,nOuterFPIterations,nInnerFPIterations,nCGIterations);
1077 | 		//GMPara.display();
1078 | 		if(IsDisplay)
1079 | 			cout<<endl;
1080 | 	}
1081 | 	//warpFL(warpI2,Im1,Im2,vx,vy);
1082 | 	Im2.warpImageBicubicRef(Im1,warpI2,vx,vy);
1083 | 	warpI2.threshold();
1084 | }
1085 | 
1086 | //---------------------------------------------------------------------------------------
1087 | // function to convert image to feature image
1088 | //---------------------------------------------------------------------------------------
1089 | void OpticalFlow::im2feature(DImage &imfeature, const DImage &im)
1090 | {
1091 | 	int width=im.width();
1092 | 	int height=im.height();
1093 | 	int nchannels=im.nchannels();
1094 | 	if(nchannels==1)
1095 | 	{
1096 | 		imfeature.allocate(im.width(),im.height(),3);
1097 | 		DImage imdx,imdy;
1098 | 		im.dx(imdx,true);
1099 | 		im.dy(imdy,true);
1100 | 		_FlowPrecision* data=imfeature.data();
1101 | 		for(int i=0;i<height;i++)
1102 | 			for(int j=0;j<width;j++)
1103 | 			{
1104 | 				int offset=i*width+j;
1105 | 				data[offset*3]=im.data()[offset];
1106 | 				data[offset*3+1]=imdx.data()[offset];
1107 | 				data[offset*3+2]=imdy.data()[offset];
1108 | 			}
1109 | 	}
1110 | 	else if(nchannels==3)
1111 | 	{
1112 | 		DImage grayImage;
1113 | 		im.desaturate(grayImage);
1114 | 
1115 | 		imfeature.allocate(im.width(),im.height(),5);
1116 | 		DImage imdx,imdy;
1117 | 		grayImage.dx(imdx,true);
1118 | 		grayImage.dy(imdy,true);
1119 | 		_FlowPrecision* data=imfeature.data();
1120 | 		for(int i=0;i<height;i++)
1121 | 			for(int j=0;j<width;j++)
1122 | 			{
1123 | 				int offset=i*width+j;
1124 | 				data[offset*5]=grayImage.data()[offset];
1125 | 				data[offset*5+1]=imdx.data()[offset];
1126 | 				data[offset*5+2]=imdy.data()[offset];
1127 | 				data[offset*5+3]=im.data()[offset*3+1]-im.data()[offset*3];
1128 | 				data[offset*5+4]=im.data()[offset*3+1]-im.data()[offset*3+2];
1129 | 			}
1130 | 	}
1131 | 	else
1132 | 		imfeature.copyData(im);
1133 | }
1134 | 
1135 | bool OpticalFlow::LoadOpticalFlow(const char* filename,DImage &flow)
1136 | {
1137 | 	Image<unsigned short int> foo;
1138 | 	if(foo.loadImage(filename) == false)
1139 | 		return false;
1140 | 	if(!flow.matchDimension(foo))
1141 | 		flow.allocate(foo);
1142 | 	for(int  i = 0;i<flow.npixels();i++)
1143 | 	{
1144 | 		flow.data()[i*2] = (double)foo.data()[i*2]/160-200;
1145 | 		flow.data()[i*2+1] = (double)foo.data()[i*2+1]/160-200;
1146 | 	}
1147 | 	return true;
1148 | }
1149 | 
1150 | bool OpticalFlow::LoadOpticalFlow(ifstream& myfile,DImage& flow)
1151 | {
1152 | 	Image<unsigned short int> foo;
1153 | 	if(foo.loadImage(myfile) == false)
1154 | 		return false;
1155 | 	if(!flow.matchDimension(foo))
1156 | 		flow.allocate(foo);
1157 | 	for(int  i = 0;i<flow.npixels();i++)
1158 | 	{
1159 | 		flow.data()[i*2] = (double)foo.data()[i*2]/160-200;
1160 | 		flow.data()[i*2+1] = (double)foo.data()[i*2+1]/160-200;
1161 | 	}
1162 | 	return true;
1163 | }
1164 | 
1165 | bool OpticalFlow::SaveOpticalFlow(const DImage& flow, const char* filename)
1166 | {
1167 | 	Image<unsigned short int> foo;
1168 | 	foo.allocate(flow);
1169 | 	for(int i =0;i<flow.npixels();i++)
1170 | 	{
1171 | 		foo.data()[i*2] = (__min(__max(flow.data()[i*2],-200),200)+200)*160;
1172 | 		foo.data()[i*2+1] = (__min(__max(flow.data()[i*2+1],-200),200)+200)*160;
1173 | 	}
1174 | 	return foo.saveImage(filename);
1175 | }
1176 | 
1177 | bool OpticalFlow::SaveOpticalFlow(const DImage& flow,ofstream& myfile)
1178 | {
1179 | 	Image<unsigned short int> foo;
1180 | 	foo.allocate(flow);
1181 | 	for(int i =0;i<flow.npixels();i++)
1182 | 	{
1183 | 		foo.data()[i*2] = (__min(__max(flow.data()[i*2],-200),200)+200)*160;
1184 | 		foo.data()[i*2+1] = (__min(__max(flow.data()[i*2+1],-200),200)+200)*160;
1185 | 	}
1186 | 	return foo.saveImage(myfile);
1187 | }
1188 | 
1189 | bool OpticalFlow::showFlow(const DImage& flow,const char* filename)
1190 | {
1191 | 	if(flow.nchannels()!=1)
1192 | 	{
1193 | 		cout<<"The flow must be a single channel image!"<<endl;
1194 | 		return false;
1195 | 	}
1196 | 	Image<unsigned char> foo;
1197 | 	foo.allocate(flow.width(),flow.height());
1198 | 	double Max = flow.max();
1199 | 	double Min = flow.min();
1200 | 	for(int i = 0;i<flow.npixels(); i++)
1201 | 		foo[i] = (flow[i]-Min)/(Max-Min)*255;
1202 |   // opencv support disabled. Can no longer write images.
1203 | 	// foo.imwrite(filename);
1204 |   return false;
1205 | }
1206 | 


--------------------------------------------------------------------------------
/src/OpticalFlow.h:
--------------------------------------------------------------------------------
  1 | // Author: Ce Liu (c) Dec, 2009; celiu@mit.edu
  2 | // Modified By: Deepak Pathak (c) 2016; pathak@berkeley.edu
  3 | 
  4 | #pragma once
  5 | 
  6 | #include "Image.h"
  7 | #include "NoiseModel.h"
  8 | #include "Vector.h"
  9 | #include <vector>
 10 | 
 11 | typedef double _FlowPrecision;
 12 | 
// Collection of static routines and static settings for optical flow
// estimation. Every member declared here is static; only the three
// assemble/dissemble/compute helpers at the bottom are defined inline, the
// rest are defined elsewhere.
class OpticalFlow
{
public:
	static bool IsDisplay;
public:
	// interpolation scheme selector (how it is consumed is not visible in this header)
	enum InterpolationMethod {Bilinear,Bicubic};
	static InterpolationMethod interpolation;
	// noise model selector: Gaussian mixture or Laplacian
	enum NoiseModel {GMixture,Lap};
	OpticalFlow(void);
	~OpticalFlow(void);
	// parameters of the two noise models and the currently selected model
	static GaussianMixture GMPara;
	static Vector<double> LapPara;
	static NoiseModel noiseModel;
public:
	static void getDxs(DImage& imdx,DImage& imdy,DImage& imdt,const DImage& im1,const DImage& im2);
	static void SanityCheck(const DImage& imdx,const DImage& imdy,const DImage& imdt,double du,double dv);
	// two overloads: flow given as separate vx/vy images, or as one combined flow image
	static void warpFL(DImage& warpIm2,const DImage& Im1,const DImage& Im2,const DImage& vx,const DImage& vy);
	static void warpFL(DImage& warpIm2,const DImage& Im1,const DImage& Im2,const DImage& flow);


	static void genConstFlow(DImage& flow,double value,int width,int height);
	static void genInImageMask(DImage& mask,const DImage& vx,const DImage& vy,int interval = 0);
	static void genInImageMask(DImage& mask,const DImage& flow,int interval =0 );
	static void SmoothFlowPDE(const DImage& Im1,const DImage& Im2, DImage& warpIm2,DImage& vx,DImage& vy,
														 double alpha,int nOuterFPIterations,int nInnerFPIterations,int nCGIterations);

	static void SmoothFlowSOR(const DImage& Im1,const DImage& Im2, DImage& warpIm2, DImage& vx, DImage& vy,
														 double alpha,int nOuterFPIterations,int nInnerFPIterations,int nSORIterations);

	static void estGaussianMixture(const DImage& Im1,const DImage& Im2,GaussianMixture& para,double prior = 0.9);
	static void estLaplacianNoise(const DImage& Im1,const DImage& Im2,Vector<double>& para);
	static void Laplacian(DImage& output,const DImage& input,const DImage& weight);
	static void testLaplacian(int dim=3);

	// function of coarse to fine optical flow
	static void Coarse2FineFlow(DImage& vx,DImage& vy,DImage &warpI2,const DImage& Im1,const DImage& Im2,double alpha,double ratio,int minWidth,
															int nOuterFPIterations,int nInnerFPIterations,int nCGIterations);

	static void Coarse2FineFlowLevel(DImage& vx,DImage& vy,DImage &warpI2,const DImage& Im1,const DImage& Im2,double alpha,double ratio,int nLevels,
															int nOuterFPIterations,int nInnerFPIterations,int nCGIterations);

	// function to convert image to features
	static void im2feature(DImage& imfeature,const DImage& im);

	// function to load optical flow
	static bool LoadOpticalFlow(const char* filename,DImage& flow);

	static bool LoadOpticalFlow(ifstream& myfile,DImage& flow);

	// functions to save optical flow, to a named file or to an open stream
	static bool SaveOpticalFlow(const DImage& flow, const char* filename);

	static bool SaveOpticalFlow(const DImage& flow,ofstream& myfile);

	static bool showFlow(const DImage& vx,const char* filename);

	// function to assemble and dissemble flows

	// Interleave vx and vy into one 2-channel image: flow[2*i] = vx[i],
	// flow[2*i+1] = vy[i]. flow is (re)allocated when its dimensions do not
	// already match vx. vy is read at the same indices as vx.
	// NOTE(review): vy is not checked against vx's size -- confirm callers guarantee it.
	static void AssembleFlow(const DImage& vx,const DImage& vy,DImage& flow)
	{
		if(!flow.matchDimension(vx.width(),vx.height(),2))
			flow.allocate(vx.width(),vx.height(),2);
		for(int i = 0;i<vx.npixels();i++)
		{
			flow.data()[i*2] = vx.data()[i];
			flow.data()[i*2+1] = vy.data()[i];
		}
	}
	// Inverse of AssembleFlow: split an interleaved flow image into vx and vy,
	// (re)allocating either output when its dimensions do not match flow.
	// NOTE(review): flow is indexed as two values per pixel but its channel
	// count is never checked -- confirm callers always pass a 2-channel image.
	static void DissembleFlow(const DImage& flow,DImage& vx,DImage& vy)
	{
		if(!vx.matchDimension(flow.width(),flow.height(),1))
			vx.allocate(flow.width(),flow.height());
		if(!vy.matchDimension(flow.width(),flow.height(),1))
			vy.allocate(flow.width(),flow.height());
		for(int i =0;i<vx.npixels();i++)
		{
			vx.data()[i] = flow.data()[i*2];
			vy.data()[i] = flow.data()[i*2+1];
		}
	}
	// Convenience entry point: run Coarse2FineFlow with the fixed parameter
	// set below and store the result in flow as an interleaved 2-channel image.
	// When Im1 and Im2 differ in dimensions, a message is printed and flow is
	// left untouched.
	static void ComputeOpticalFlow(const DImage& Im1,const DImage& Im2,DImage& flow)
	{
		if(!Im1.matchDimension(Im2))
		{
			cout<<"The input images for optical flow have different dimensions!"<<endl;
			return;
		}
		if(!flow.matchDimension(Im1.width(),Im1.height(),2))
			flow.allocate(Im1.width(),Im1.height(),2);

		// hard-coded defaults, passed straight to Coarse2FineFlow
		double alpha=0.01;
		double ratio=0.75;
		int minWidth=30;
		int nOuterFPIterations=15;
		int nInnerFPIterations=1;
		int nCGIterations=40;

		DImage vx,vy,warpI2;
		OpticalFlow::Coarse2FineFlow(vx,vy,warpI2,Im1,Im2,alpha,ratio,minWidth,nOuterFPIterations,nInnerFPIterations,nCGIterations);
		AssembleFlow(vx,vy,flow);
	}
};
113 | 


--------------------------------------------------------------------------------
/src/Stochastic.cpp:
--------------------------------------------------------------------------------
  1 | // Author: Ce Liu (c) Dec, 2009; celiu@mit.edu
  2 | // Modified By: Deepak Pathak (c) 2016; pathak@berkeley.edu
  3 | 
  4 | #include "Stochastic.h"
  5 | #include "time.h"
  6 | #include "stdlib.h"
  7 | #include "stdio.h"
  8 | 
  9 | CStochastic::CStochastic(void)
 10 | {
 11 | }
 12 | 
 13 | CStochastic::~CStochastic(void)
 14 | {
 15 | }
 16 | 
 17 | void CStochastic::ConvertInt2String(int x,char* string,int BitNumber)
 18 | {
 19 | 	int i,Base=1;
 20 | 	for(i=1;i<BitNumber;i++)
 21 | 		Base*=10;
 22 | 	for(i=0;i<BitNumber;i++)
 23 | 	{
 24 | 		string[i]=x/Base+'0';
 25 | 		x%=Base;
 26 | 		Base/=10;
 27 | 	}
 28 | 	string[i]='\0';
 29 | }
 30 | 
 31 | double CStochastic::UniformSampling()
 32 | {
 33 | 	return (double)rand()/((double)RAND_MAX+(double)1);
 34 | }
 35 | 
 36 | int CStochastic::UniformSampling(int R)
 37 | {
 38 | 	int Index=(double)UniformSampling()*R;
 39 | 	if(Index>R-1)
 40 | 		Index=R-1;
 41 | 	return Index;
 42 | }
 43 | 
 44 | double CStochastic::GaussianSampling()
 45 | {
 46 | 	int i;
 47 | 	double result=0;
 48 | 	for (i=0;i<12;i++)
 49 | 		result+=UniformSampling();
 50 | 	result-=6;
 51 | 	return result;
 52 | }
 53 | 
 54 | 
 55 | double CStochastic::GetMean(double* signal,int length)
 56 | {
 57 | 	double mean=0;
 58 | 	int i;
 59 | 	for(i=0;i<length;i++)
 60 | 		mean+=signal[i];
 61 | 	mean/=length;
 62 | 	return mean;
 63 | }
 64 | 
 65 | int CStochastic::Sampling(double* Density,int NumSamples)
 66 | {
 67 | 	double RandNumber=UniformSampling();
 68 | 	int i;
 69 | 	double sum=0;
 70 | 	for(i=0;i<NumSamples;i++)
 71 | 	{
 72 | 		sum+=Density[i];
 73 | 		if(sum>=RandNumber)
 74 | 			return i;
 75 | 	}
 76 | 	return NumSamples-1;
 77 | }
 78 | 
 79 | void CStochastic::Generate1DGaussian(double* pGaussian,int size,double sigma)
 80 | {
 81 | 	int i;
 82 | 	if(sigma==0)
 83 | 		sigma=size/2;
 84 | 	for(i=-size;i<=size;i++)
 85 | 		pGaussian[i+size]=exp(-(double)i*i/(2*sigma));
 86 | }
 87 | 
 88 | void CStochastic::Generate2DGaussian(double* pGaussian,int WinSize,double sigma)
 89 | {
 90 | 	int i,j,WinLength=WinSize*2+1;
 91 | 	double Sigma;
 92 | 	if(sigma==0)
 93 | 		Sigma=WinSize;
 94 | 	else
 95 | 		Sigma=sigma;
 96 | 	Sigma*=Sigma;
 97 | 	for (i=-WinSize;i<=WinSize;i++)
 98 | 		for(j=-WinSize;j<=WinSize;j++)
 99 | 			pGaussian[(i+WinSize)*WinLength+j+WinSize]=exp(-(double)(i*i+j*j)/(2*Sigma));
100 | 	Normalize(WinLength*WinLength,pGaussian);
101 | }
102 | 
103 | double CStochastic::entropy(double* pDensity,int n)
104 | {
105 | 	double result=0;
106 | 	int i;
107 | 	for(i=0;i<n;i++)
108 | 		result-=log(__max(pDensity[i],1E-6))*pDensity[i];
109 | 	return result;
110 | }
111 | 


--------------------------------------------------------------------------------
/src/Stochastic.h:
--------------------------------------------------------------------------------
  1 | // Author: Ce Liu (c) Dec, 2009; celiu@mit.edu
  2 | // Modified By: Deepak Pathak (c) 2016; pathak@berkeley.edu
  3 | 
  4 | #ifndef STOCHASTIC_H
  5 | #define STOCHASTIC_H
  6 | 
  7 | #include "math.h"
  8 | #include "stdlib.h"
  9 | #include "project.h"
 10 | #include "memory.h"
 11 | 
// Frees an array of pointers: every non-NULL X[i] for i in [0,length) is
// released with scalar `delete`, then X itself with `delete []`.
// `i` must be an assignable integer variable supplied by the caller.
// NOTE(review): the macro expands to two statements (the for loop and the
// trailing delete), so used as the body of an unbraced if/else only the
// loop is guarded. If the rows were allocated with new[], `delete X[i]`
// is a mismatch -- confirm at each call site.
#define _Release_2DArray(X,i,length) for(i=0;i<length;i++) if(X[i]!=NULL) delete X[i]; delete []X
 13 | 
 14 | #ifndef _abs
 15 | #define _abs(x) (x>=0)?x:-x
 16 | #endif
 17 | 
// Single-precision-accurate value of pi, defined only when no other header
// has already provided PI.
#ifndef PI
#define PI 3.1415927
#endif

// Ordering requested from CStochastic::sort.
enum SortType{SortAscending,SortDescending};
 23 | 
// Static-only toolbox of sampling, statistics and small numeric helpers.
// The class declares no data members. Template members are defined further
// down in this header.
class CStochastic
{
public:
	CStochastic(void);
	~CStochastic(void);
	// fixed-width decimal conversion; `string` must hold BitNumber+1 chars
	static void ConvertInt2String(int x,char* string,int BitNumber=3);
	// uniform sample in [0,1)
	static double UniformSampling();
	// uniform integer index, capped at R-1
	static int UniformSampling(int R);
	// approximate standard normal sample
	static double GaussianSampling();
	// mean and variance (divided by length-1) of `signal`
	template <class T> static void GetMeanVar(T* signal,int length,double* mean,double* var);
	// index drawn from a discrete density
	static int Sampling(double* Density,int NumSamples);
	static double GetMean(double *signal,int length);
	// Gaussian kernel generators; sigma=0 selects a size-based default
	static void Generate1DGaussian(double* pGaussian,int size,double sigma=0);
	static void Generate2DGaussian(double* pGaussian,int size,double sigma=0);
	static double entropy(double* pDensity,int n);

	template <class T> static T sum(int NumData,T* pData);
	// divides every element by the sum of all elements, in place
	template <class T> static void Normalize(int NumData,T* pData);
	template <class T> static T mean(int NumData, T* pData);
	// writes the sorted order into pIndex; pData itself is not reordered
	template <class T> static void sort(int number, T* pData,int *pIndex,SortType m_SortType=SortDescending);
	template <class T> static T Min(int NumData, T* pData);
	// minimum of the element-wise sums pData1[i]+pData2[i]
	template <class T> static T Min(int NumData, T* pData1,T* pData2);
	template <class T> static T Max(int NumData ,T* pData);
	// index of the largest element
	template <class T> static int FindMax(int NumData,T* pData);
	// pData holds NumData vectors of length Dim, stored consecutively
	template <class T1,class T2> static void ComputeVectorMean(int Dim,int NumData,T1* pData,T2* pMean,double* pWeight=NULL);
	template <class T1,class T2> static void ComputeMeanCovariance(int Dim,int NumData,T1* pData,T2* pMean,T2* pCovarance,double* pWeight=NULL);
	template <class T1,class T2> static double VectorSquareDistance(int Dim,T1* pVector1,T2* pVector2);
	template <class T1> static void KMeanClustering(int Dim,int NumData,int NumClusters,T1* pData,int *pPartition,double** pClusterMean=NULL,int MaxIterationNum=10,int MinClusterSampleNumber=2);
	// Euclidean norm
	template <class T> static double norm(T* X,int Dim);
	// index of the point closest to QueryPoint under the L1 distance
	template <class T1,class T2> static int FindClosestPoint(T1* pPointSet,int NumPoints,int nDim,T2* QueryPoint);
	template <class T1,class T2> static void GaussianFiltering(T1* pSrcArray,T2* pDstArray,int NumPoints,int nChannels,int size,double sigma);
};
 56 | 
 57 | template <class T>
 58 | void CStochastic::GetMeanVar(T* signal,int length,double* mean,double* var)
 59 | {
 60 | 	double m_mean=0,m_var=0;
 61 | 
 62 | 	int i;
 63 | 	for (i=0;i<length;i++)
 64 | 		m_mean+=signal[i];
 65 | 	m_mean/=length;
 66 | 	for (i=0;i<length;i++)
 67 | 		m_var+=(signal[i]-m_mean)*(signal[i]-m_mean);
 68 | 	m_var/=length-1;
 69 | 	*mean=m_mean;
 70 | 	*var=m_var;
 71 | }
 72 | 
 73 | template <class T>
 74 | T CStochastic::sum(int NumData, T* pData)
 75 | {
 76 | 	T sum=0;
 77 | 	int i;
 78 | 	for(i=0;i<NumData;i++)
 79 | 		sum+=pData[i];
 80 | 	return sum;
 81 | }
 82 | 
 83 | template <class T>
 84 | void CStochastic::Normalize(int NumData,T* pData)
 85 | {
 86 | 	int i;
 87 | 	T Sum;
 88 | 	Sum=sum(NumData,pData);
 89 | 	for(i=0;i<NumData;i++)
 90 | 		pData[i]/=Sum;
 91 | }
 92 | 
 93 | template <class T>
 94 | T CStochastic::mean(int NumData,T* pData)
 95 | {
 96 | 	return sum(NumData,pData)/NumData;
 97 | }
 98 | 
 99 | ////////////////////////////////////////////////////////////
100 | // sort data in descending order
101 | template <class T>
102 | void CStochastic::sort(int Number,T* pData,int *pIndex,SortType m_SortType)
103 | {
104 | 	int i,j,offset_extreme,*flag;
105 | 	double extreme;
106 | 	flag=new int[Number];
107 | 	memset(flag,0,sizeof(int)*Number);
108 | 	for(i=0;i<Number;i++)
109 | 	{
110 | 		if(m_SortType==SortDescending)
111 | 			extreme=-1E100;
112 | 		else
113 | 			extreme=1E100;
114 | 		offset_extreme=0;
115 | 		for(j=0;j<Number;j++)
116 | 		{
117 | 			if(flag[j]==1)
118 | 				continue;
119 | 			if( (m_SortType==SortDescending && extreme<pData[j]) || (m_SortType==SortAscending && extreme>pData[j]))
120 | 			{
121 | 				extreme=pData[j];
122 | 				offset_extreme=j;
123 | 			}
124 | 		}
125 | 		pIndex[i]=offset_extreme;
126 | 		flag[offset_extreme]=1;
127 | 	}
128 | 	delete flag;
129 | }
130 | 
131 | template <class T>
132 | T CStochastic::Min(int NumData,T* pData)
133 | {
134 | 	int i;
135 | 	T result=pData[0];
136 | 	for(i=1;i<NumData;i++)
137 | 		result=__min(result,pData[i]);
138 | 	return result;
139 | }
140 | 
141 | template <class T>
142 | T CStochastic::Min(int NumData,T* pData1,T* pData2)
143 | {
144 | 	int i;
145 | 	T result=pData1[0]+pData2[0];
146 | 	for(i=1;i<NumData;i++)
147 | 		result=__min(result,pData1[i]+pData2[i]);
148 | 	return result;
149 | }
150 | 
151 | template <class T>
152 | T CStochastic::Max(int NumData,T* pData)
153 | {
154 | 	int i;
155 | 	T result=pData[0];
156 | 	for(i=1;i<NumData;i++)
157 | 		result=__max(result,pData[i]);
158 | 	return result;
159 | }
160 | 
161 | template <class T>
162 | int CStochastic::FindMax(int NumData,T* pData)
163 | {
164 | 	int i,index;
165 | 	T result=pData[0];
166 | 	index=0;
167 | 	for(i=1;i<NumData;i++)
168 | 		if(pData[i]>result)
169 | 		{
170 | 			index=i;
171 | 			result=pData[i];
172 | 		}
173 | 	return index;
174 | }
175 | 
176 | 
177 | template <class T1,class T2>
178 | void CStochastic::ComputeMeanCovariance(int Dim,int NumData,T1* pData,T2* pMean,T2* pCovariance,double* pWeight)
179 | {
180 | 	int i,j,k;
181 | 	memset(pMean,0,sizeof(T2)*Dim);
182 | 	memset(pCovariance,0,sizeof(T2)*Dim*Dim);
183 | 
184 | 	bool IsWeightLoaded=false;
185 | 	double Sum;
186 | 	if(pWeight!=NULL)
187 | 		IsWeightLoaded=true;
188 | 
189 | 	// compute mean first
190 | 	Sum=0;
191 | 	if(IsWeightLoaded)
192 | 		for(i=0;i<NumData;i++)
193 | 		{
194 | 			if(pWeight[i]==0)
195 | 				continue;
196 | 			for(j=0;j<Dim;j++)
197 | 				pMean[j]+=pData[i*Dim+j]*pWeight[i];
198 | 			Sum+=pWeight[i];
199 | 		}
200 | 	else
201 | 	{
202 | 		for(i=0;i<NumData;i++)
203 | 			for(j=0;j<Dim;j++)
204 | 				pMean[j]+=pData[i*Dim+j];
205 | 		Sum=NumData;
206 | 	}
207 | 	for(j=0;j<Dim;j++)
208 | 		pMean[j]/=Sum;
209 | 
210 | 	//compute covariance;
211 | 	T2* pTempVector;
212 | 	pTempVector=new T2[Dim];
213 | 
214 | 	for(i=0;i<NumData;i++)
215 | 	{
216 | 		for(j=0;j<Dim;j++)
217 | 			pTempVector[j]=pData[i*Dim+j]-pMean[j];
218 | 		if(IsWeightLoaded)
219 | 		{
220 | 			if(pWeight[i]==0)
221 | 				continue;
222 | 			for(j=0;j<Dim;j++)
223 | 				for(k=0;k<=j;k++)
224 | 					pCovariance[j*Dim+k]+=pTempVector[j]*pTempVector[k]*pWeight[i];
225 | 		}
226 | 		else
227 | 			for(j=0;j<Dim;j++)
228 | 				for(k=0;k<=j;k++)
229 | 					pCovariance[j*Dim+k]+=pTempVector[j]*pTempVector[k];
230 | 	}
231 | 	for(j=0;j<Dim;j++)
232 | 		for(k=j+1;k<Dim;k++)
233 | 			pCovariance[j*Dim+k]=pCovariance[k*Dim+j];
234 | 
235 | 	for(j=0;j<Dim*Dim;j++)
236 | 		pCovariance[j]/=Sum;
237 | 
238 | 	delete []pTempVector;
239 | }
240 | 
241 | template <class T1,class T2>
242 | void CStochastic::ComputeVectorMean(int Dim,int NumData,T1* pData,T2* pMean,double* pWeight)
243 | {
244 | 	int i,j;
245 | 	memset(pMean,0,sizeof(T2)*Dim);
246 | 	bool IsWeightLoaded;
247 | 	double Sum;
248 | 	if(pWeight==NULL)
249 | 		IsWeightLoaded=false;
250 | 	else
251 | 		IsWeightLoaded=true;
252 | 
253 | 	Sum=0;
254 | 	if(IsWeightLoaded)
255 | 		for(i=0;i<NumData;i++)
256 | 		{
257 | 			if(pWeight[i]==0)
258 | 				continue;
259 | 			for(j=0;j<Dim;j++)
260 | 				pMean[j]+=pData[i*Dim+j]*pWeight[i];
261 | 			Sum+=pWeight[i];
262 | 		}
263 | 	else
264 | 	{
265 | 		for(i=0;i<NumData;i++)
266 | 			for(j=0;j<Dim;j++)
267 | 				pMean[j]+=pData[i*Dim+j];
268 | 		Sum=NumData;
269 | 	}
270 | 	for(j=0;j<Dim;j++)
271 | 		pMean[j]/=Sum;
272 | }
273 | 
274 | template <class T1,class T2>
275 | double CStochastic::VectorSquareDistance(int Dim,T1* pVector1,T2* pVector2)
276 | {
277 | 	double result=0,temp;
278 | 	int i;
279 | 	for(i=0;i<Dim;i++)
280 | 	{
281 | 		temp=pVector1[i]-pVector2[i];
282 | 		result+=temp*temp;
283 | 	}
284 | 	return result;
285 | }
286 | 
287 | template <class T1>
288 | void CStochastic::KMeanClustering(int Dim,int NumData,int NumClusters,T1* pData,int *pPartition,double** pClusterMean,int MaxIterationNum, int MinClusterSampleNumber)
289 | {
290 | 	int i,j,k,l,Index,ClusterSampleNumber;
291 | 	double MinDistance,Distance;
292 | 	double** pCenters;
293 | 	pCenters=new double*[NumClusters];
294 | 	for(i=0;i<NumClusters;i++)
295 | 		pCenters[i]=new double[Dim];
296 | 
297 | 	// generate randome guess of the partition
298 | _CStochastic_KMeanClustering_InitializePartition:
299 | 	for(i=0;i<NumClusters;i++)
300 | 	{
301 | 		Index=UniformSampling(NumData);
302 | 		for(j=0;j<Dim;j++)
303 | 			pCenters[i][j]=pData[Index*Dim+j];
304 | 	}
305 | 
306 | 	for(k=0;k<MaxIterationNum;k++)
307 | 	{
308 | 		// step 1. do partition
309 | 		for(i=0;i<NumData;i++)
310 | 		{
311 | 			MinDistance=1E100;
312 | 			for(j=0;j<NumClusters;j++)
313 | 			{
314 | 				Distance=VectorSquareDistance(Dim,pData+i*Dim,pCenters[j]);
315 | 				if(Distance<MinDistance)
316 | 				{
317 | 					MinDistance=Distance;
318 | 					Index=j;
319 | 				}
320 | 			}
321 | 			pPartition[i]=Index;
322 | 		}
323 | 		// step 2. compute mean
324 | 		for(i=0;i<NumClusters;i++)
325 | 		{
326 | 			memset(pCenters[i],0,sizeof(double)*Dim);
327 | 			ClusterSampleNumber=0;
328 | 			for(j=0;j<NumData;j++)
329 | 				if(pPartition[j]==i)
330 | 				{
331 | 					for(l=0;l<Dim;l++)
332 | 						pCenters[i][l]+=pData[j*Dim+l];
333 | 					ClusterSampleNumber++;
334 | 				}
335 | 			// maybe the initial partition is bad
336 | 			// if so just do initial partition again
337 | 			if(ClusterSampleNumber<MinClusterSampleNumber)
338 | 				goto _CStochastic_KMeanClustering_InitializePartition;
339 | 			for(l=0;l<Dim;l++)
340 | 				pCenters[i][l]/=ClusterSampleNumber;
341 | 		}
342 | 	}
343 | 	// output the final partition if necessary
344 | 	if(pClusterMean!=NULL)
345 | 		for(i=0;i<NumClusters;i++)
346 | 			for(l=0;l<Dim;l++)
347 | 				pClusterMean[i][l]=pCenters[i][l];
348 | 	// free buffer
349 | 	for(i=0;i<NumClusters;i++)
350 | 		delete pCenters[i];
351 | 	delete []pCenters;
352 | }
353 | 
354 | template <class T>
355 | double CStochastic::norm(T* X,int Dim)
356 | {
357 | 	double result=0;
358 | 	int i;
359 | 	for(i=0;i<Dim;i++)
360 | 		result+=X[i]*X[i];
361 | 	result=sqrt(result);
362 | 	return result;
363 | }
364 | 
365 | template <class T1,class T2>
366 | int CStochastic::FindClosestPoint(T1* pPointSet,int NumPoints,int nDim,T2* QueryPoint)
367 | {
368 | 	int i,j,Index=0,offset;
369 | 	T1 MinDistance,Distance,x;
370 | 	MinDistance=0;
371 | 	for(j=0;j<nDim;j++)
372 | 		MinDistance+=_abs(pPointSet[j]-QueryPoint[j]);
373 | 	for(i=1;i<NumPoints;i++)
374 | 	{
375 | 		Distance=0;
376 | 		offset=i*nDim;
377 | 		for(j=0;j<nDim;j++)
378 | 		{
379 | 			x=pPointSet[offset+j]-QueryPoint[j];
380 | 			Distance+=_abs(x);
381 | 		}
382 | 		if(Distance<MinDistance)
383 | 		{
384 | 			MinDistance=Distance;
385 | 			Index=i;
386 | 		}
387 | 	}
388 | 	return Index;
389 | }
390 | 
391 | template <class T1,class T2>
392 | void CStochastic::GaussianFiltering(T1* pSrcArray,T2* pDstArray,int NumPoints,int nChannels,int size,double sigma)
393 | {
394 | 	int i,j,u,l;
395 | 	double *pGaussian,temp;
396 | 	pGaussian=new double[2*size+1];
397 | 	Generate1DGaussian(pGaussian,size,sigma);
398 | 	for(i=0;i<NumPoints;i++)
399 | 		for(l=0;l<nChannels;l++)
400 | 		{
401 | 			temp=0;
402 | 			for(j=-size;j<=size;j++)
403 | 			{
404 | 				u=i+j;
405 | 				u=__max(__min(u,NumPoints-1),0);
406 | 				temp+=pSrcArray[u*nChannels+l]*pGaussian[j+size];
407 | 			}
408 | 			pDstArray[i*nChannels+l]=temp;
409 | 		}
410 | 	delete pGaussian;
411 | }
412 | 
413 | #endif
414 | 


--------------------------------------------------------------------------------
/src/Vector.h:
--------------------------------------------------------------------------------
  1 | // Author: Ce Liu (c) Dec, 2009; celiu@mit.edu
  2 | // Modified By: Deepak Pathak (c) 2016; pathak@berkeley.edu
  3 | 
  4 | #pragma once
  5 | 
  6 | #include "stdio.h"
  7 | #include "project.h"
  8 | #include <vector>
  9 | 
 10 | using namespace std;
 11 | 
 12 | template <class T>
 13 | class Vector
 14 | {
 15 | protected:
 16 | 	int nDim;
 17 | 	T* pData;
 18 | public:
 19 | 	Vector(void);
 20 | 	Vector(int ndim,const T *data=NULL);
 21 | 	Vector(const Vector<T>& vect);
 22 | 	~Vector(void);
 23 | 	void releaseData();
 24 | 	void allocate(int ndim);
 25 | 	void allocate(const Vector<T>& vect){allocate(vect.nDim);};
 26 | 	void copyData(const Vector<T>& vect);
 27 | 	void dimcheck(const Vector<T>& vect) const;
 28 | 	void reset();
 29 | 	double norm2() const;
 30 | 
 31 | 	T sum() const;
 32 | 
 33 | 	void printVector();
 34 | 
 35 | 	// access the members
 36 | 	const T* data() const{return (const T*)pData;};
 37 | 	T* data() {return pData;};
 38 | 	int dim() const {return nDim;};
 39 | 	inline bool matchDimension(int _ndim) const {if(nDim==_ndim) return true;else return false;};
 40 | 	inline bool matchDimension(const Vector<T>& vect) const {return matchDimension(vect.nDim);};
 41 | 
 42 | 	// operators
 43 | 	inline T operator[](int index) const {return pData[index];};
 44 | 	inline T& operator[](int index){return *(pData+index);};
 45 | 	Vector<T>& operator=(const Vector<T>& vect);
 46 | 
 47 | 	//const Vector<T>& operator/(double val) const
 48 | 	//{
 49 | 	//	Vector<T> result(nDim);
 50 | 	//	for(int i =0;i<nDim;i++)
 51 | 	//		result.pData[i] = pData[i]/val;
 52 | 	//	return result;
 53 | 	//}
 54 | 
 55 | 	Vector<T>& operator+=(const Vector<T>& vect);
 56 | 	Vector<T>& operator*=(const Vector<T>& vect);
 57 | 	Vector<T>& operator-=(const Vector<T>& vect);
 58 | 	Vector<T>& operator/=(const Vector<T>& vect);
 59 | 
 60 | 	Vector<T>& operator+=(double val);
 61 | 	Vector<T>& operator*=(double val);
 62 | 	Vector<T>& operator-=(double val);
 63 | 	Vector<T>& operator/=(double val);
 64 | 
 65 | 	//friend const Vector<T> operator+(const Vector<T>& vect1,const Vector<T>& vect2);
 66 | 	//friend const Vector<T> operator*(const Vector<T>& vect1,const Vector<T>& vect2);
 67 | 	//friend const Vector<T> operator-(const Vector<T>& vect1,const Vector<T>& vect2);
 68 | 	//friend const Vector<T> operator/(const Vector<T>& vect1,const Vector<T>& vect2);
 69 | 
 70 | 	//friend const Vector<T> operator+(const Vector<T>& vect1,double val);
 71 | 	//friend const Vector<T> operator*(const Vector<T>& vect1,double val);
 72 | 	//friend const Vector<T> operator-(const Vector<T>& vect1,double val);
 73 | 	//friend Vector<T> operator/(const Vector<T>& vect,double val);
 74 | 
 75 | 	friend double innerproduct(const Vector<T>& vect1,const Vector<T>& vect2)
 76 | 	{
 77 | 		double result = 0;
 78 | 		for(int i = 0;i<vect1.dim();i++)
 79 | 			result += vect1[i]*vect2[i];
 80 | 		return result;
 81 | 	}
 82 | 
 83 | 	void concatenate(const vector< Vector<T> >& vect);
 84 | 
 85 | 	//friend const Vector<T> concatenate(const vector<Vector<T>>& vect){Vector<T> result; result.concatenate(vect); return result;};
 86 | 	bool write(ofstream& myfile)
 87 | 	{
 88 | 		myfile.write((char *)&nDim,sizeof(int));
 89 | 		myfile.write((char *)pData,sizeof(T)*nDim);
 90 | 		return true;
 91 | 	}
 92 | 	bool read(ifstream& myfile)
 93 | 	{
 94 | 		myfile.read((char *)&nDim,sizeof(int));
 95 | 		allocate(nDim);
 96 | 		myfile.read((char *)pData,sizeof(T)*nDim);
 97 | 		return true;
 98 | 	}
 99 | 	T mean(int N=-1) const
100 | 	{
101 | 		if(N==-1)
102 | 			N = nDim;
103 | 		T result = 0;
104 | 		for(int i = 0;i<N;i++)
105 | 			result += pData[i];
106 | 		return result/N;
107 | 	}
108 | #ifdef _MATLAB
109 | 	void readVector(const mxArray* prhs);
110 | 	void writeVector(mxArray*& prhs) const;
111 | #endif
112 | };
113 | 
114 | //template <class T>
115 | //double innerproduct(const Vector<T>& vect1,const Vector<T>& vect2)
116 | //{
117 | //	double result = 0;
118 | //	for(int i = 0;i<vect1.dim();i++)
119 | //		result += vect1[i]*vect2[i];
120 | //	return result;
121 | //}
122 | 
123 | template <class T>
124 | Vector<T>::Vector(void)
125 | {
126 | 	nDim=0;
127 | 	pData=NULL;
128 | }
129 | 
130 | template <class T>
131 | Vector<T>::Vector(int ndim, const T *data)
132 | {
133 | 	nDim=ndim;
134 | 	pData=new T[nDim];
135 | 	if(data!=NULL)
136 | 		memcpy(pData,data,sizeof(T)*nDim);
137 | 	else
138 | 		memset(pData,0,sizeof(T)*nDim);
139 | }
140 | 
141 | template <class T>
142 | Vector<T>::Vector(const Vector& vect)
143 | {
144 | 	nDim=0;
145 | 	pData=NULL;
146 | 	copyData(vect);
147 | }
148 | 
149 | template <class T>
150 | Vector<T>::~Vector(void)
151 | {
152 | 	releaseData();
153 | }
154 | 
155 | template <class T>
156 | void Vector<T>::releaseData()
157 | {
158 | 	if(pData!=NULL)
159 | 		delete[] pData;
160 | 	pData=NULL;
161 | 	nDim=0;
162 | }
163 | 
164 | template <class T>
165 | void Vector<T>::allocate(int ndim)
166 | {
167 | 	releaseData();
168 | 	nDim=ndim;
169 | 	if(nDim>0)
170 | 	{
171 | 		pData=new T[nDim];
172 | 		reset();
173 | 	}
174 | }
175 | 
176 | 
177 | template <class T>
178 | void Vector<T>::copyData(const Vector &vect)
179 | {
180 | 	if(nDim!=vect.nDim)
181 | 	{
182 | 		releaseData();
183 | 		nDim=vect.nDim;
184 | 		pData=new T[nDim];
185 | 	}
186 | 	memcpy(pData,vect.pData,sizeof(T)*nDim);
187 | }
188 | 
189 | template <class T>
190 | void Vector<T>::dimcheck(const Vector &vect) const
191 | {
192 | 	if(nDim!=vect.nDim)
193 | 		cout<<"The dimensions of the vectors don't match!"<<endl;
194 | }
195 | 
196 | template <class T>
197 | void Vector<T>::reset()
198 | {
199 | 	if(pData!=NULL)
200 | 		memset(pData,0,sizeof(T)*nDim);
201 | }
202 | 
203 | 
204 | template <class T>
205 | T Vector<T>::sum() const
206 | {
207 | 	T total = 0;
208 | 	for(int i=0;i<nDim;i++)
209 | 		total += pData[i];
210 | 	return total;
211 | }
212 | 
213 | template <class T>
214 | double Vector<T>::norm2() const
215 | {
216 | 	double temp=0;
217 | 	for(int i=0;i<nDim;i++)
218 | 		temp+=pData[i]*pData[i];
219 | 	return temp;
220 | }
221 | 
222 | template <class T>
223 | void Vector<T>::printVector()
224 | {
225 | 	for(int i=0;i<nDim;i++)
226 | 		cout<<pData[i]<<' ';
227 | 	cout<<endl;
228 | }
229 | 
230 | 
231 | //----------------------------------------------------------------------------------
232 | // operators
233 | //----------------------------------------------------------------------------------
234 | template <class T>
235 | Vector<T>& Vector<T>::operator =(const Vector<T> &vect)
236 | {
237 | 	copyData(vect);
238 | 	return *this;
239 | }
240 | 
241 | template <class T>
242 | Vector<T>& Vector<T>::operator +=(const Vector<T> &vect)
243 | {
244 | 	dimcheck(vect);
245 | 	for(int i=0;i<nDim;i++)
246 | 		pData[i]+=vect.data()[i];
247 | 	return *this;
248 | }
249 | 
250 | template <class T>
251 | Vector<T>& Vector<T>::operator *=(const Vector<T> &vect)
252 | {
253 | 	dimcheck(vect);
254 | 	for(int i=0;i<nDim;i++)
255 | 		pData[i]*=vect.data()[i];
256 | 	return *this;
257 | }
258 | 
259 | template <class T>
260 | Vector<T>& Vector<T>::operator -=(const Vector<T> &vect)
261 | {
262 | 	dimcheck(vect);
263 | 	for(int i=0;i<nDim;i++)
264 | 		pData[i]-=vect.data()[i];
265 | 	return *this;
266 | }
267 | 
268 | template <class T>
269 | Vector<T>& Vector<T>::operator /=(const Vector<T> &vect)
270 | {
271 | 	dimcheck(vect);
272 | 	for(int i=0;i<nDim;i++)
273 | 		pData[i]/=vect.data()[i];
274 | 	return *this;
275 | }
276 | 
277 | template <class T>
278 | Vector<T>& Vector<T>::operator +=(double val)
279 | {
280 | 	for(int i=0;i<nDim;i++)
281 | 		pData[i]+=val;
282 | 	return *this;
283 | }
284 | 
285 | template <class T>
286 | Vector<T>& Vector<T>::operator *=(double val)
287 | {
288 | 	for(int i=0;i<nDim;i++)
289 | 		pData[i]*=val;
290 | 	return *this;
291 | }
292 | 
293 | template <class T>
294 | Vector<T>& Vector<T>::operator -=(double val)
295 | {
296 | 	for(int i=0;i<nDim;i++)
297 | 		pData[i]-=val;
298 | 	return *this;
299 | }
300 | 
301 | template <class T>
302 | Vector<T>& Vector<T>::operator /=(double val)
303 | {
304 | 	for(int i=0;i<nDim;i++)
305 | 		pData[i]/=val;
306 | 	return *this;
307 | }
308 | 
309 | 
310 | template<class T>
311 | const Vector<T> operator+(const Vector<T>& vect1,const Vector<T>& vect2)
312 | {
313 | 	vect1.dimcheck(vect2);
314 | 	Vector<T> result(vect1);
315 | 	result+=vect2;
316 | 	return result;
317 | }
318 | 
319 | template<class T>
320 | const Vector<T> operator-(const Vector<T>& vect1,const Vector<T>& vect2)
321 | {
322 | 	vect1.dimcheck(vect2);
323 | 	Vector<T> result(vect1);
324 | 	result-=vect2;
325 | 	return result;
326 | }
327 | 
328 | template<class T>
329 | const Vector<T> operator*(const Vector<T>& vect1,const Vector<T>& vect2)
330 | {
331 | 	vect1.dimcheck(vect2);
332 | 	Vector<T> result(vect1);
333 | 	result*=vect2;
334 | 	return result;
335 | }
336 | 
337 | template<class T>
338 | const Vector<T> operator/(const Vector<T>& vect1,const Vector<T>& vect2)
339 | {
340 | 	vect1.dimcheck(vect2);
341 | 	Vector<T> result(vect1);
342 | 	result/=vect2;
343 | 	return result;
344 | }
345 | 
346 | template <class T>
347 | Vector<T> operator+(const Vector<T>& vect,double val)
348 | {
349 | 	Vector<T> result(vect);
350 | 	result+=val;
351 | 	return result;
352 | }
353 | 
354 | template <class T>
355 | Vector<T> operator-(const Vector<T>& vect,double val)
356 | {
357 | 	Vector<T> result(vect);
358 | 	result-=val;
359 | 	return result;
360 | }
361 | 
362 | template <class T>
363 | Vector<T> operator*(const Vector<T>& vect,double val)
364 | {
365 | 	Vector<T> result(vect);
366 | 	result*=val;
367 | 	return result;
368 | }
369 | 
370 | template <class T>
371 | Vector<T> operator/(const Vector<T>& vect,double val)
372 | {
373 | 	Vector<T> result(vect);
374 | 	result/=val;
375 | 	return result;
376 | }
377 | 
378 | 
379 | template <class T>
380 | double innerproduct(const Vector<T>& vect1,const Vector<T>& vect2)
381 | {
382 | 	vect1.dimcheck(vect2);
383 | 	double result=0;
384 | 	for(int i=0;i<vect1.nDim;i++)
385 | 		result+=vect1.pData[i]*vect2.pData[i];
386 | 	return result;
387 | }
388 | 
389 | template <class T>
390 | void Vector<T>::concatenate(const vector< Vector<T> >& vect)
391 | {
392 | 	releaseData();
393 | 	nDim = 0;
394 | 	for(int i = 0;i<vect.size();i++)
395 | 		nDim += vect[i].dim();
396 | 	allocate(nDim);
397 | 	int dim = 0;
398 | 	for(int i = 0;i<vect.size(); i++)
399 | 	{
400 | 		for(int j = 0;j<vect[i].dim();j++)
401 | 			pData[dim+j] = vect[i][j];
402 | 		dim += vect[i].dim();
403 | 	}
404 | }
405 | 
// Qt file I/O, compiled only when _QT is defined.
// NOTE(review): both functions are written for a non-template `Vector` and
// use sizeof(double) rather than sizeof(T); neither is declared in the
// Vector<T> class in this header. They look like leftovers from a
// double-only version and would not compile against the current class if
// _QT were defined -- confirm before enabling.
#ifdef _QT

// Write the dimension followed by the raw element bytes; returns false when
// the element write is short. The result of the dimension write is ignored.
bool Vector::writeVector(QFile& file) const
{
	file.write((char *)&nDim,sizeof(int));
	if(file.write((char *)pData,sizeof(double)*nDim)!=sizeof(double)*nDim)
		return false;
	return true;
}

// Read a vector stored by writeVector; returns false for a negative
// dimension or a short element read. The result of the dimension read is
// not checked.
bool Vector::readVector(QFile &file)
{
	releaseData();
	file.read((char *)&nDim,sizeof(int));
	if(nDim<0)
		return false;
	if(nDim>0)
	{
		allocate(nDim);
		if(file.read((char *)pData,sizeof(double)*nDim)!=sizeof(double)*nDim)
			return false;
	}
	return true;
}

#endif
432 | 
433 | 
434 | #ifdef _MATLAB
435 | 
436 | template <class T>
437 | void Vector<T>::readVector(const mxArray* prhs)
438 | {
439 | 	if(pData!=NULL)
440 | 		delete[] pData;
441 | 	int nElements = mxGetNumberOfDimensions(prhs);
442 | 	if(nElements>2)
443 | 		mexErrMsgTxt("A vector is expected to be loaded!");
444 | 	const int* dims = mxGetDimensions(prhs);
445 | 	nDim = dims[0]*dims[1];
446 | 	pData = new T[nDim];
447 | 	double* ptr = (double*)mxGetData(prhs);
448 | 	for(int i =0;i<nDim;i++)
449 | 		pData[i] = ptr[i];
450 | }
451 | 
452 | template <class T>
453 | void Vector<T>::writeVector(mxArray*& plhs) const
454 | {
455 | 	int dims[2];
456 | 	dims[0]=nDim;dims[1]=1;
457 | 	plhs=mxCreateNumericArray(2, dims,mxDOUBLE_CLASS, mxREAL);
458 | 	double *ptr = (double*)mxGetData(plhs);
459 | 	for(int i =0;i<nDim;i++)
460 | 		ptr[i] = pData[i];
461 | }
462 | #endif
463 | 
464 | //*/
465 | 


--------------------------------------------------------------------------------
/src/project.h:
--------------------------------------------------------------------------------
 1 | // Author: Ce Liu (c) Dec, 2009; celiu@mit.edu
 2 | // Modified By: Deepak Pathak (c) 2016; pathak@berkeley.edu
 3 | 
 4 | #pragma once
 5 | #include "stdio.h"
 6 | #include <vector>
 7 | 
 8 | // if the files are compiled in linux or mac os then uncomment the following line, otherwise comment it if you compile using visual studio in windows
 9 | #define _LINUX_MAC
10 | // #define _OPENCV
11 | 
// Release an array allocated with new[].
// pBuffer is passed by value, so the final reset to NULL only affects the
// local copy; the caller's pointer keeps its old value.
template <class T>
void _Release1DBuffer(T* pBuffer)
{
	// delete[] on a null pointer is a no-op, so no explicit check is needed
	delete []pBuffer;
	pBuffer=NULL;
}
19 | 
// Release an array of nElements row arrays (each allocated with new[]) and
// then the array of row pointers itself.
// pBuffer is passed by value, so the final reset to NULL only affects the
// local copy.
template <class T>
void _Rlease2DBuffer(T** pBuffer,size_t nElements)
{
	size_t row=0;
	while(row<nElements)
	{
		delete [](pBuffer[row]);
		++row;
	}
	delete []pBuffer;
	pBuffer=NULL;
}
28 | 
29 | // disable matlab support
30 | // #define _MATLAB
31 | 
32 | #ifdef _MATLAB
33 | #include "mex.h"
34 | 
35 | #endif
36 | 
37 | 
38 | #ifdef _LINUX_MAC
39 | 
// Smaller of a and b. The two arguments may have different types; the
// result is converted to the type of the first argument.
template <class T1,class T2>
T1 __min(T1 a, T2 b)
{
  const bool secondIsSmaller = (a>b);
  return secondIsSmaller ? b : a;
}
45 | 
// Larger of a and b. The two arguments may have different types; the
// result is converted to the type of the first argument.
template <class T1,class T2>
T1 __max(T1 a, T2 b)
{
  const bool secondIsLarger = (a<b);
  return secondIsLarger ? b : a;
}
51 | 
52 | #endif
53 | 


--------------------------------------------------------------------------------