├── 6.png ├── 8.png ├── CMakeLists.txt ├── README.txt ├── include ├── CPM_include │ ├── CPM.h │ ├── Image.h │ ├── ImageFeature.h │ ├── ImageIO.h │ ├── ImageProcessing.h │ ├── ImagePyramid.h │ ├── OpticFlowIO.h │ ├── Stochastic.h │ ├── Util.h │ ├── Vector.h │ └── project.h ├── ColorModel.h ├── Minimization.h ├── Pixel.h ├── ThreadPool.h ├── Unmixing.h ├── constants.h └── guidedfilter.h ├── lib ├── libCPM_lib.a └── libCPM_lib.so ├── sphere01.txt └── src ├── ColorModel.cpp ├── Minimization.cpp ├── Pixel.cpp ├── guidedfilter.cpp └── main.cpp /6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/V-Sense/soft_segmentation/a0e2717199787633eb849b5e66a59e9fd7f53b31/6.png -------------------------------------------------------------------------------- /8.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/V-Sense/soft_segmentation/a0e2717199787633eb849b5e66a59e9fd7f53b31/8.png -------------------------------------------------------------------------------- /CMakeLists.txt: -------------------------------------------------------------------------------- 1 | cmake_minimum_required(VERSION 2.8) 2 | 3 | set(PROJECTNAME "SoftSegmentation") 4 | project(${PROJECTNAME} C CXX) 5 | 6 | # for gdb debug -> run cmake -DCMAKE_BUILD_TYPE=Debug 7 | set(CMAKE_BUILD_TYPE Debug) #Debug or Release 8 | 9 | # Enable C++11 features 10 | if(CMAKE_COMPILER_IS_GNUCXX) 11 | set(CMAKE_CXX_FLAGS "-std=gnu++11") 12 | elseif(CMAKE_CXX_COMPILER_ID STREQUAL "Clang") 13 | set(CMAKE_CXX_FLAGS "-std=c++11") 14 | endif() 15 | 16 | find_package(OpenCV REQUIRED) 17 | 18 | set(CMAKE_THREAD_PREFER_PTHREAD TRUE) 19 | set(THREADS_PREFER_PTHREAD_FLAG TRUE) 20 | 21 | find_package(Threads REQUIRED) 22 | 23 | include_directories(src) 24 | include_directories(include) 25 | include_directories(include/CPM_include) 26 | 27 | #file(GLOB HEADERS include/*.h) 28 | file(GLOB SOURCES src/*.cpp) 29 | 30 | #message(STATUS ${CMAKE_SOURCE_DIR}) 31 | 32 | #create a library out of this program 33 | #add_library(${PROJECTNAME}_lib ${SOURCES}) 34 | 35 | add_executable(${PROJECTNAME} src/main.cpp ${SOURCES}) 36 | target_link_libraries(${PROJECTNAME} 37 | ${CMAKE_THREAD_LIBS_INIT} 38 | ${CMAKE_SOURCE_DIR}/lib/libCPM_lib.so 39 | ${OpenCV_LIBS} 40 | ) 41 | -------------------------------------------------------------------------------- /README.txt: -------------------------------------------------------------------------------- 1 | This is a C++ implementation of the paper: 2 | 3 | Unmixing-Based Soft Color Segmentation for Image Manipulation 4 | 5 | Yagiz Aksoy, Tunc Ozan Aydin, Aljosa Smolic and Marc Pollefeys, ACM Trans. Graph., 2017 6 | 7 | Dependencies 8 | 9 | 10 | Ubuntu 14.04 or 16.04 11 | OpenCV 3.x 12 | Install the following dependencies from terminal: 13 | 14 | 15 | sudo apt-get install libpthread-stubs0-dev libboost-all-dev 16 | 17 | 18 | Installation: 19 | 20 | 1. Clone the code. 21 | 22 | 2. Build the project using the following commands: 23 | 24 | mkdir build 25 | cd build 26 | cmake .. 27 | make 28 | 29 | 3. Run the code as follow: 30 | 31 | ./SoftSegmentation 32 | 33 | For example: 34 | ./SoftSegmentation ../4_small.png 15 results 35 | 36 | Results are saved in the folder . 37 | 38 | A tau parameter of 11 gives good results. 39 | -------------------------------------------------------------------------------- /include/CPM_include/CPM.h: -------------------------------------------------------------------------------- 1 | /* 2 | 3 | Code of the Coarse-to-Fine PatchMatch, published at CVPR 2016 in 4 | "Efficient Coarse-to-Fine PatchMatch for Large Displacement Optical Flow" 5 | by Yinlin.Hu, Rui Song and Yunsong Li. 6 | 7 | Email: huyinlin@gmail.com 8 | 9 | Version 1.2 10 | 11 | Copyright (C) 2016 Yinlin.Hu 12 | 13 | Usages: 14 | 15 | The program "cpm.exe" has been built and tested on Windows 7. 16 | 17 | USAGE: cpm.exe img1Name img2Name outMatchName 18 | 19 | Explanations: 20 | 21 | The output of the program is a text file, which is in the format of "x1,y1,x2,y2" 22 | corresponding to one match per line. 23 | 24 | */ 25 | 26 | #ifndef _CPM_H_ 27 | #define _CPM_H_ 28 | 29 | #include "ImagePyramid.h" 30 | 31 | class CPM 32 | { 33 | public: 34 | CPM(); 35 | ~CPM(); 36 | 37 | int Matching(FImage& img1, FImage& img2, FImage& outMatches); 38 | void SetStereoFlag(int needStereo); 39 | void SetStep(int step); 40 | 41 | private: 42 | void imDaisy(FImage& img, UCImage& outFtImg); 43 | void CrossCheck(IntImage& seeds, FImage& seedsFlow, FImage& seedsFlow2, IntImage& kLabel2, int* valid, float th); 44 | float MatchCost(FImage& img1, FImage& img2, UCImage* im1f, UCImage* im2f, int x1, int y1, int x2, int y2); 45 | 46 | // a good initialization is already stored in bestU & bestV 47 | int Propogate(FImagePyramid& pyd1, FImagePyramid& pyd2, UCImage* pyd1f, UCImage* pyd2f, int level, float* radius, int iterCnt, IntImage* pydSeeds, IntImage& neighbors, FImage* pydSeedsFlow, float* bestCosts); 48 | void PyramidRandomSearch(FImagePyramid& pyd1, FImagePyramid& pyd2, UCImage* im1f, UCImage* im2f, IntImage* pydSeeds, IntImage& neighbors, FImage* pydSeedsFlow); 49 | void OnePass(FImagePyramid& pyd1, FImagePyramid& pyd2, UCImage* im1f, UCImage* im2f, IntImage& seeds, IntImage& neighbors, FImage* pydSeedsFlow); 50 | void UpdateSearchRadius(IntImage& neighbors, FImage* pydSeedsFlow, int level, float* outRadius); 51 | 52 | // minimum circle 53 | struct Point{ 54 | double x, y; 55 | }; 56 | double dist(Point a, Point b); 57 | Point intersection(Point u1, Point u2, Point v1, Point v2); 58 | Point circumcenter(Point a, Point b, Point c); 59 | // return the radius of the minimal circle 60 | float MinimalCircle(float* x, float*y, int n, float* centerX = NULL, float* centerY = NULL); 61 | 62 | // 63 | int _step; 64 | int _maxIters; 65 | float _stopIterRatio; 66 | float _pydRatio; 67 | 68 | int _isStereo; 69 | int _maxDisplacement; 70 | float _checkThreshold; 71 | int _borderWidth; 72 | 73 | IntImage _kLabels, _kLabels2; 74 | 75 | FImagePyramid _pyd1; 76 | FImagePyramid _pyd2; 77 | 78 | UCImage* _im1f; 79 | UCImage* _im2f; 80 | 81 | FImage* _pydSeedsFlow; 82 | FImage* _pydSeedsFlow2; 83 | 84 | IntImage _seeds; 85 | IntImage _seeds2; 86 | IntImage _neighbors; 87 | IntImage _neighbors2; 88 | 89 | }; 90 | 91 | #endif // _CPM_H_ -------------------------------------------------------------------------------- /include/CPM_include/ImageFeature.h: -------------------------------------------------------------------------------- 1 | #pragma once 2 | #include "Image.h" 3 | #include "math.h" 4 | #include "memory.h" 5 | #include 6 | 7 | #ifndef M_PI 8 | #define M_PI 3.1415926535897932384626433 9 | #endif 10 | 11 | 12 | class ImageFeature 13 | { 14 | public: 15 | ImageFeature(void); 16 | ~ImageFeature(void); 17 | 18 | template 19 | static void imSIFT(const Image& imsrc, UCImage& imsift, int cellSize = 2, int stepSize = 1, bool IsBoundaryIncluded = false, int nBins = 8); 20 | 21 | template 22 | static void imSIFT(const Image& imsrc, UCImage& imsift, const vector cellSizeVect, int stepSize = 1, bool IsBoundaryIncluded = false, int nBins = 8); 23 | 24 | }; 25 | 26 | template 27 | void ImageFeature::imSIFT(const Image& imsrc, UCImage &imsift, int cellSize, int stepSize, bool IsBoundaryIncluded, int nBins) 28 | { 29 | if(cellSize<=0) 30 | { 31 | cout<<"The cell size must be positive!"<Max) 71 | { 72 | Max = magsrc.pData[offset+j]; 73 | gradient.pData[i*2] = imdx.pData[offset+j]/Max; 74 | gradient.pData[i*2+1] = imdy.pData[offset+j]/Max; 75 | } 76 | } 77 | mag.pData[i] = Max; 78 | } 79 | 80 | // get the pixel-wise energy for each orientation band 81 | FImage imband(width,height,nBins); 82 | float theta = M_PI*2/nBins; 83 | float _cos,_sin,temp; 84 | for(int k = 0;k1) 92 | temp = pow(temp,alpha); 93 | imband.pData[i*nBins+k] = temp*mag.pData[i]; 94 | } 95 | } 96 | 97 | // filter out the SIFT feature 98 | FImage filter(cellSize*2+1,1); 99 | filter[0] = filter[cellSize+1] = 0.25; 100 | for(int i = 1;i=width) 146 | // x = __min(__max(x,0),width-1); 147 | //if (y<0 || y>=height) 148 | // y= __min(__max(y,0),height-1); 149 | 150 | memcpy(sift_cell.pData + count*nBins, imband_cell.pData + (y*width + x)*nBins, sizeof(float)*nBins); 151 | count++; 152 | } 153 | } 154 | // normalize the SIFT descriptor 155 | #ifdef WITH_SSE 156 | int offset = (i*sift_width + j)*siftdim; 157 | //memcpy(imsift.pData+offset,sift_cell.pData,sizeof(float)*siftdim); 158 | unsigned char* dst = imsift.pData + offset; 159 | // 160 | hu_m128* src = (hu_m128*)sift_cell.pData; 161 | hu_m128 r0, r1, r2, r3, r4; 162 | r0.m = _mm_set_ps1(0); 163 | for (int ii = 0; ii < siftdim / 4; ii++){ 164 | r1.m = _mm_mul_ps(src->m, src->m); 165 | r0.m = _mm_add_ps(r0.m, r1.m); 166 | src++; 167 | } 168 | float mag = sqrt(r0.m128_f32[0] + r0.m128_f32[1] + r0.m128_f32[2] + r0.m128_f32[3]); 169 | // 170 | hu_m128 _vmag; 171 | _vmag.m= _mm_set_ps1(mag); 172 | src = (hu_m128*)sift_cell.pData; 173 | for (int ii = 0; ii < siftdim / 4;ii++){ 174 | r1.m = _mm_add_ps(_vmag.m, _v1.m); 175 | r2.m = _mm_div_ps(src->m, r1.m); 176 | r3.m = _mm_mul_ps(r2.m, _v5.m); 177 | r4.m = _mm_min_ps(r3.m, _v5.m); 178 | dst[0] = r4.m128_f32[0]; 179 | dst[1] = r4.m128_f32[1]; 180 | dst[2] = r4.m128_f32[2]; 181 | dst[3] = r4.m128_f32[3]; 182 | dst += 4; 183 | src++; 184 | } 185 | #else 186 | float mag = sqrt(sift_cell.norm2()); 187 | int offset = (i*sift_width + j)*siftdim; 188 | //memcpy(imsift.pData+offset,sift_cell.pData,sizeof(float)*siftdim); 189 | for (int k = 0; k < siftdim; k++) 190 | imsift.pData[offset + k] = (unsigned char)__min(sift_cell.pData[k] / (mag + 0.01) * 255, 255);//(unsigned char) __min(sift_cell.pData[k]/mag*512,255); 191 | #endif 192 | }//*/ 193 | } 194 | } 195 | 196 | 197 | //-------------------------------------------------------------------------------------------------- 198 | // multi-scale SIFT features 199 | //-------------------------------------------------------------------------------------------------- 200 | template 201 | void ImageFeature::imSIFT(const Image& imsrc, UCImage &imsift, const vector cellSizeVect, int stepSize, bool IsBoundaryIncluded, int nBins) 202 | { 203 | // this parameter controls decay of the gradient energy falls into a bin 204 | // run SIFT_weightFunc.m to see why alpha = 9 is the best value 205 | int alpha = 9; 206 | 207 | int width = imsrc.width(), height = imsrc.height(), nchannels = imsrc.nchannels(); 208 | int nPixels = width*height; 209 | FImage imdx(width, height, nchannels), imdy(width, height, nchannels); 210 | // compute the derivatives; 211 | #if 0 212 | imsrc.dx(imdx, true); 213 | imsrc.dy(imdy, true); 214 | #else 215 | // sobel, more robust 216 | float xKernel[9] = { -1, 0, 1, -2, 0, 2, -1, 0, 1 }; 217 | float yKernel[9] = { -1, -2, -1, 0, 0, 0, 1, 2, 1 }; 218 | ImageProcessing::filtering(imsrc.pData, imdx.pData, width, height, nchannels, xKernel, 1); 219 | ImageProcessing::filtering(imsrc.pData, imdy.pData, width, height, nchannels, yKernel, 1); 220 | #endif 221 | 222 | // get the maximum gradient over the channels and estimate the normalized gradient 223 | FImage magsrc(width,height,nchannels),mag(width,height),gradient(width,height,2); 224 | float Max; 225 | for(int i=0;iMax) 239 | { 240 | Max = magsrc.pData[offset+j]; 241 | gradient.pData[i*2] = imdx.pData[offset+j]/Max; 242 | gradient.pData[i*2+1] = imdy.pData[offset+j]/Max; 243 | } 244 | } 245 | mag.pData[i] = Max; 246 | } 247 | 248 | // get the pixel-wise energy for each orientation band 249 | FImage imband(width,height,nBins); 250 | float theta = M_PI*2/nBins; 251 | float _cos,_sin,temp; 252 | for(int k = 0;k1) 260 | temp = pow(temp,alpha); 261 | imband.pData[i*nBins+k] = temp*mag.pData[i]; 262 | } 263 | } 264 | // get the maximum cell size 265 | int maxCellSize = cellSizeVect[0]; 266 | int nScales = cellSizeVect.size(); 267 | for(int h=1;h=width) 323 | // x = __min(__max(x,0),width-1); 324 | //if (y<0 || y>=height) 325 | // y= __min(__max(y,0),height-1); 326 | 327 | memcpy(sift_cell.pData+count*nBins,imband_cell.pData+(y*width+x)*nBins,sizeof(float)*nBins); 328 | count++; 329 | } 330 | // normalize the SIFT descriptor 331 | float mag = sqrt(sift_cell.norm2()); 332 | int offset = (i*sift_width+j)*siftdim*nScales+h*siftdim; 333 | //memcpy(imsift.pData+offset,sift_cell.pData,sizeof(float)*siftdim); 334 | for(int k = 0;k 9 | 10 | #ifdef WITH_SSE 11 | #include 12 | #endif 13 | 14 | template 15 | inline void* xmalloc(T size){ 16 | #ifdef WITH_SSE 17 | #ifdef WIN32 18 | return _aligned_malloc(size, 32); 19 | #else 20 | return memalign(32, size); 21 | #endif 22 | #else 23 | return malloc(size); 24 | #endif 25 | } 26 | 27 | template 28 | inline void xfree(T* ptr){ 29 | #if defined(WITH_SSE) && defined(WIN32) 30 | _aligned_free(ptr); 31 | #else 32 | free(ptr); 33 | #endif 34 | } 35 | 36 | #ifdef WITH_SSE 37 | 38 | // for windows and linux 39 | typedef union _m128{ 40 | __m128 m; 41 | __m128i mi; 42 | float m128_f32[4]; 43 | unsigned short m128i_u16[8]; 44 | }hu_m128; 45 | 46 | #endif 47 | 48 | class ImageIO 49 | { 50 | public: 51 | enum ImageType{standard, derivative, normalized}; 52 | ImageIO(void); 53 | ~ImageIO(void); 54 | public: 55 | template 56 | static bool loadImage(const char* filename,T*& pImagePlane,int& width,int& height, int& nchannels); 57 | template 58 | static bool saveImage(const char* filename,const T* pImagePlane,int width,int height, int nchannels,ImageType imtype = standard); 59 | template 60 | static void showImage(const char* winname, const T* pImagePlane, int width, int height, int nchannels, ImageType imtype = standard, int waittime = 1); 61 | template 62 | static void showGrayImageAsColor(const char* winname, const unsigned char* pImagePlane, int width, int height, T minV, T maxV, int waittime = 1); 63 | template 64 | static cv::Mat CvmatFromPixels(const T* pImagePlane, int width, int height, int nchannels, ImageType imtype = standard); 65 | template 66 | static void CvmatToPixels(const cv::Mat& cvInImg, T*& pOutImagePlane, int& width, int& height, int& nchannels); 67 | private: 68 | }; 69 | 70 | template 71 | bool ImageIO::loadImage(const char *filename, T *&pImagePlane, int &width, int &height, int &nchannels) 72 | { 73 | cv::Mat im = cv::imread(filename); 74 | if (im.data == NULL){ 75 | return false; 76 | } 77 | pImagePlane = (T*)xmalloc(sizeof(T) * im.total() * im.elemSize()); 78 | CvmatToPixels(im, pImagePlane, width, height, nchannels); 79 | return true; 80 | } 81 | 82 | template 83 | bool ImageIO::saveImage(const char* filename,const T* pImagePlane,int width,int height, int nchannels,ImageType imtype) 84 | { 85 | cv::Mat img = CvmatFromPixels(pImagePlane, width, height, nchannels, imtype); 86 | return cv::imwrite(filename, img); 87 | } 88 | 89 | template 90 | void ImageIO::showImage(const char* winname, const T* pImagePlane, int width, int height, int nchannels, 91 | ImageType imtype /*= standard*/, int waittime /*= 1*/) 92 | { 93 | cv::Mat img = CvmatFromPixels(pImagePlane, width, height, nchannels, imtype); 94 | cv::imshow(winname, img); 95 | cv::waitKey(waittime); 96 | } 97 | 98 | template 99 | void ImageIO::showGrayImageAsColor(const char* winname, const unsigned char* pImagePlane, int width, int height, 100 | T minV, T maxV, int waittime /*= 1*/) 101 | { 102 | CColorTable colorTbl; 103 | 104 | // check whether the type is float point 105 | bool IsFloat = false; 106 | if (typeid(T) == typeid(double) || typeid(T) == typeid(float) || typeid(T) == typeid(long double)) 107 | IsFloat = true; 108 | 109 | cv::Mat im; 110 | im.create(height, width, CV_8UC3); 111 | for (int i = 0; i < height; i++){ 112 | for (int j = 0; j < width; j++){ 113 | unsigned char grayVal = pImagePlane[i*width + j]; 114 | if (IsFloat){ 115 | grayVal = pImagePlane[i*width + j] * 255; 116 | } 117 | memcpy(im.data + i*im.step + j * 3, colorTbl[grayVal], 3); 118 | } 119 | } 120 | 121 | // show range 122 | char info[256]; 123 | if (IsFloat) 124 | sprintf(info, "[%.3f, %.3f]", (float)minV, (float)maxV); 125 | else 126 | sprintf(info, "[%d, %d]", (int)minV, (int)maxV); 127 | cv::putText(im, info, cvPoint(10, 20), CV_FONT_HERSHEY_SIMPLEX, 0.5, cvScalar(255, 255, 255)); 128 | 129 | // 130 | cv::imshow(winname, im); 131 | cv::waitKey(waittime); 132 | } 133 | 134 | template 135 | cv::Mat ImageIO::CvmatFromPixels(const T* pImagePlane, int width, int height, int nchannels, ImageType imtype /*= standard*/) 136 | { 137 | cv::Mat im; 138 | switch (nchannels){ 139 | case 1: 140 | im.create(height, width, CV_8UC1); 141 | break; 142 | case 3: 143 | im.create(height, width, CV_8UC3); 144 | break; 145 | case 4: 146 | im.create(height, width, CV_8UC4); 147 | break; 148 | default: 149 | return im; 150 | } 151 | // check whether the type is float point 152 | bool IsFloat = false; 153 | if (typeid(T) == typeid(double) || typeid(T) == typeid(float) || typeid(T) == typeid(long double)) 154 | IsFloat = true; 155 | 156 | double Max, Min; 157 | int nElements = width*height*nchannels; 158 | switch (imtype){ 159 | case standard: 160 | break; 161 | case derivative: 162 | // find the max of the absolute value 163 | Max = pImagePlane[0]; 164 | for (int i = 0; i < nElements; i++) 165 | Max = __max(Max, fabs((double)pImagePlane[i])); 166 | Min = -Max; 167 | break; 168 | case normalized: 169 | Max = Min = pImagePlane[0]; 170 | for (int i = 0; i < nElements; i++) 171 | { 172 | Max = __max(Max, pImagePlane[i]); 173 | Min = __min(Min, pImagePlane[i]); 174 | } 175 | break; 176 | } 177 | if (typeid(T) == typeid(unsigned char) && imtype == standard) 178 | { 179 | for (int i = 0; i < height; i++) 180 | memcpy(im.data + i*im.step, pImagePlane + i*im.step, width*nchannels); 181 | } 182 | else 183 | { 184 | for (int i = 0; i < height; i++) 185 | { 186 | int offset1 = i*width*nchannels; 187 | int offset2 = i*im.step; 188 | for (int j = 0; j < im.step; j++) 189 | { 190 | switch (imtype){ 191 | case standard: 192 | if (IsFloat) 193 | im.data[offset2 + j] = pImagePlane[offset1 + j] * 255; 194 | else 195 | im.data[offset2 + j] = __max(__min(pImagePlane[offset1 + j], 255), 0); 196 | break; 197 | case derivative: 198 | case normalized: 199 | im.data[offset2 + j] = ((double)pImagePlane[offset1 + j] - Min) / (Max - Min) * 255; 200 | break; 201 | } 202 | } 203 | } 204 | } 205 | 206 | // show range 207 | if (imtype == derivative || imtype == normalized){ 208 | char info[256]; 209 | if (IsFloat) 210 | sprintf(info, "[%.3f, %.3f]", Min, Max); 211 | else 212 | sprintf(info, "[%d, %d]", (int)Min, (int)Max); 213 | cv::putText(im, info, cvPoint(10, 20), CV_FONT_HERSHEY_SIMPLEX, 0.5, cvScalar(255, 255, 255)); 214 | } 215 | 216 | return im; 217 | } 218 | 219 | template 220 | void ImageIO::CvmatToPixels(const cv::Mat& cvInImg, T*& pOutImagePlane, int& width, int& height, int& nchannels) 221 | { 222 | if (cvInImg.data == NULL) // if allocation fails 223 | return; 224 | if (cvInImg.type() != CV_8UC1 && cvInImg.type() != CV_8UC3 && cvInImg.type() != CV_8UC4) // we only support three types of image information for now 225 | return; 226 | width = cvInImg.size().width; 227 | height = cvInImg.size().height; 228 | nchannels = cvInImg.channels(); 229 | 230 | if (typeid(T) == typeid(unsigned char)) 231 | { 232 | for (int i = 0; i < height; i++) 233 | memcpy(pOutImagePlane + i*cvInImg.step, cvInImg.data + i*cvInImg.step, width*nchannels); 234 | return; 235 | } 236 | 237 | // check whether the type is float point 238 | bool IsFloat = false; 239 | if (typeid(T) == typeid(double) || typeid(T) == typeid(float) || typeid(T) == typeid(long double)) 240 | IsFloat = true; 241 | 242 | for (int i = 0; i < height; i++) 243 | { 244 | int offset1 = i*width*nchannels; 245 | int offset2 = i*cvInImg.step; 246 | for (int j = 0; j < width*nchannels; j++) 247 | { 248 | if (IsFloat) 249 | pOutImagePlane[offset1 + j] = (T)cvInImg.data[offset2 + j] / 255; 250 | else 251 | pOutImagePlane[offset1 + j] = cvInImg.data[offset2 + j]; 252 | } 253 | } 254 | return; 255 | } 256 | 257 | /* 258 | #include 259 | #include 260 | #include 261 | #include "math.h" 262 | //----------------------------------------------------------------------------------------- 263 | // this class is a wrapper to use QImage to load image into image planes 264 | //----------------------------------------------------------------------------------------- 265 | 266 | class ImageIO 267 | { 268 | public: 269 | enum ImageType{standard, derivative, normalized}; 270 | ImageIO(void); 271 | ~ImageIO(void); 272 | public: 273 | template 274 | static void loadImage(const QImage& image,T*& pImagePlane,int& width,int& height,int& nchannels); 275 | template 276 | static bool loadImage(const QString& filename,T*& pImagePlane,int& width,int& height,int& nchannels); 277 | 278 | template 279 | static unsigned char convertPixel(const T& value,bool IsFloat,ImageType type,T& _Max,T& _Min); 280 | 281 | template 282 | static bool writeImage(const QString& filename, const T*& pImagePlane,int width,int height,int nchannels,ImageType type=standard,int quality=-1); 283 | 284 | template 285 | static bool writeImage(const QString& filename,const T* pImagePlane,int width,int height,int nchannels,T min, T max,int quality=-1); 286 | 287 | }; 288 | 289 | template 290 | void ImageIO::loadImage(const QImage& image, T*& pImagePlane,int& width,int& height,int& nchannels) 291 | { 292 | // get the image information 293 | width=image.width(); 294 | height=image.height(); 295 | nchannels=3; 296 | pImagePlane=new T[width*height*nchannels]; 297 | 298 | // check whether the type is float point 299 | bool IsFloat=false; 300 | if(typeid(T)==typeid(double) || typeid(T)==typeid(float) || typeid(T)==typeid(long double)) 301 | IsFloat=true; 302 | 303 | const unsigned char* plinebuffer; 304 | for(int i=0;i 326 | bool ImageIO::loadImage(const QString&filename, T*& pImagePlane,int& width,int& height,int& nchannels) 327 | { 328 | QImage image; 329 | if(image.load(filename)==false) 330 | return false; 331 | if(image.format()!=QImage::Format_RGB32) 332 | { 333 | QImage temp=image.convertToFormat(QImage::Format_RGB32); 334 | image=temp; 335 | } 336 | loadImage(image,pImagePlane,width,height,nchannels); 337 | return true; 338 | } 339 | 340 | template 341 | bool ImageIO::writeImage(const QString& filename, const T*& pImagePlane,int width,int height,int nchannels,ImageType type,int quality) 342 | { 343 | int nPixels=width*height,nElements; 344 | nElements=nPixels*nchannels; 345 | unsigned char* pTempBuffer; 346 | pTempBuffer=new unsigned char[nPixels*4]; 347 | memset(pTempBuffer,0,nPixels*4); 348 | 349 | // check whether the type is float point 350 | bool IsFloat=false; 351 | if(typeid(T)==typeid(double) || typeid(T)==typeid(float) || typeid(T)==typeid(long double)) 352 | IsFloat=true; 353 | 354 | T _Max=0,_Min=0; 355 | switch(type){ 356 | case standard: 357 | break; 358 | case derivative: 359 | _Max=0; 360 | for(int i=0;i=3) 381 | { 382 | pTempBuffer[i*4]=convertPixel(pImagePlane[i*nchannels],IsFloat,type,_Max,_Min); 383 | pTempBuffer[i*4+1]=convertPixel(pImagePlane[i*nchannels+1],IsFloat,type,_Max,_Min); 384 | pTempBuffer[i*4+2]=convertPixel(pImagePlane[i*nchannels+2],IsFloat,type,_Max,_Min); 385 | } 386 | else 387 | for (int j=0;j<3;j++) 388 | pTempBuffer[i*4+j]=convertPixel(pImagePlane[i*nchannels],IsFloat,type,_Max,_Min); 389 | pTempBuffer[i*4+3]=255; 390 | } 391 | QImage *pQImage=new QImage(pTempBuffer,width,height,QImage::Format_RGB32); 392 | bool result= pQImage->save(filename,0,quality); 393 | delete pQImage; 394 | delete pTempBuffer; 395 | return result; 396 | } 397 | 398 | template 399 | bool ImageIO::writeImage(const QString& filename, const T* pImagePlane,int width,int height,int nchannels,T min,T max,int quality) 400 | { 401 | int nPixels=width*height,nElements; 402 | nElements=nPixels*nchannels; 403 | unsigned char* pTempBuffer; 404 | pTempBuffer=new unsigned char[nPixels*4]; 405 | memset(pTempBuffer,0,nPixels*4); 406 | 407 | // check whether the type is float point 408 | bool IsFloat=false; 409 | if(typeid(T)==typeid(double) || typeid(T)==typeid(float) || typeid(T)==typeid(long double)) 410 | IsFloat=true; 411 | 412 | T _Max=max,_Min=min; 413 | 414 | for(int i=0;i=3) 417 | { 418 | pTempBuffer[i*4]=convertPixel(pImagePlane[i*nchannels],IsFloat,normalized,_Max,_Min); 419 | pTempBuffer[i*4+1]=convertPixel(pImagePlane[i*nchannels+1],IsFloat,normalized,_Max,_Min); 420 | pTempBuffer[i*4+2]=convertPixel(pImagePlane[i*nchannels+2],IsFloat,normalized,_Max,_Min); 421 | } 422 | else 423 | for (int j=0;j<3;j++) 424 | pTempBuffer[i*4+j]=convertPixel(pImagePlane[i*nchannels],IsFloat,normalized,_Max,_Min); 425 | pTempBuffer[i*4+3]=255; 426 | } 427 | QImage *pQImage=new QImage(pTempBuffer,width,height,QImage::Format_RGB32); 428 | bool result= pQImage->save(filename,0,quality); 429 | delete pQImage; 430 | delete pTempBuffer; 431 | return result; 432 | } 433 | 434 | template 435 | unsigned char ImageIO::convertPixel(const T& value,bool IsFloat,ImageType type,T& _Max,T& _Min) 436 | { 437 | switch(type){ 438 | case standard: 439 | if(IsFloat) 440 | return __max(__min(value*255,255),0); 441 | else 442 | return __max(__min(value,255),0); 443 | break; 444 | case derivative: 445 | return (double)((double)value/_Max+1)/2*255; 446 | break; 447 | case normalized: 448 | return (double)(value-_Min)/(_Max-_Min)*255; 449 | break; 450 | } 451 | return 0; 452 | } 453 | //*/ 454 | #endif -------------------------------------------------------------------------------- /include/CPM_include/ImageProcessing.h: -------------------------------------------------------------------------------- 1 | #ifndef _ImageProcessing_h 2 | #define _ImageProcessing_h 3 | 4 | #include "math.h" 5 | #include "stdio.h" 6 | #include "stdlib.h" 7 | #include "project.h" 8 | #include 9 | 10 | //---------------------------------------------------------------------------------- 11 | // class to handle basic image processing functions 12 | // this is a collection of template functions. These template functions are 13 | // used in other image classes such as BiImage, IntImage and FImage 14 | //---------------------------------------------------------------------------------- 15 | enum InterType{ INTER_NN, INTER_LINEAR }; 16 | 17 | class ImageProcessing 18 | { 19 | public: 20 | ImageProcessing(void); 21 | ~ImageProcessing(void); 22 | public: 23 | 24 | // basic functions 25 | template 26 | static inline T EnforceRange(const T& x,const int& MaxValue) {return __min(__max(x,0),MaxValue-1);}; 27 | 28 | // Values for L are in the range[0, 100] while a and b are roughly in the range[-110, 110]. 29 | template 30 | static void BGR2Lab(T1* pSrcImage, T2* pDstImage, int width, int height); 31 | 32 | //--------------------------------------------------------------------------------- 33 | // function to interpolate the image plane 34 | //--------------------------------------------------------------------------------- 35 | template 36 | static inline void BilinearInterpolate(const T1* pImage,int width,int height,int nChannels,float x,float y,T2* result); 37 | 38 | template 39 | static inline T1 BilinearInterpolate(const T1* pImage,int width,int height,float x,float y); 40 | 41 | // the transpose of bilinear interpolation 42 | template 43 | static inline void BilinearInterpolate_transpose(const T1* pImage,int width,int height,int nChannels,float x,float y,T2* result); 44 | 45 | template 46 | static inline T1 BilinearInterpolate_transpose(const T1* pImage,int width,int height,float x,float y); 47 | 48 | template 49 | static void ResizeImage(const T1* pSrcImage,T2* pDstImage,int SrcWidth,int SrcHeight,int nChannels,float Ratio, InterType type = INTER_LINEAR); 50 | 51 | template 52 | static void ResizeImage(const T1* pSrcImage, T2* pDstImage, int SrcWidth, int SrcHeight, int nChannels, int DstWidth, int DstHeight, InterType type = INTER_LINEAR); 53 | 54 | //--------------------------------------------------------------------------------- 55 | // functions for 1D filtering 56 | //--------------------------------------------------------------------------------- 57 | template 58 | static void hfiltering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const float* pfilter1D,int fsize); 59 | 60 | template 61 | static void vfiltering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const float* pfilter1D,int fsize); 62 | 63 | template 64 | static void hfiltering_transpose(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const float* pfilter1D,int fsize); 65 | 66 | template 67 | static void vfiltering_transpose(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const float* pfilter1D,int fsize); 68 | 69 | //--------------------------------------------------------------------------------- 70 | // functions for 2D filtering 71 | //--------------------------------------------------------------------------------- 72 | template 73 | static void filtering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const float* pfilter2D,int fsize); 74 | 75 | template 76 | static void filtering_transpose(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const float* pfilter2D,int fsize); 77 | 78 | template 79 | static void Laplacian(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels); 80 | 81 | template 82 | static void Medianfiltering(const T1* pSrcImage, T2* pDstImage, int width, int height, int nChannels, int fsize); 83 | 84 | template 85 | static void Integral(const T1* pSrcImage, T2* pDstImage, int width, int height, int nChannels); 86 | 87 | template // O(1) time box filtering using cumulative sum 88 | static void BoxFilter(const T1* pSrcImage, T2* pDstImage, int width, int height, int nChannels, int r, bool norm = true); 89 | 90 | //--------------------------------------------------------------------------------- 91 | // functions for sample a patch from the image 92 | //--------------------------------------------------------------------------------- 93 | template 94 | static void getPatch(const T1* pSrcImgae,T2* pPatch,int width,int height,int nChannels,float x,float y,int wsize); 95 | 96 | //--------------------------------------------------------------------------------- 97 | // function to warp image 98 | //--------------------------------------------------------------------------------- 99 | template 100 | static void warpImage(T1* pWarpIm2,const T1* pIm1,const T1* pIm2,const T2* pVx,const T2* pVy,int width,int height,int nChannels); 101 | 102 | template 103 | static void warpImageFlow(T1* pWarpIm2,const T1* pIm1,const T1* pIm2,const T2* pFlow,int width,int height,int nChannels); 104 | 105 | template 106 | static void warpImage(T1* pWarpIm2,const T1* pIm2,const T2* pVx,const T2* pVy,int width,int height,int nChannels); 107 | 108 | template 109 | static void warpImage_transpose(T1* pWarpIm2,const T1* pIm2,const T2* pVx,const T2* pVy,int width,int height,int nChannels); 110 | 111 | template 112 | static void warpImage(T1* pWarpIm2,const T1* pIm2,const T2*flow,int width,int height,int nChannels); 113 | 114 | template 115 | static void warpImage_transpose(T1* pWarpIm2,const T1* pIm2,const T2* flow,int width,int height,int nChannels); 116 | 117 | template 118 | static void warpImage(T1 *pWarpIm2, T3* pMask,const T1 *pIm1, const T1 *pIm2, const T2 *pVx, const T2 *pVy, int width, int height, int nChannels); 119 | 120 | 121 | //--------------------------------------------------------------------------------- 122 | // function to crop an image 123 | //--------------------------------------------------------------------------------- 124 | template 125 | static void cropImage(const T1* pSrcImage,int SrcWidth,int SrcHeight,int nChannels,T2* pDstImage,int Left,int Top,int DstWidth,int DstHeight); 126 | //--------------------------------------------------------------------------------- 127 | 128 | //--------------------------------------------------------------------------------- 129 | // function to generate a 2D Gaussian 130 | //--------------------------------------------------------------------------------- 131 | template 132 | static void generate2DGaussian(T*& pImage,int wsize,float sigma=-1); 133 | 134 | template 135 | static void generate1DGaussian(T*& pImage,int wsize,float sigma=-1); 136 | 137 | }; 138 | 139 | template 140 | void ImageProcessing::BGR2Lab(T1* pSrcImage, T2* pDstImage, int width, int height) 141 | { 142 | float normFactor = 1.f; 143 | if (typeid(T1) == typeid(unsigned char)){ 144 | normFactor = 255.f; 145 | } 146 | T1* pBGR = pSrcImage; 147 | T2* pLab = pDstImage; 148 | const int npix = width*height; 149 | 150 | const float T = 0.008856; 151 | const float color_attenuation = 1.5f; 152 | int i; 153 | for (i = 0; i < npix; i++){ 154 | const float b = pBGR[0] / normFactor; 155 | const float g = pBGR[1] / normFactor; 156 | const float r = pBGR[2] / normFactor; 157 | float X = 0.412453 * r + 0.357580 * g + 0.180423 * b; 158 | float Y = 0.212671 * r + 0.715160 * g + 0.072169 * b; 159 | float Z = 0.019334 * r + 0.119193 * g + 0.950227 * b; 160 | X /= 0.950456; 161 | Z /= 1.088754; 162 | float Y3 = pow(Y, 1. / 3); 163 | float fX = X > T ? pow(X, 1. / 3) : 7.787 * X + 16 / 116.; 164 | float fY = Y > T ? Y3 : 7.787 * Y + 16 / 116.; 165 | float fZ = Z > T ? pow(Z, 1. / 3) : 7.787 * Z + 16 / 116.; 166 | float L = Y > T ? 116 * Y3 - 16.0 : 903.3 * Y; 167 | float A = 500 * (fX - fY); 168 | float B = 200 * (fY - fZ); 169 | // correct L*a*b*: dark area or light area have less reliable colors 170 | float correct_lab = exp(-color_attenuation*pow(pow(L / 100, 2) - 0.6, 2)); 171 | pLab[0] = L; 172 | pLab[1] = A*correct_lab; 173 | pLab[2] = B*correct_lab; 174 | #if 0 175 | // considering the Values for L are in the range[0, 100] while a and b are roughly in the range[-110, 110], 176 | // normalize to [0,1] 177 | pLab[0] /= 220.; 178 | pLab[1] = (pLab[1] + 110) / 220.; 179 | pLab[2] = (pLab[2] + 110) / 220.; 180 | #endif 181 | // 182 | pBGR += 3; 183 | pLab += 3; 184 | } 185 | } 186 | 187 | //-------------------------------------------------------------------------------------------------- 188 | // function to interpolate multi-channel image plane for (x,y) 189 | // -------------------------------------------------------------------------------------------------- 190 | template 191 | inline void ImageProcessing::BilinearInterpolate(const T1* pImage,int width,int height,int nChannels,float x,float y,T2* result) 192 | { 193 | int xx,yy,m,n,u,v,l,offset; 194 | xx=x; 195 | yy=y; 196 | float dx,dy,s; 197 | dx=__max(__min(x-xx,1),0); 198 | dy=__max(__min(y-yy,1),0); 199 | 200 | memset(result, 0, sizeof(T2)*nChannels); 201 | for(m=0;m<=1;m++) 202 | for(n=0;n<=1;n++) 203 | { 204 | u=EnforceRange(xx+m,width); 205 | v=EnforceRange(yy+n,height); 206 | offset=(v*width+u)*nChannels; 207 | s=fabs(1-m-dx)*fabs(1-n-dy); 208 | for(l=0;l 214 | inline T1 ImageProcessing::BilinearInterpolate(const T1* pImage,int width,int height,float x,float y) 215 | { 216 | int xx,yy,m,n,u,v,l,offset; 217 | xx=x; 218 | yy=y; 219 | float dx,dy,s; 220 | dx=__max(__min(x-xx,1),0); 221 | dy=__max(__min(y-yy,1),0); 222 | 223 | T1 result=0; 224 | for(m=0;m<=1;m++) 225 | for(n=0;n<=1;n++) 226 | { 227 | u=EnforceRange(xx+m,width); 228 | v=EnforceRange(yy+n,height); 229 | offset=v*width+u; 230 | s=fabs(1-m-dx)*fabs(1-n-dy); 231 | result+=pImage[offset]*s; 232 | } 233 | return result; 234 | } 235 | 236 | 237 | //-------------------------------------------------------------------------------------------------- 238 | // function to interpolate multi-channel image plane for (x,y) 239 | // -------------------------------------------------------------------------------------------------- 240 | template 241 | inline void ImageProcessing::BilinearInterpolate_transpose(const T1* pInput,int width,int height,int nChannels,float x,float y,T2* pDstImage) 242 | { 243 | int xx,yy,m,n,u,v,l,offset; 244 | xx=x; 245 | yy=y; 246 | float dx,dy,s; 247 | dx=__max(__min(x-xx,1),0); 248 | dy=__max(__min(y-yy,1),0); 249 | 250 | for(m=0;m<=1;m++) 251 | for(n=0;n<=1;n++) 252 | { 253 | u=EnforceRange(xx+m,width); 254 | v=EnforceRange(yy+n,height); 255 | offset=(v*width+u)*nChannels; 256 | s=fabs(1-m-dx)*fabs(1-n-dy); 257 | for(l=0;l 267 | void ImageProcessing::ResizeImage(const T1* pSrcImage, T2* pDstImage, int SrcWidth, int SrcHeight, int nChannels, float Ratio, InterType type/* = INTER_LINEAR*/) 268 | { 269 | int DstWidth,DstHeight; 270 | DstWidth=(float)SrcWidth*Ratio; 271 | DstHeight=(float)SrcHeight*Ratio; 272 | memset(pDstImage,0,sizeof(T2)*DstWidth*DstHeight*nChannels); 273 | 274 | float x,y; 275 | 276 | if (type == INTER_LINEAR){ 277 | for (int i = 0; i < DstHeight; i++) 278 | for (int j = 0; j < DstWidth; j++) 279 | { 280 | x = (float)(j + 1) / Ratio - 1; 281 | y = (float)(i + 1) / Ratio - 1; 282 | 283 | // bilinear interpolation 284 | BilinearInterpolate(pSrcImage, SrcWidth, SrcHeight, nChannels, x, y, pDstImage + (i*DstWidth + j)*nChannels); 285 | } 286 | }else if (type == INTER_NN){ 287 | int ix, iy; 288 | for (int i = 0; i < DstHeight; i++) 289 | for (int j = 0; j < DstWidth; j++) 290 | { 291 | x = (float)(j + 1) / Ratio - 1; 292 | y = (float)(i + 1) / Ratio - 1; 293 | ix = EnforceRange(x + 0.5, SrcWidth); 294 | iy = EnforceRange(y + 0.5, SrcHeight); 295 | // nearest neighbor interpolation 296 | for (int c = 0; c < nChannels; c++){ 297 | pDstImage[(i*DstWidth + j)*nChannels + c] = pSrcImage[(iy*SrcWidth + ix)*nChannels + c]; 298 | } 299 | } 300 | } 301 | } 302 | 303 | template 304 | void ImageProcessing::ResizeImage(const T1 *pSrcImage, T2 *pDstImage, int SrcWidth, int SrcHeight, int nChannels, int DstWidth, int DstHeight, InterType type/* = INTER_LINEAR*/) 305 | { 306 | float xRatio=(float)DstWidth/SrcWidth; 307 | float yRatio=(float)DstHeight/SrcHeight; 308 | memset(pDstImage, 0, sizeof(T2)*DstWidth*DstHeight*nChannels); 309 | 310 | float x,y; 311 | 312 | if (type == INTER_LINEAR){ 313 | for (int i = 0; i < DstHeight; i++) 314 | for (int j = 0; j < DstWidth; j++) 315 | { 316 | x = (float)(j + 1) / xRatio - 1; 317 | y = (float)(i + 1) / yRatio - 1; 318 | 319 | // bilinear interpolation 320 | BilinearInterpolate(pSrcImage, SrcWidth, SrcHeight, nChannels, x, y, pDstImage + (i*DstWidth + j)*nChannels); 321 | } 322 | }else if (type == INTER_NN){ 323 | int ix, iy; 324 | for (int i = 0; i < DstHeight; i++) 325 | for (int j = 0; j < DstWidth; j++) 326 | { 327 | x = (float)(j + 1) / xRatio - 1; 328 | y = (float)(i + 1) / yRatio - 1; 329 | ix = EnforceRange(x + 0.5, SrcWidth); 330 | iy = EnforceRange(y + 0.5, SrcHeight); 331 | 332 | // nearest neighbor interpolation 333 | for (int c = 0; c < nChannels; c++){ 334 | pDstImage[(i*DstWidth + j)*nChannels + c] = pSrcImage[(iy*SrcWidth + ix)*nChannels + c]; 335 | } 336 | } 337 | } 338 | } 339 | 340 | //------------------------------------------------------------------------------------------------------------ 341 | // horizontal direction filtering 342 | //------------------------------------------------------------------------------------------------------------ 343 | template 344 | void ImageProcessing::hfiltering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const float* pfilter1D,int fsize) 345 | { 346 | memset(pDstImage,0,sizeof(T2)*width*height*nChannels); 347 | T2* pBuffer; 348 | float w; 349 | int i,j,l,k,offset,jj; 350 | for(i=0;i 369 | void ImageProcessing::hfiltering_transpose(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const float* pfilter1D,int fsize) 370 | { 371 | memset(pDstImage,0,sizeof(T2)*width*height*nChannels); 372 | const T1* pBuffer; 373 | float w; 374 | int i,j,l,k,offset,jj; 375 | for(i=0;i 394 | void ImageProcessing::Laplacian(const T1 *pSrcImage, T2 *pDstImage, int width, int height, int nChannels) 395 | { 396 | int LineWidth=width*nChannels; 397 | int nElements=width*height*nChannels; 398 | // first treat the corners 399 | for(int k=0;k 430 | void ImageProcessing::Medianfiltering(const T1* pSrcImage, T2* pDstImage, int width, int height, int nChannels, int fsize) 431 | { 432 | T2* tmpImg = new T2[width*height*nChannels]; 433 | 434 | int regionSize = (2 * fsize + 1) * (2 * fsize + 1); 435 | T1* pTmpSrc = (T1*)malloc(regionSize * sizeof(T1)); 436 | T2* pBuffer = NULL; 437 | float w; 438 | int i, j, l, k, c, offset, ii, jj; 439 | for (i = 0; i < height; i++){ 440 | for (j = 0; j < width; j++){ 441 | pBuffer = tmpImg + (i*width + j)*nChannels; 442 | for (c = 0; c < nChannels; c++){ 443 | int idx = 0; 444 | for (l = -fsize; l <= fsize; l++){ 445 | for (k = -fsize; k <= fsize; k++){ 446 | ii = EnforceRange(i + l, height); 447 | jj = EnforceRange(j + k, width); 448 | pTmpSrc[idx++] = pSrcImage[(ii*width + jj)*nChannels + c]; 449 | } 450 | } 451 | // debug 452 | // printf("\n"); 453 | // for(int kk=0; kk 476 | void ImageProcessing::vfiltering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const float* pfilter1D,int fsize) 477 | { 478 | memset(pDstImage,0,sizeof(T2)*width*height*nChannels); 479 | T2* pBuffer; 480 | float w; 481 | int i,j,l,k,offset,ii; 482 | for(i=0;i 500 | void ImageProcessing::vfiltering_transpose(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const float* pfilter1D,int fsize) 501 | { 502 | memset(pDstImage,0,sizeof(T2)*width*height*nChannels); 503 | const T1* pBuffer; 504 | float w; 505 | int i,j,l,k,offset,ii; 506 | for(i=0;i 527 | void ImageProcessing::filtering(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const float* pfilter2D,int fsize) 528 | { 529 | float w; 530 | int i,j,u,v,k,ii,jj,wsize,offset; 531 | wsize=fsize*2+1; 532 | float* pBuffer=new float[nChannels]; 533 | for(i=0;i 559 | void ImageProcessing::filtering_transpose(const T1* pSrcImage,T2* pDstImage,int width,int height,int nChannels,const float* pfilter2D,int fsize) 560 | { 561 | float w; 562 | int i,j,u,v,k,ii,jj,wsize,offset; 563 | wsize=fsize*2+1; 564 | memset(pDstImage,0,sizeof(T2)*width*height*nChannels); 565 | for(i=0;i 584 | void ImageProcessing::Integral(const T1* pSrcImage, T2* pDstImage, int width, int height, int nChannels) 585 | { 586 | #if 0 587 | for (int i = 0; i < 10; i++){ 588 | for (int j = 0; j < 10; j++){ 589 | printf("%.2f ", pSrcImage[(i*width + j)*nChannels]); 590 | } 591 | printf("\n"); 592 | } 593 | #endif 594 | 595 | int ti, tj; 596 | double sum; 597 | for (int k = 0; k < nChannels; k++) 598 | { 599 | for (int i = 0; i < height; i++){ 600 | for (int j = 0; j < width; j++){ 601 | sum = pSrcImage[(i*width + j)*nChannels + k]; 602 | 603 | ti = i - 1; 604 | tj = j - 1; 605 | if (tj >= 0){ 606 | sum += pDstImage[(i*width + tj)*nChannels + k]; 607 | } 608 | if (ti >= 0){ 609 | sum += pDstImage[(ti*width + j)*nChannels + k]; 610 | } 611 | if (ti >= 0 && tj >= 0){ 612 | sum -= pDstImage[(ti*width + tj)*nChannels + k]; 613 | } 614 | 615 | pDstImage[(i*width + j)*nChannels + k] = sum; 616 | } 617 | } 618 | } 619 | 620 | #if 0 621 | printf("\n"); 622 | for (int i = 0; i < 10; i++){ 623 | for (int j = 0; j < 10; j++){ 624 | printf("%.2f ", pDstImage[(i*width + j)*nChannels]); 625 | } 626 | printf("\n"); 627 | } 628 | #endif 629 | } 630 | 631 | template 632 | void ImageProcessing::BoxFilter(const T1* pSrcImage, T2* pDstImage, int width, int height, int nChannels, int r, bool norm) 633 | { 634 | double* pBuffer = new double[width*height*nChannels]; 635 | Integral(pSrcImage, pBuffer, width, height, nChannels); 636 | 637 | int ti, tj; 638 | double sum; 639 | int starti, startj, endi, endj; 640 | for (int k = 0; k < nChannels; k++) 641 | { 642 | for (int i = 0; i < height; i++){ 643 | for (int j = 0; j < width; j++){ 644 | ti = EnforceRange(i + r, height); 645 | tj = EnforceRange(j + r, width); 646 | sum = pBuffer[(ti*width + tj)*nChannels + k]; 647 | 648 | starti = 0; 649 | startj = 0; 650 | endi = ti; 651 | endj = tj; 652 | 653 | ti = i - r - 1; 654 | tj = j - r - 1; 655 | 656 | if (ti >= 0){ 657 | sum -= pBuffer[(ti*width + endj)*nChannels + k]; 658 | starti = ti + 1; 659 | } 660 | if (tj >= 0){ 661 | sum -= pBuffer[(endi*width + tj)*nChannels + k]; 662 | startj = tj + 1; 663 | } 664 | if (ti >= 0 && tj >= 0){ 665 | sum += pBuffer[(ti*width + tj)*nChannels + k]; 666 | } 667 | 668 | int cnt = 1; 669 | if (norm){ // normalize 670 | cnt = (endi - starti + 1)*(endj - startj + 1); 671 | } 672 | 673 | pDstImage[(i*width + j)*nChannels + k] = sum / cnt; 674 | } 675 | } 676 | } 677 | delete []pBuffer; 678 | } 679 | 680 | //------------------------------------------------------------------------------------------------------------ 681 | // function to sample a patch from the source image 682 | //------------------------------------------------------------------------------------------------------------ 683 | template 684 | void ImageProcessing::getPatch(const T1* pSrcImage,T2* pPatch,int width,int height,int nChannels,float x0,float y0,int wsize) 685 | { 686 | // suppose pPatch has been allocated and cleared before calling the function 687 | int wlength=wsize*2+1; 688 | float x,y; 689 | for(int i=-wsize;i<=wsize;i++) 690 | for(int j=-wsize;j<=wsize;j++) 691 | { 692 | y=y0+i; 693 | x=x0+j; 694 | if(x<0 || x>width-1 || y<0 || y>height-1) 695 | continue; 696 | BilinearInterpolate(pSrcImage,width,height,nChannels,x,y,pPatch+((i+wsize)*wlength+j+wsize)*nChannels); 697 | } 698 | } 699 | 700 | //------------------------------------------------------------------------------------------------------------ 701 | // function to warp an image with respect to flow field 702 | // pWarpIm2 has to be allocated before hands 703 | //------------------------------------------------------------------------------------------------------------ 704 | template 705 | void ImageProcessing::warpImage(T1 *pWarpIm2, const T1 *pIm1, const T1 *pIm2, const T2 *pVx, const T2 *pVy, int width, int height, int nChannels) 706 | { 707 | memset(pWarpIm2,0,sizeof(T1)*width*height*nChannels); 708 | for(int i=0;iwidth-1 || y<0 || y>height-1) 717 | { 718 | for(int k=0;k 727 | void ImageProcessing::warpImageFlow(T1 *pWarpIm2, const T1 *pIm1, const T1 *pIm2, const T2 *pFlow, int width, int height, int nChannels) 728 | { 729 | memset(pWarpIm2,0,sizeof(T1)*width*height*nChannels); 730 | for(int i=0;iwidth-1 || y<0 || y>height-1) 739 | { 740 | for(int k=0;k 749 | void ImageProcessing::warpImage(T1 *pWarpIm2,const T1 *pIm2, const T2 *pVx, const T2 *pVy, int width, int height, int nChannels) 750 | { 751 | memset(pWarpIm2,0,sizeof(T1)*width*height*nChannels); 752 | for(int i=0;iwidth-1 || y<0 || y>height-1) 761 | continue; 762 | BilinearInterpolate(pIm2,width,height,nChannels,x,y,pWarpIm2+offset); 763 | } 764 | } 765 | 766 | template 767 | void ImageProcessing::warpImage_transpose(T1 *pWarpIm2,const T1 *pIm2, const T2 *pVx, const T2 *pVy, int width, int height, int nChannels) 768 | { 769 | memset(pWarpIm2,0,sizeof(T1)*width*height*nChannels); 770 | for(int i=0;iwidth-1 || y<0 || y>height-1) 779 | continue; 780 | //BilinearInterpolate(pIm2,width,height,nChannels,x,y,pWarpIm2+offset); 781 | BilinearInterpolate_transpose(pIm2+offset,width,height,nChannels,x,y,pWarpIm2); 782 | } 783 | } 784 | 785 | ////////////////////////////////////////////////////////////////////////////////////// 786 | // different format 787 | ////////////////////////////////////////////////////////////////////////////////////// 788 | template 789 | void ImageProcessing::warpImage(T1 *pWarpIm2,const T1 *pIm2, const T2 *flow, int width, int height, int nChannels) 790 | { 791 | memset(pWarpIm2,0,sizeof(T1)*width*height*nChannels); 792 | for(int i=0;iwidth-1 || y<0 || y>height-1) 801 | continue; 802 | BilinearInterpolate(pIm2,width,height,nChannels,x,y,pWarpIm2+offset); 803 | } 804 | } 805 | 806 | template 807 | void ImageProcessing::warpImage_transpose(T1 *pWarpIm2,const T1 *pIm2, const T2 *flow, int width, int height, int nChannels) 808 | { 809 | memset(pWarpIm2,0,sizeof(T1)*width*height*nChannels); 810 | for(int i=0;iwidth-1 || y<0 || y>height-1) 819 | continue; 820 | //BilinearInterpolate(pIm2,width,height,nChannels,x,y,pWarpIm2+offset); 821 | BilinearInterpolate_transpose(pIm2+offset,width,height,nChannels,x,y,pWarpIm2); 822 | } 823 | } 824 | 825 | 826 | template 827 | void ImageProcessing::warpImage(T1 *pWarpIm2, T3* pMask,const T1 *pIm1, const T1 *pIm2, const T2 *pVx, const T2 *pVy, int width, int height, int nChannels) 828 | { 829 | memset(pWarpIm2,0,sizeof(T1)*width*height*nChannels); 830 | for(int i=0;iwidth-1 || y<0 || y>height-1) 839 | { 840 | for(int k=0;k 857 | void ImageProcessing::cropImage(const T1 *pSrcImage, int SrcWidth, int SrcHeight, int nChannels, T2 *pDstImage, int Left, int Top, int DstWidth, int DstHeight) 858 | { 859 | if(typeid(T1)==typeid(T2)) 860 | { 861 | for(int i=0;i 881 | void ImageProcessing::generate2DGaussian(T*& pImage, int wsize, float sigma) 882 | { 883 | if(sigma==-1) 884 | sigma=wsize/2; 885 | float alpha=1/(2*sigma*sigma); 886 | int winlength=wsize*2+1; 887 | if(pImage==NULL) 888 | pImage=new T[winlength*winlength]; 889 | float total = 0; 890 | for(int i=-wsize;i<=wsize;i++) 891 | for(int j=-wsize;j<=wsize;j++) 892 | { 893 | pImage[(i+wsize)*winlength+j+wsize]=exp(-(float)(i*i+j*j)*alpha); 894 | total += pImage[(i+wsize)*winlength+j+wsize]; 895 | } 896 | for(int i = 0;i 905 | void ImageProcessing::generate1DGaussian(T*& pImage, int wsize, float sigma) 906 | { 907 | if(sigma==-1) 908 | sigma=wsize/2; 909 | float alpha=1/(2*sigma*sigma); 910 | int winlength=wsize*2+1; 911 | if(pImage==NULL) 912 | pImage=new T[winlength]; 913 | float total = 0; 914 | for(int i=-wsize;i<=wsize;i++) 915 | { 916 | pImage[i+wsize]=exp(-(float)(i*i)*alpha); 917 | total += pImage[i+wsize]; 918 | } 919 | for(int i = 0;i 7 | class ImagePyramid 8 | { 9 | private: 10 | Image* ImPyramid; 11 | int nLevels; 12 | float fRatio; 13 | public: 14 | ImagePyramid(void){ ImPyramid = NULL; }; 15 | ~ImagePyramid(void){if(ImPyramid != NULL) delete[]ImPyramid;}; 16 | inline Image& operator[](int level) { return ImPyramid[level]; }; 17 | void ConstructPyramid(const FImage& image, float ratio = 0.8, int minWidth = 30); 18 | void ConstructPyramidLevels(const FImage& image, float ratio = 0.8, int _nLevels = 2); 19 | void displayTop(const char* filename){ ImPyramid[nLevels - 1].imwrite(filename); }; 20 | inline int nlevels() const {return nLevels;}; 21 | inline float ratio() const { return fRatio; }; 22 | }; 23 | 24 | typedef ImagePyramid FImagePyramid; 25 | 26 | //--------------------------------------------------------------------------------------- 27 | // function to construct the pyramid 28 | // this is the slow way 29 | //--------------------------------------------------------------------------------------- 30 | /*void GaussianPyramid::ConstructPyramid(const DImage &image, float ratio, int minWidth) 31 | { 32 | // the ratio cannot be arbitrary numbers 33 | if(ratio>0.98 || ratio<0.4) 34 | ratio=0.75; 35 | // first decide how many levels 36 | nLevels=log((float)minWidth/image.width())/log(ratio); 37 | if(ImPyramid!=NULL) 38 | delete []ImPyramid; 39 | ImPyramid=new DImage[nLevels]; 40 | ImPyramid[0].copyData(image); 41 | float baseSigma=(1/ratio-1); 42 | for(int i=1;i 56 | void ImagePyramid::ConstructPyramid(const FImage& image, float ratio /*= 0.8*/, int minWidth /*= 30*/) 57 | { 58 | // the ratio cannot be arbitrary numbers 59 | if (ratio>0.98 || ratio<0.4) 60 | ratio = 0.75; 61 | // first decide how many levels 62 | nLevels = log((float)minWidth / image.width()) / log(ratio); 63 | fRatio = ratio; 64 | if (ImPyramid != NULL) 65 | delete[]ImPyramid; 66 | ImPyramid = new FImage[nLevels]; 67 | ImPyramid[0].copyData(image); 68 | float baseSigma = (1 / ratio - 1); 69 | int n = log(0.25) / log(ratio); 70 | float nSigma = baseSigma*n; 71 | for (int i = 1; i 90 | void ImagePyramid::ConstructPyramidLevels(const FImage& image, float ratio /*= 0.8*/, int _nLevels /*= 2*/) 91 | { 92 | // the ratio cannot be arbitrary numbers 93 | if (ratio>0.98 || ratio<0.4) 94 | ratio = 0.75; 95 | nLevels = _nLevels; 96 | fRatio = ratio; 97 | if (ImPyramid != NULL) 98 | delete[]ImPyramid; 99 | ImPyramid = new FImage[nLevels]; 100 | ImPyramid[0].copyData(image); 101 | float baseSigma = (1 / ratio - 1); 102 | int n = log(0.25) / log(ratio); 103 | float nSigma = baseSigma*n; 104 | for (int i = 1; i 7 | #include 8 | #include 9 | 10 | #include 11 | #include "opencv2/opencv.hpp" // for KITTI 12 | 13 | // read and write our simple .flo flow file format 14 | 15 | // ".flo" file format used for optical flow evaluation 16 | // 17 | // Stores 2-band float image for horizontal (u) and vertical (v) flow components. 18 | // Floats are stored in little-endian order. 19 | // A flow value is considered "unknown" if either |u| or |v| is greater than 1e9. 20 | // 21 | // bytes contents 22 | // 23 | // 0-3 tag: "PIEH" in ASCII, which in little endian happens to be the float 202021.25 24 | // (just a sanity check that floats are represented correctly) 25 | // 4-7 width as an integer 26 | // 8-11 height as an integer 27 | // 12-end data (width*height*2*4 bytes total) 28 | // the float values for u and v, interleaved, in row order, i.e., 29 | // u[row0,col0], v[row0,col0], u[row0,col1], v[row0,col1], ... 30 | // 31 | 32 | // value to use to represent unknown flow 33 | #define UNKNOWN_FLOW 1e10 34 | 35 | typedef struct 36 | { 37 | double aee; // Average Endpoint Error 38 | double aae; // Average Angular Error 39 | }FlowErr; 40 | 41 | class OpticFlowIO 42 | { 43 | public: 44 | // return whether flow vector is unknown 45 | template 46 | static bool unknown_flow(T u, T v); 47 | template 48 | static bool unknown_flow(T *f); 49 | 50 | // read a flow file into 2-band image 51 | template 52 | static int ReadFlowFile(T* U, T* V, int* w, int* h, const char* filename); 53 | 54 | // write a 2-band image into flow file 55 | template 56 | static int WriteFlowFile(T* U, T* V, int w, int h, const char* filename); 57 | 58 | // read a KITTI flow file into 2-band image 59 | template 60 | static int ReadKittiFlowFile(T* U, T* V, int* w, int* h, const char* filename); 61 | 62 | // write a 2-band image into KITTI flow file 63 | template 64 | static int WriteKittiFlowFile(T* U, T* V, int w, int h, const char* filename); 65 | 66 | // render the motion to a 4-band BGRA color image 67 | template 68 | static double MotionToColor(unsigned char* fillPix, T* U, T* V, int w, int h, float range = -1); 69 | 70 | template 71 | static float ShowFlow(const char* winname, T* U, T* V, int w, int h, float range = -1, int waittime = 1); 72 | template 73 | static void SaveFlowAsImage(const char* imgName, T* U, T* V, int w, int h, float range = -1); 74 | static void SaveFlowMatrixAsImage(const char* imgName, cv::Mat2f flowMat); 75 | 76 | static void Match2Flow(FImage& inMat, FImage& ou, FImage& ov, int w, int h); 77 | static void FlowMatrix2Flow(cv::Mat2f inMat, FImage& ou, FImage& ov); 78 | 79 | template 80 | static float ErrorImage(unsigned char* fillPix, T* u1, T* v1, T* u2, T* v2, int w, int h); 81 | template 82 | static float ErrorImage(unsigned char* fillPix, T* u1, T* v1, char* gtName, int w, int h); 83 | template 84 | static float ShowErrorImage(const char* winname, T* U, T* V, char* gtName, int w, int h, int waittime = 1); 85 | template 86 | static float SaveErrorImage(const char* imgName, T* U, T* V, char* gtName, int w, int h); 87 | 88 | template 89 | static FlowErr CalcFlowError(T1* u1, T1* v1, T2* u2, T2*v2, int w, int h); 90 | 91 | private: 92 | // first four bytes, should be the same in little endian 93 | #define TAG_FLOAT 202021.25 // check for this when READING the file 94 | #define TAG_STRING "PIEH" // use this when WRITING the file 95 | 96 | #define M_PI 3.14159265358979323846 97 | 98 | // the "official" threshold - if the absolute value of either 99 | // flow component is greater, it's considered unknown 100 | #define UNKNOWN_FLOW_THRESH 1e9 101 | 102 | #define NUM_BANDS 2 103 | 104 | // Color encoding of flow vectors 105 | // adapted from the color circle idea described at 106 | // http://members.shaw.ca/quadibloc/other/colint.htm 107 | // 108 | // Daniel Scharstein, 4/2007 109 | // added tick marks and out-of-range coding 6/05/07 110 | 111 | #define MAXWHEELCOLS 60 112 | template 113 | static void setcols(T* colorwheel, int r, int g, int b, int k); 114 | template 115 | static int makecolorwheel(T* colorwheel); 116 | template 117 | static void computeColor(double fx, double fy, unsigned char *pix, T* colorwheel, int ncols); 118 | }; 119 | 120 | template 121 | int OpticFlowIO::ReadKittiFlowFile(T* U, T* V, int* w, int* h, const char* filename) 122 | { 123 | if (filename == NULL){ 124 | printf("ReadKittiFlowFile: empty filename\n"); 125 | return -1; 126 | } 127 | 128 | const char *dot = strrchr(filename, '.'); 129 | if (strcmp(dot, ".png") != 0){ 130 | printf("ReadKittiFlowFile (%s): extension .png expected\n", filename); 131 | return -1; 132 | } 133 | 134 | IplImage* img = cvLoadImage(filename, CV_LOAD_IMAGE_COLOR | CV_LOAD_IMAGE_ANYDEPTH); 135 | if (img == NULL){ 136 | printf("ReadKittiFlowFile: could not open %s\n", filename); 137 | return -1; 138 | } 139 | 140 | int width = img->width; 141 | int height = img->height; 142 | for(int i=0; iimageData + i*img->widthStep); 145 | uint16_t validFlag = rowImgData[j*img->nChannels]; 146 | if(validFlag > 0){ 147 | U[i*width+j] = (rowImgData[j*img->nChannels + 2] - 32768.0f)/64.0f; 148 | V[i*width+j] = (rowImgData[j*img->nChannels + 1] - 32768.0f)/64.0f; 149 | }else{ 150 | U[i*width+j] = UNKNOWN_FLOW; 151 | V[i*width+j] = UNKNOWN_FLOW; 152 | } 153 | } 154 | } 155 | 156 | *w = width; 157 | *h = height; 158 | cvReleaseImage(&img); 159 | return 0; 160 | } 161 | 162 | template 163 | int OpticFlowIO::WriteKittiFlowFile(T* U, T* V, int w, int h, const char* filename) 164 | { 165 | if (filename == NULL){ 166 | printf("WriteKittiFlowFile: empty filename\n"); 167 | return -1; 168 | } 169 | 170 | const char *dot = strrchr(filename, '.'); 171 | if (dot == NULL){ 172 | printf("WriteKittiFlowFile: extension required in filename '%s'\n", filename); 173 | return -1; 174 | } 175 | 176 | if (strcmp(dot, ".png") != 0){ 177 | printf("WriteKittiFlowFile: filename '%s' should have extension '.png'\n", filename); 178 | return -1; 179 | } 180 | 181 | int width = w, height = h; 182 | 183 | IplImage* img = cvCreateImage(cvSize(w,h), IPL_DEPTH_16U, 3); 184 | for(int i=0; iimageData + i*img->widthStep); 190 | if(!unknown_flow(u,v)){ 191 | rowImgData[j*img->nChannels + 2] = __max(__min(U[i*width+j]*64.0f+32768.0f, 65535), 0); 192 | rowImgData[j*img->nChannels + 1] = __max(__min(V[i*width+j]*64.0f+32768.0f, 65535), 0); 193 | rowImgData[j*img->nChannels] = 1; 194 | }else{ 195 | rowImgData[j*img->nChannels + 2] = 0; 196 | rowImgData[j*img->nChannels + 1] = 0; 197 | rowImgData[j*img->nChannels] = 0; 198 | } 199 | } 200 | } 201 | 202 | const int params[2]={CV_IMWRITE_PNG_COMPRESSION, 1}; 203 | cvSaveImage(filename, img, params); // slight lossy PNG 204 | cvReleaseImage(&img); 205 | return 0; 206 | } 207 | 208 | template 209 | bool OpticFlowIO::unknown_flow(T u, T v) 210 | { 211 | return (abs(u) > UNKNOWN_FLOW_THRESH) 212 | || (abs(v) > UNKNOWN_FLOW_THRESH) 213 | || u != u || v != v; // isnan() 214 | } 215 | 216 | template 217 | bool OpticFlowIO::unknown_flow(T *f) 218 | { 219 | return unknown_flow(f[0], f[1]); 220 | } 221 | 222 | template 223 | int OpticFlowIO::ReadFlowFile(T* U, T* V, int* w, int* h, const char* filename) 224 | { 225 | if (filename == NULL){ 226 | printf("ReadFlowFile: empty filename\n"); 227 | return -1; 228 | } 229 | 230 | const char *dot = strrchr(filename, '.'); 231 | if (strcmp(dot, ".flo") != 0){ 232 | printf("ReadFlowFile (%s): extension .flo expected\n", filename); 233 | return -1; 234 | } 235 | 236 | FILE *stream = fopen(filename, "rb"); 237 | if (stream == 0){ 238 | printf("ReadFlowFile: could not open %s\n", filename); 239 | return -1; 240 | } 241 | 242 | int width, height; 243 | float tag; 244 | 245 | if ((int)fread(&tag, sizeof(float), 1, stream) != 1 246 | ||(int)fread(&width, sizeof(int), 1, stream) != 1 247 | ||(int)fread(&height, sizeof(int), 1, stream) != 1) 248 | { 249 | printf("ReadFlowFile: problem reading file %s\n", filename); 250 | return -1; 251 | } 252 | 253 | if (tag != TAG_FLOAT) // simple test for correct endian-ness 254 | { 255 | printf("ReadFlowFile(%s): wrong tag (possibly due to big-endian machine?)\n", filename); 256 | return -1; 257 | } 258 | 259 | // another sanity check to see that integers were read correctly (99999 should do the trick...) 260 | if (width < 1 || width > 99999){ 261 | printf("ReadFlowFile(%s): illegal width %d\n", filename, width); 262 | return -1; 263 | } 264 | 265 | if (height < 1 || height > 99999){ 266 | printf("ReadFlowFile(%s): illegal height %d\n", filename, height); 267 | return -1; 268 | } 269 | 270 | for(int i=0; i 295 | int OpticFlowIO::WriteFlowFile(T* U, T* V, int w, int h, const char* filename) 296 | { 297 | if (filename == NULL){ 298 | printf("WriteFlowFile: empty filename\n"); 299 | return -1; 300 | } 301 | 302 | const char *dot = strrchr(filename, '.'); 303 | if (dot == NULL){ 304 | printf("WriteFlowFile: extension required in filename '%s'\n", filename); 305 | return -1; 306 | } 307 | 308 | if (strcmp(dot, ".flo") != 0){ 309 | printf("WriteFlowFile: filename '%s' should have extension '.flo'\n", filename); 310 | return -1; 311 | } 312 | 313 | int width = w, height = h; 314 | 315 | FILE *stream = fopen(filename, "wb"); 316 | if (stream == 0){ 317 | printf("WriteFlowFile: could not open %s\n", filename); 318 | return -1; 319 | } 320 | 321 | // write the header 322 | fprintf(stream, TAG_STRING); 323 | if ((int)fwrite(&width, sizeof(int), 1, stream) != 1 324 | ||(int)fwrite(&height, sizeof(int), 1, stream) != 1) 325 | { 326 | printf("WriteFlowFile(%s): problem writing header\n", filename); 327 | return -1; 328 | } 329 | 330 | // write the rows 331 | for(int i=0; i 348 | double OpticFlowIO::MotionToColor(unsigned char* fillPix, T* U, T* V, int w, int h, float range /*= -1*/) 349 | { 350 | // determine motion range: 351 | double maxrad; 352 | 353 | if (range > 0) { 354 | maxrad = range; 355 | }else{ // obtain the motion range according to the max flow 356 | double maxu = -999, maxv = -999; 357 | double minu = 999, minv = 999; 358 | maxrad = -1; 359 | for (int i = 0; i < h; i++){ 360 | for (int j = 0; j < w; j++){ 361 | double u = U[i*w + j]; 362 | double v = V[i*w + j]; 363 | if (unknown_flow(u, v)) 364 | continue; 365 | maxu = __max(maxu, u); 366 | maxv = __max(maxv, v); 367 | minu = __min(minu, u); 368 | minv = __min(minv, v); 369 | double rad = sqrt(u * u + v * v); 370 | maxrad = __max(maxrad, rad); 371 | } 372 | } 373 | if (maxrad == 0) // if flow == 0 everywhere 374 | maxrad = 1; 375 | } 376 | 377 | //printf("max motion: %.2f motion range: u = [%.2f,%.2f]; v = [%.2f,%.2f]\n", 378 | // maxrad, minu, maxu, minv, maxv); 379 | 380 | int colorwheel[MAXWHEELCOLS*3]; 381 | int ncols = makecolorwheel(colorwheel); 382 | 383 | for(int i=0; i 403 | float OpticFlowIO::ShowFlow(const char* winname, T* U, T* V, int w, int h, 404 | float range /*= -1*/, int waittime /*= 1*/) 405 | { 406 | cv::Mat img(h, w, CV_8UC4); 407 | float maxFlow = OpticFlowIO::MotionToColor(img.data, U, V, w, h, range); 408 | 409 | #if 0 410 | // get corner color 411 | int x = 10, y = 20; 412 | unsigned char color[4]; 413 | unsigned char* pSrc = img.data + y*img.step + x * 4; 414 | color[0] = 255 - pSrc[0]; 415 | color[1] = 255 - pSrc[1]; 416 | color[2] = 255 - pSrc[2]; 417 | char info[256]; 418 | sprintf(info, "max: %.1f", maxFlow); 419 | cv::putText(img, info, cvPoint(x, y), CV_FONT_HERSHEY_SIMPLEX, 0.5, cvScalar(color[0], color[1], color[2])); 420 | #endif 421 | 422 | cv::imshow(winname, img); 423 | cv::waitKey(waittime); 424 | 425 | return maxFlow; 426 | } 427 | 428 | template 429 | void OpticFlowIO::SaveFlowAsImage(const char* imgName, T* U, T* V, int w, int h, float range /*= -1*/) 430 | { 431 | cv::Mat img(h, w, CV_8UC4); 432 | float maxFlow = OpticFlowIO::MotionToColor(img.data, U, V, w, h, range); 433 | 434 | #if 1 435 | // get corner color 436 | int x = 10, y = 20; 437 | unsigned char color[3]; 438 | unsigned char* pSrc = img.data + y*img.step + x * 4; 439 | color[0] = 255 - pSrc[0]; 440 | color[1] = 255 - pSrc[1]; 441 | color[2] = 255 - pSrc[2]; 442 | char info[256]; 443 | sprintf(info, "max: %.1f", maxFlow); 444 | cv::putText(img, info, cvPoint(x, y), CV_FONT_HERSHEY_SIMPLEX, 0.5, cvScalar(color[0], color[1], color[2])); 445 | #endif 446 | 447 | cv::imwrite(imgName, img); 448 | } 449 | 450 | inline void OpticFlowIO::SaveFlowMatrixAsImage(const char* imgName, cv::Mat2f flowMat) 451 | { 452 | int rows = flowMat.rows; int cols = flowMat.cols; 453 | FImage tmp_u2 = FImage(cols, rows, 1); 454 | FImage tmp_v2 = FImage(cols, rows, 1); 455 | OpticFlowIO::FlowMatrix2Flow(flowMat, tmp_u2, tmp_v2); 456 | OpticFlowIO::SaveFlowAsImage(imgName, tmp_u2.pData, tmp_v2.pData, cols, rows); 457 | } 458 | 459 | // draw each match as a 3x3 color block 460 | inline void OpticFlowIO::Match2Flow(FImage& inMat, FImage& ou, FImage& ov, int w, int h) 461 | { 462 | if (!ou.matchDimension(w, h, 1)){ 463 | ou.allocate(w, h, 1); 464 | } 465 | if (!ov.matchDimension(w, h, 1)){ 466 | ov.allocate(w, h, 1); 467 | } 468 | ou.setValue(UNKNOWN_FLOW); 469 | ov.setValue(UNKNOWN_FLOW); 470 | int cnt = inMat.height(); 471 | for (int i = 0; i < cnt; i++){ 472 | float* p = inMat.rowPtr(i); 473 | float x = p[0]; 474 | float y = p[1]; 475 | float u = p[2] - p[0]; //x component of flow velocity 476 | float v = p[3] - p[1]; //y component of flow velocity 477 | for (int di = -1; di <= 1; di++){ 478 | for (int dj = -1; dj <= 1; dj++){ 479 | int tx = ImageProcessing::EnforceRange(x + dj, w); 480 | int ty = ImageProcessing::EnforceRange(y + di, h); 481 | ou[ty*w + tx] = u; 482 | ov[ty*w + tx] = v; 483 | } 484 | } 485 | } 486 | } 487 | 488 | 489 | // draw each match from a dense flow matrix inMat to a 1x1 color block 490 | inline void OpticFlowIO::FlowMatrix2Flow(cv::Mat2f inMat, FImage& ou, FImage& ov) 491 | { 492 | int rows = inMat.rows; 493 | int cols = inMat.cols; 494 | if (!ou.matchDimension(cols, rows, 1)){ 495 | ou.allocate(cols, rows, 1); 496 | } 497 | if (!ov.matchDimension(cols, rows, 1)){ 498 | ov.allocate(cols, rows, 1); 499 | } 500 | for (int j = 0; j < rows; j++){ 501 | for(int i = 0; i < cols; i++){ 502 | float u = inMat.at(j,i)[0]; 503 | float v = inMat.at(j,i)[1]; 504 | ou[j*cols + i] = u; 505 | ov[j*cols + i] = v; 506 | } 507 | } 508 | } 509 | 510 | template 511 | float OpticFlowIO::ErrorImage(unsigned char* fillPix, T* u1, T* v1, T* u2, T* v2, int w, int h) 512 | { 513 | unsigned char pix[4]; 514 | 515 | //#define LOG_COLOR 516 | #ifdef LOG_COLOR 517 | float LC[10][5] = 518 | { { 0, 0.0625, 49, 54, 149 }, 519 | { 0.0625, 0.125, 69, 117, 180 }, 520 | { 0.125, 0.25, 116, 173, 209 }, 521 | { 0.25, 0.5, 171, 217, 233 }, 522 | { 0.5, 1, 224, 243, 248 }, 523 | { 1, 2, 254, 224, 144 }, 524 | { 2, 4, 253, 174, 97 }, 525 | { 4, 8, 244, 109, 67 }, 526 | { 8, 16, 215, 48, 39 }, 527 | { 16, 1000000000.0, 165, 0, 38 } }; 528 | #endif 529 | 530 | int totalCnt = 0; 531 | int validCnt = 0; 532 | for (int i = 0; i < h; i++){ 533 | for (int j = 0; j < w; j++){ 534 | int idx = i*w + j; 535 | 536 | if (unknown_flow(u1[idx], v1[idx]) || unknown_flow(u2[idx], v2[idx])){ 537 | // red: occlusion 538 | pix[0] = 0; pix[1] = 0; pix[2] = 255; 539 | pix[2] = 0; // TODO 540 | pix[3] = 0xFF; // only for alignment 541 | memcpy(fillPix + idx * 4, pix, 4); 542 | continue; 543 | } 544 | 545 | float endPtErr = sqrt(pow(u1[idx] - u2[idx], 2) + pow(v1[idx] - v2[idx], 2)); 546 | 547 | #ifdef LOG_COLOR 548 | float f_err = endPtErr; 549 | float f_mag = sqrt(u2[idx] * u2[idx] + v2[idx] * v2[idx]); 550 | float n_err = std::min(f_err / 3.0, 20.0*f_err / f_mag); 551 | for (int i = 0; i < 10; i++) { 552 | if (n_err >= LC[i][0] && n_err < LC[i][1]) { 553 | pix[3] = 0xFF; // only for alignment 554 | pix[2] = (uint8_t)LC[i][2]; 555 | pix[1] = (uint8_t)LC[i][3]; 556 | pix[0] = (uint8_t)LC[i][4]; 557 | } 558 | } 559 | if (unknown_flow(u1[idx], v1[idx]) || unknown_flow(u2[idx], v2[idx])) { 560 | pix[2] *= 0.5; 561 | pix[1] *= 0.5; 562 | pix[0] *= 0.5; 563 | } 564 | #else 565 | float v = __min(endPtErr, 5.0) / 5.0; 566 | //float v = __min(endPtErr, 3.0) / 3.0; 567 | pix[0] = v * 255; pix[1] = v * 255; pix[2] = v * 255; 568 | pix[3] = 0xFF; // only for alignment 569 | 570 | #if 1 571 | if (endPtErr > 3.0){ // red 572 | pix[0] = pix[1] = 0; 573 | pix[2] = 255; 574 | } 575 | #endif 576 | #endif 577 | if (endPtErr < 3.0){ 578 | validCnt++; 579 | } 580 | memcpy(fillPix + idx * 4, pix, 4); 581 | totalCnt++; 582 | } 583 | } 584 | return 1. - (float)validCnt / totalCnt; 585 | } 586 | 587 | template 588 | float OpticFlowIO::ErrorImage(unsigned char* fillPix, T* u1, T* v1, char* gtName, int w, int h) 589 | { 590 | int gtw, gth; 591 | T* u2 = new T[w*h]; 592 | T* v2 = new T[w*h]; 593 | ReadFlowFile(u2, v2, >w, >h, gtName); 594 | assert(w == gtw&&h == gth); 595 | 596 | float r = ErrorImage(fillPix, u1, v1, u2, v2, w, h); 597 | delete[] u2; 598 | delete[] v2; 599 | return r; 600 | } 601 | 602 | template 603 | float OpticFlowIO::ShowErrorImage(const char* winname, T* U, T* V, char* gtName, int w, int h, int waittime /*= 1*/) 604 | { 605 | cv::Mat img(h, w, CV_8UC4); 606 | float r = OpticFlowIO::ErrorImage(img.data, U, V, gtName, w, h); 607 | 608 | cv::imshow(winname, img); 609 | cv::waitKey(waittime); 610 | 611 | return r; 612 | } 613 | 614 | template 615 | float OpticFlowIO::SaveErrorImage(const char* imgName, T* U, T* V, char* gtName, int w, int h) 616 | { 617 | cv::Mat img(h, w, CV_8UC4); 618 | float r = OpticFlowIO::ErrorImage(img.data, U, V, gtName, w, h); 619 | 620 | cv::imwrite(imgName, img); 621 | return r; 622 | } 623 | 624 | template 625 | FlowErr OpticFlowIO::CalcFlowError(T1* u1, T1* v1, T2* u2, T2*v2, int w, int h) 626 | { 627 | FlowErr stat; 628 | memset(&stat, 0, sizeof(stat)); 629 | 630 | double endPtErr = 0; 631 | double angErr = 0; 632 | int n = 0; 633 | for(int i=0; i 1.0) tmp = 1.0; 646 | 647 | angErr += acos(tmp); 648 | n++; 649 | } 650 | } 651 | 652 | stat.aae = (angErr/n) * 180/M_PI; 653 | stat.aee = endPtErr/n; 654 | 655 | return stat; 656 | } 657 | 658 | template 659 | void OpticFlowIO::setcols(T* colorwheel, int r, int g, int b, int k) 660 | { 661 | colorwheel[k*3+0] = r; 662 | colorwheel[k*3+1] = g; 663 | colorwheel[k*3+2] = b; 664 | } 665 | 666 | template 667 | int OpticFlowIO::makecolorwheel(T* colorwheel) 668 | { 669 | // relative lengths of color transitions: 670 | // these are chosen based on perceptual similarity 671 | // (e.g. one can distinguish more shades between red and yellow 672 | // than between yellow and green) 673 | int RY = 15; 674 | int YG = 6; 675 | int GC = 4; 676 | int CB = 11; 677 | int BM = 13; 678 | int MR = 6; 679 | int ncols = RY + YG + GC + CB + BM + MR; 680 | //printf("ncols = %d\n", ncols); 681 | if (ncols > MAXWHEELCOLS){ 682 | printf("Too Many Columns in ColorWheel!\n"); 683 | //exit(1); 684 | } 685 | int i; 686 | int k = 0; 687 | for (i = 0; i < RY; i++) setcols(colorwheel, 255, 255*i/RY, 0, k++); 688 | for (i = 0; i < YG; i++) setcols(colorwheel, 255-255*i/YG, 255, 0, k++); 689 | for (i = 0; i < GC; i++) setcols(colorwheel, 0, 255, 255*i/GC, k++); 690 | for (i = 0; i < CB; i++) setcols(colorwheel, 0, 255-255*i/CB, 255, k++); 691 | for (i = 0; i < BM; i++) setcols(colorwheel, 255*i/BM, 0, 255, k++); 692 | for (i = 0; i < MR; i++) setcols(colorwheel, 255, 0, 255-255*i/MR, k++); 693 | 694 | return ncols; 695 | } 696 | 697 | template 698 | void OpticFlowIO::computeColor(double fx, double fy, unsigned char *pix, T* colorwheel, int ncols) 699 | { 700 | double rad = sqrt(fx * fx + fy * fy); 701 | double a = atan2(-fy, -fx) / M_PI; 702 | double fk = (a + 1.0) / 2.0 * (ncols-1); 703 | int k0 = (int)fk; 704 | int k1 = (k0 + 1) % ncols; 705 | double f = fk - k0; 706 | //f = 0; // uncomment to see original color wheel 707 | for (int b = 0; b < 3; b++) { 708 | double col0 = colorwheel[k0*3+b] / 255.0; 709 | double col1 = colorwheel[k1*3+b] / 255.0; 710 | double col = (1 - f) * col0 + f * col1; 711 | if (rad <= 1) 712 | col = 1 - rad * (1 - col); // increase saturation with radius 713 | else 714 | col *= .75; // out of range 715 | pix[2 - b] = (int)(255.0 * col); 716 | } 717 | pix[3] = 0xff; // alpha channel, only for alignment 718 | } 719 | 720 | #endif //_OpticFlowIO_H -------------------------------------------------------------------------------- /include/CPM_include/Stochastic.h: -------------------------------------------------------------------------------- 1 | #ifndef STOCHASTIC_H 2 | #define STOCHASTIC_H 3 | 4 | #include "math.h" 5 | #include "stdlib.h" 6 | #include "project.h" 7 | #include "memory.h" 8 | 9 | #define _Release_2DArray(X,i,length) for(i=0;i 12 | T _abs(T x) 13 | { 14 | return x >= 0 ? x:-x; 15 | } 16 | 17 | #ifndef PI 18 | #define PI 3.1415927 19 | #endif 20 | 21 | enum SortType{SortAscending,SortDescending}; 22 | 23 | class CStochastic 24 | { 25 | public: 26 | CStochastic(void); 27 | ~CStochastic(void); 28 | static void ConvertInt2String(int x,char* string,int BitNumber=3); 29 | static double UniformSampling(); 30 | static int UniformSampling(int R); 31 | static double GaussianSampling(); 32 | template static void GetMeanVar(T* signal,int length,double* mean,double* var); 33 | static int Sampling(double* Density,int NumSamples); 34 | static double GetMean(double *signal,int length); 35 | static void Generate1DGaussian(double* pGaussian,int size,double sigma=0); 36 | static void Generate2DGaussian(double* pGaussian,int size,double sigma=0); 37 | static double entropy(double* pDensity,int n); 38 | 39 | template static T sum(int NumData,T* pData); 40 | template static void Normalize(int NumData,T* pData); 41 | template static T mean(int NumData, T* pData); 42 | template static void sort(int number, T* pData,int *pIndex,SortType m_SortType=SortDescending); 43 | template static T Min(int NumData, T* pData); 44 | template static T Min(int NumData, T* pData1,T* pData2); 45 | template static T Max(int NumData ,T* pData); 46 | template static int FindMax(int NumData,T* pData); 47 | template static void ComputeVectorMean(int Dim,int NumData,T1* pData,T2* pMean,double* pWeight=NULL); 48 | template static void ComputeMeanCovariance(int Dim,int NumData,T1* pData,T2* pMean,T2* pCovarance,double* pWeight=NULL); 49 | template static double VectorSquareDistance(int Dim,T1* pVector1,T2* pVector2); 50 | template static void KMeanClustering(int Dim,int NumData,int NumClusters,T1* pData,int *pPartition,double** pClusterMean=NULL,int MaxIterationNum=10,int MinClusterSampleNumber=2); 51 | template static double norm(T* X,int Dim); 52 | template static int FindClosestPoint(T1* pPointSet,int NumPoints,int nDim,T2* QueryPoint); 53 | template static void GaussianFiltering(T1* pSrcArray,T2* pDstArray,int NumPoints,int nChannels,int size,double sigma); 54 | }; 55 | 56 | template 57 | void CStochastic::GetMeanVar(T* signal,int length,double* mean,double* var) 58 | { 59 | double m_mean=0,m_var=0; 60 | 61 | int i; 62 | for (i=0;i 73 | T CStochastic::sum(int NumData, T* pData) 74 | { 75 | T sum=0; 76 | int i; 77 | for(i=0;i 83 | void CStochastic::Normalize(int NumData,T* pData) 84 | { 85 | int i; 86 | T Sum; 87 | Sum=sum(NumData,pData); 88 | for(i=0;i 93 | T CStochastic::mean(int NumData,T* pData) 94 | { 95 | return sum(NumData,pData)/NumData; 96 | } 97 | 98 | //////////////////////////////////////////////////////////// 99 | // sort data in descending order 100 | template 101 | void CStochastic::sort(int Number,T* pData,int *pIndex,SortType m_SortType) 102 | { 103 | int i,j,offset_extreme,*flag; 104 | double extreme; 105 | flag=new int[Number]; 106 | memset(flag,0,sizeof(int)*Number); 107 | for(i=0;ipData[j])) 119 | { 120 | extreme=pData[j]; 121 | offset_extreme=j; 122 | } 123 | } 124 | pIndex[i]=offset_extreme; 125 | flag[offset_extreme]=1; 126 | } 127 | delete flag; 128 | } 129 | 130 | template 131 | T CStochastic::Min(int NumData,T* pData) 132 | { 133 | int i; 134 | T result=pData[0]; 135 | for(i=1;i 141 | T CStochastic::Min(int NumData,T* pData1,T* pData2) 142 | { 143 | int i; 144 | T result=pData1[0]+pData2[0]; 145 | for(i=1;i 151 | T CStochastic::Max(int NumData,T* pData) 152 | { 153 | int i; 154 | T result=pData[0]; 155 | for(i=1;i 161 | int CStochastic::FindMax(int NumData,T* pData) 162 | { 163 | int i,index; 164 | T result=pData[0]; 165 | index=0; 166 | for(i=1;iresult) 168 | { 169 | index=i; 170 | result=pData[i]; 171 | } 172 | return index; 173 | } 174 | 175 | 176 | template 177 | void CStochastic::ComputeMeanCovariance(int Dim,int NumData,T1* pData,T2* pMean,T2* pCovariance,double* pWeight) 178 | { 179 | int i,j,k; 180 | memset(pMean,0,sizeof(T2)*Dim); 181 | memset(pCovariance,0,sizeof(T2)*Dim*Dim); 182 | 183 | bool IsWeightLoaded=false; 184 | double Sum; 185 | if(pWeight!=NULL) 186 | IsWeightLoaded=true; 187 | 188 | // compute mean first 189 | Sum=0; 190 | if(IsWeightLoaded) 191 | for(i=0;i 241 | void CStochastic::ComputeVectorMean(int Dim,int NumData,T1* pData,T2* pMean,double* pWeight) 242 | { 243 | int i,j; 244 | memset(pMean,0,sizeof(T2)*Dim); 245 | bool IsWeightLoaded; 246 | double Sum; 247 | if(pWeight=NULL) 248 | IsWeightLoaded=false; 249 | else 250 | IsWeightLoaded=true; 251 | 252 | Sum=0; 253 | if(IsWeightLoaded) 254 | for(i=0;i 274 | double CStochastic::VectorSquareDistance(int Dim,T1* pVector1,T2* pVector2) 275 | { 276 | double result=0,temp; 277 | int i; 278 | for(i=0;i 287 | void CStochastic::KMeanClustering(int Dim,int NumData,int NumClusters,T1* pData,int *pPartition,double** pClusterMean,int MaxIterationNum, int MinClusterSampleNumber) 288 | { 289 | int i,j,k,l,Index,ClusterSampleNumber; 290 | double MinDistance,Distance; 291 | double** pCenters; 292 | pCenters=new double*[NumClusters]; 293 | for(i=0;i 354 | double CStochastic::norm(T* X,int Dim) 355 | { 356 | double result=0; 357 | int i; 358 | for(i=0;i 365 | int CStochastic::FindClosestPoint(T1* pPointSet,int NumPoints,int nDim,T2* QueryPoint) 366 | { 367 | int i,j,Index=0,offset; 368 | T1 MinDistance,Distance,x; 369 | MinDistance=0; 370 | for(j=0;j 391 | void CStochastic::GaussianFiltering(T1* pSrcArray,T2* pDstArray,int NumPoints,int nChannels,int size,double sigma) 392 | { 393 | int i,j,u,l; 394 | double *pGaussian,temp; 395 | pGaussian=new double[2*size+1]; 396 | Generate1DGaussian(pGaussian,size,sigma); 397 | for(i=0;i 5 | 6 | /************************************************************************/ 7 | /* CTimer */ 8 | /************************************************************************/ 9 | #ifdef WIN32 10 | #include 11 | #else 12 | #include 13 | #endif 14 | 15 | template 16 | class _CTimer 17 | { 18 | public: 19 | _CTimer(); 20 | ~_CTimer(){}; 21 | 22 | void tic(); // time in clock 23 | double toc(const char* msg = NULL); // time out clock 24 | private: 25 | T inT, f; 26 | }; 27 | 28 | template 29 | _CTimer::_CTimer() 30 | { 31 | #ifdef WIN32 32 | QueryPerformanceFrequency(&f); 33 | #endif 34 | tic(); 35 | } 36 | 37 | #ifdef WIN32 38 | typedef _CTimer CTimer; // only CTimer makes sense 39 | #else 40 | typedef _CTimer CTimer; 41 | #endif 42 | 43 | template 44 | void _CTimer::tic() 45 | { 46 | #ifdef WIN32 47 | QueryPerformanceCounter(&inT); 48 | #else 49 | gettimeofday(&inT,NULL); 50 | #endif 51 | } 52 | 53 | template 54 | double _CTimer::toc(const char* msg) 55 | { 56 | #ifdef WIN32 57 | LARGE_INTEGER outT; 58 | QueryPerformanceCounter(&outT); 59 | 60 | double dt = (double)(outT.QuadPart-inT.QuadPart)/f.QuadPart; 61 | #else 62 | struct timeval outT; 63 | gettimeofday(&outT,NULL); 64 | double dt = 1000000 * (outT.tv_sec - inT.tv_sec) + outT.tv_usec - inT.tv_usec; 65 | dt /= 1000000; 66 | #endif 67 | if(msg){ 68 | printf("%s %f [s]\n", msg, dt); 69 | } 70 | 71 | tic(); 72 | return dt; 73 | } 74 | 75 | /************************************************************************/ 76 | /* Gray2ColorTable */ 77 | /************************************************************************/ 78 | template 79 | class _CColorTable 80 | { 81 | public: 82 | _CColorTable(); 83 | ~_CColorTable(){}; 84 | 85 | // function to access the member variables 86 | inline T* operator [] (int index) { return m_colorTbl[index]; }; 87 | 88 | private: 89 | T m_colorTbl[256][3]; 90 | }; 91 | 92 | typedef _CColorTable CColorTable; 93 | 94 | template 95 | _CColorTable::_CColorTable() 96 | { 97 | // BGR table 98 | static unsigned char gray2ColorTb[256][3] = { 99 | {143, 0, 0},{147, 0, 0},{151, 0, 0},{155, 0, 0},{159, 0, 0},{163, 0, 0},{167, 0, 0},{171, 0, 0},{175, 0, 0},{179, 0, 0},{183, 0, 0},{187, 0, 0},{191, 0, 0},{195, 0, 0},{199, 0, 0},{203, 0, 0},{206, 0, 0},{210, 0, 0},{214, 0, 0},{218, 0, 0},{222, 0, 0},{226, 0, 0},{230, 0, 0},{234, 0, 0},{238, 0, 0},{242, 0, 0},{246, 0, 0},{250, 0, 0},{254, 0, 0},{255, 3, 0},{255, 7, 0},{255, 11, 0}, 100 | {255, 14, 0},{255, 18, 0},{255, 22, 0},{255, 26, 0},{255, 30, 0},{255, 34, 0},{255, 38, 0},{255, 42, 0},{255, 46, 0},{255, 50, 0},{255, 54, 0},{255, 58, 0},{255, 62, 0},{255, 66, 0},{255, 70, 0},{255, 74, 0},{255, 77, 0},{255, 81, 0},{255, 85, 0},{255, 89, 0},{255, 93, 0},{255, 97, 0},{255,101, 0},{255,105, 0},{255,109, 0},{255,113, 0},{255,117, 0},{255,121, 0},{255,125, 0},{255,129, 0},{255,133, 0},{255,137, 0}, 101 | {255,140, 0},{255,144, 0},{255,148, 0},{255,152, 0},{255,156, 0},{255,160, 0},{255,164, 0},{255,168, 0},{255,172, 0},{255,176, 0},{255,180, 0},{255,184, 0},{255,188, 0},{255,192, 0},{255,196, 0},{255,200, 0},{255,203, 0},{255,207, 0},{255,211, 0},{255,215, 0},{255,219, 0},{255,223, 0},{255,227, 0},{255,231, 0},{255,235, 0},{255,239, 0},{255,243, 0},{255,247, 0},{255,251, 0},{255,255, 0},{251,255, 4},{247,255, 8}, 102 | {244,255, 11},{240,255, 15},{236,255, 19},{232,255, 23},{228,255, 27},{224,255, 31},{220,255, 35},{216,255, 39},{212,255, 43},{208,255, 47},{204,255, 51},{200,255, 55},{196,255, 59},{192,255, 63},{188,255, 67},{184,255, 71},{181,255, 74},{177,255, 78},{173,255, 82},{169,255, 86},{165,255, 90},{161,255, 94},{157,255, 98},{153,255,102},{149,255,106},{145,255,110},{141,255,114},{137,255,118},{133,255,122},{129,255,126},{125,255,130},{122,255,133}, 103 | {118,255,137},{114,255,141},{110,255,145},{106,255,149},{102,255,153},{ 98,255,157},{ 94,255,161},{ 90,255,165},{ 86,255,169},{ 82,255,173},{ 78,255,177},{ 74,255,181},{ 70,255,185},{ 66,255,189},{ 62,255,193},{ 59,255,196},{ 55,255,200},{ 51,255,204},{ 47,255,208},{ 43,255,212},{ 39,255,216},{ 35,255,220},{ 31,255,224},{ 27,255,228},{ 23,255,232},{ 19,255,236},{ 15,255,240},{ 11,255,244},{ 7,255,248},{ 3,255,252},{ 0,254,255},{ 0,251,255}, 104 | { 0,247,255},{ 0,243,255},{ 0,239,255},{ 0,235,255},{ 0,231,255},{ 0,227,255},{ 0,223,255},{ 0,219,255},{ 0,215,255},{ 0,211,255},{ 0,207,255},{ 0,203,255},{ 0,199,255},{ 0,195,255},{ 0,191,255},{ 0,188,255},{ 0,184,255},{ 0,180,255},{ 0,176,255},{ 0,172,255},{ 0,168,255},{ 0,164,255},{ 0,160,255},{ 0,156,255},{ 0,152,255},{ 0,148,255},{ 0,144,255},{ 0,140,255},{ 0,136,255},{ 0,132,255},{ 0,128,255},{ 0,125,255}, 105 | { 0,121,255},{ 0,117,255},{ 0,113,255},{ 0,109,255},{ 0,105,255},{ 0,101,255},{ 0, 97,255},{ 0, 93,255},{ 0, 89,255},{ 0, 85,255},{ 0, 81,255},{ 0, 77,255},{ 0, 73,255},{ 0, 69,255},{ 0, 65,255},{ 0, 62,255},{ 0, 58,255},{ 0, 54,255},{ 0, 50,255},{ 0, 46,255},{ 0, 42,255},{ 0, 38,255},{ 0, 34,255},{ 0, 30,255},{ 0, 26,255},{ 0, 22,255},{ 0, 18,255},{ 0, 14,255},{ 0, 10,255},{ 0, 6,255},{ 0, 2,255},{ 0, 0,254}, 106 | { 0, 0,250},{ 0, 0,246},{ 0, 0,242},{ 0, 0,238},{ 0, 0,234},{ 0, 0,230},{ 0, 0,226},{ 0, 0,222},{ 0, 0,218},{ 0, 0,214},{ 0, 0,210},{ 0, 0,206},{ 0, 0,202},{ 0, 0,198},{ 0, 0,194},{ 0, 0,191},{ 0, 0,187},{ 0, 0,183},{ 0, 0,179},{ 0, 0,175},{ 0, 0,171},{ 0, 0,167},{ 0, 0,163},{ 0, 0,159},{ 0, 0,155},{ 0, 0,151},{ 0, 0,147},{ 0, 0,143},{ 0, 0,139},{ 0, 0,135},{ 0, 0,131},{ 0, 0,128} 107 | }; 108 | for (int i = 0; i < 256; i++){ 109 | memcpy(m_colorTbl[i], gray2ColorTb[i], 3); 110 | } 111 | } 112 | 113 | #endif // _UTIL_H_ 114 | 115 | -------------------------------------------------------------------------------- /include/CPM_include/Vector.h: -------------------------------------------------------------------------------- 1 | #pragma once 2 | 3 | #include 4 | #include 5 | #include 6 | #include "project.h" 7 | 8 | using namespace std; 9 | 10 | template 11 | class Vector 12 | { 13 | protected: 14 | int nDim; 15 | T* pData; 16 | public: 17 | Vector(void); 18 | Vector(int ndim,const T *data=NULL); 19 | Vector(const Vector& vect); 20 | ~Vector(void); 21 | void releaseData(); 22 | void allocate(int ndim); 23 | void allocate(const Vector& vect){allocate(vect.nDim);}; 24 | void copyData(const Vector& vect); 25 | void dimcheck(const Vector& vect) const; 26 | void reset(); 27 | double norm2() const; 28 | 29 | T sum() const; 30 | 31 | void printVector(); 32 | 33 | // access the members 34 | const T* data() const{return (const T*)pData;}; 35 | T* data() {return pData;}; 36 | int dim() const {return nDim;}; 37 | inline bool matchDimension(int _ndim) const {if(nDim==_ndim) return true;else return false;}; 38 | inline bool matchDimension(const Vector& vect) const {return matchDimension(vect.nDim);}; 39 | 40 | // operators 41 | inline T operator[](int index) const {return pData[index];}; 42 | inline T& operator[](int index){return *(pData+index);}; 43 | Vector& operator=(const Vector& vect); 44 | 45 | //const Vector& operator/(double val) const 46 | //{ 47 | // Vector result(nDim); 48 | // for(int i =0;i& operator+=(const Vector& vect); 54 | Vector& operator*=(const Vector& vect); 55 | Vector& operator-=(const Vector& vect); 56 | Vector& operator/=(const Vector& vect); 57 | 58 | Vector& operator+=(double val); 59 | Vector& operator*=(double val); 60 | Vector& operator-=(double val); 61 | Vector& operator/=(double val); 62 | 63 | //friend const Vector operator+(const Vector& vect1,const Vector& vect2); 64 | //friend const Vector operator*(const Vector& vect1,const Vector& vect2); 65 | //friend const Vector operator-(const Vector& vect1,const Vector& vect2); 66 | //friend const Vector operator/(const Vector& vect1,const Vector& vect2); 67 | 68 | //friend const Vector operator+(const Vector& vect1,double val); 69 | //friend const Vector operator*(const Vector& vect1,double val); 70 | //friend const Vector operator-(const Vector& vect1,double val); 71 | //friend Vector operator/(const Vector& vect,double val); 72 | 73 | friend double innerproduct(const Vector& vect1,const Vector& vect2) 74 | { 75 | double result = 0; 76 | for(int i = 0;i >& vect); 82 | 83 | //friend const Vector concatenate(const vector>& vect){Vector result; result.concatenate(vect); return result;}; 84 | bool write(ofstream& myfile) 85 | { 86 | myfile.write((char *)&nDim,sizeof(int)); 87 | myfile.write((char *)pData,sizeof(T)*nDim); 88 | return true; 89 | } 90 | bool read(ifstream& myfile) 91 | { 92 | myfile.read((char *)&nDim,sizeof(int)); 93 | allocate(nDim); 94 | myfile.read((char *)pData,sizeof(T)*nDim); 95 | return true; 96 | } 97 | T mean(int N=-1) const 98 | { 99 | if(N==-1) 100 | N = nDim; 101 | T result = 0; 102 | for(int i = 0;i 113 | //double innerproduct(const Vector& vect1,const Vector& vect2) 114 | //{ 115 | // double result = 0; 116 | // for(int i = 0;i 122 | Vector::Vector(void) 123 | { 124 | nDim=0; 125 | pData=NULL; 126 | } 127 | 128 | template 129 | Vector::Vector(int ndim, const T *data) 130 | { 131 | nDim=ndim; 132 | pData=new T[nDim]; 133 | if(data!=NULL) 134 | memcpy(pData,data,sizeof(T)*nDim); 135 | else 136 | memset(pData,0,sizeof(T)*nDim); 137 | } 138 | 139 | template 140 | Vector::Vector(const Vector& vect) 141 | { 142 | nDim=0; 143 | pData=NULL; 144 | copyData(vect); 145 | } 146 | 147 | template 148 | Vector::~Vector(void) 149 | { 150 | releaseData(); 151 | } 152 | 153 | template 154 | void Vector::releaseData() 155 | { 156 | if(pData!=NULL) 157 | delete []pData; 158 | pData=NULL; 159 | nDim=0; 160 | } 161 | 162 | template 163 | void Vector::allocate(int ndim) 164 | { 165 | releaseData(); 166 | nDim=ndim; 167 | if(nDim>0) 168 | { 169 | pData=new T[nDim]; 170 | reset(); 171 | } 172 | } 173 | 174 | 175 | template 176 | void Vector::copyData(const Vector &vect) 177 | { 178 | if(nDim!=vect.nDim) 179 | { 180 | releaseData(); 181 | nDim=vect.nDim; 182 | pData=new T[nDim]; 183 | } 184 | memcpy(pData,vect.pData,sizeof(T)*nDim); 185 | } 186 | 187 | template 188 | void Vector::dimcheck(const Vector &vect) const 189 | { 190 | if(nDim!=vect.nDim) 191 | cout<<"The dimensions of the vectors don't match!"< 195 | void Vector::reset() 196 | { 197 | if(pData!=NULL) 198 | memset(pData,0,sizeof(T)*nDim); 199 | } 200 | 201 | 202 | template 203 | T Vector::sum() const 204 | { 205 | T total = 0; 206 | for(int i=0;i 212 | double Vector::norm2() const 213 | { 214 | double temp=0; 215 | for(int i=0;i 221 | void Vector::printVector() 222 | { 223 | for(int i=0;i 233 | Vector& Vector::operator =(const Vector &vect) 234 | { 235 | copyData(vect); 236 | return *this; 237 | } 238 | 239 | template 240 | Vector& Vector::operator +=(const Vector &vect) 241 | { 242 | dimcheck(vect); 243 | for(int i=0;i 249 | Vector& Vector::operator *=(const Vector &vect) 250 | { 251 | dimcheck(vect); 252 | for(int i=0;i 258 | Vector& Vector::operator -=(const Vector &vect) 259 | { 260 | dimcheck(vect); 261 | for(int i=0;i 267 | Vector& Vector::operator /=(const Vector &vect) 268 | { 269 | dimcheck(vect); 270 | for(int i=0;i 276 | Vector& Vector::operator +=(double val) 277 | { 278 | for(int i=0;i 284 | Vector& Vector::operator *=(double val) 285 | { 286 | for(int i=0;i 292 | Vector& Vector::operator -=(double val) 293 | { 294 | for(int i=0;i 300 | Vector& Vector::operator /=(double val) 301 | { 302 | for(int i=0;i 309 | const Vector operator+(const Vector& vect1,const Vector& vect2) 310 | { 311 | vect1.dimcheck(vect2); 312 | Vector result(vect1); 313 | result+=vect2; 314 | return result; 315 | } 316 | 317 | template 318 | const Vector operator-(const Vector& vect1,const Vector& vect2) 319 | { 320 | vect1.dimcheck(vect2); 321 | Vector result(vect1); 322 | result-=vect2; 323 | return result; 324 | } 325 | 326 | template 327 | const Vector operator*(const Vector& vect1,const Vector& vect2) 328 | { 329 | vect1.dimcheck(vect2); 330 | Vector result(vect1); 331 | result*=vect2; 332 | return result; 333 | } 334 | 335 | template 336 | const Vector operator/(const Vector& vect1,const Vector& vect2) 337 | { 338 | vect1.dimcheck(vect2); 339 | Vector result(vect1); 340 | result/=vect2; 341 | return result; 342 | } 343 | 344 | template 345 | Vector operator+(const Vector& vect,double val) 346 | { 347 | Vector result(vect); 348 | result+=val; 349 | return result; 350 | } 351 | 352 | template 353 | Vector operator-(const Vector& vect,double val) 354 | { 355 | Vector result(vect); 356 | result-=val; 357 | return result; 358 | } 359 | 360 | template 361 | Vector operator*(const Vector& vect,double val) 362 | { 363 | Vector result(vect); 364 | result*=val; 365 | return result; 366 | } 367 | 368 | template 369 | Vector operator/(const Vector& vect,double val) 370 | { 371 | Vector result(vect); 372 | result/=val; 373 | return result; 374 | } 375 | 376 | 377 | template 378 | double innerproduct(const Vector& vect1,const Vector& vect2) 379 | { 380 | vect1.dimcheck(vect2); 381 | double result=0; 382 | for(int i=0;i 388 | void Vector::concatenate(const vector< Vector >& vect) 389 | { 390 | releaseData(); 391 | nDim = 0; 392 | for(int i = 0;i0) 421 | { 422 | allocate(nDim); 423 | if(file.read((char *)pData,sizeof(double)*nDim)!=sizeof(double)*nDim) 424 | return false; 425 | } 426 | return true; 427 | } 428 | 429 | #endif 430 | 431 | 432 | #ifdef _MATLAB 433 | 434 | template 435 | void Vector::readVector(const mxArray* prhs) 436 | { 437 | if(pData!=NULL) 438 | delete pData; 439 | int nElements = mxGetNumberOfDimensions(prhs); 440 | if(nElements>2) 441 | mexErrMsgTxt("A vector is expected to be loaded!"); 442 | const int* dims = mxGetDimensions(prhs); 443 | nDim = dims[0]*dims[1]; 444 | pData = new T[nDim]; 445 | double* ptr = (double*)mxGetData(prhs); 446 | for(int i =0;i 451 | void Vector::writeVector(mxArray*& plhs) const 452 | { 453 | int dims[2]; 454 | dims[0]=nDim;dims[1]=1; 455 | plhs=mxCreateNumericArray(2, dims,mxDOUBLE_CLASS, mxREAL); 456 | double *ptr = (double*)mxGetData(plhs); 457 | for(int i =0;i 4 | 5 | template 6 | void _Release1DBuffer(T* pBuffer) 7 | { 8 | if(pBuffer!=NULL) 9 | delete []pBuffer; 10 | pBuffer=NULL; 11 | } 12 | 13 | template 14 | void _Rlease2DBuffer(T** pBuffer,size_t nElements) 15 | { 16 | for(size_t i=0;i 32 | T1 __min(T1 a, T2 b) 33 | { 34 | return (a>b)?b:a; 35 | } 36 | 37 | template 38 | T1 __max(T1 a, T2 b) 39 | { 40 | return (a 14 | #include 15 | #include "constants.h" 16 | #include 17 | #include "guidedfilter.h" 18 | #include "Pixel.h" 19 | #include "Minimization.h" 20 | 21 | void getGlobalColorModel(cv::Mat &image, std::vector &means, std::vector &covs, double tau); 22 | bool getGlobalColorModelVideo(std::vector &means, 23 | std::vector &covs, std::vector frames, int frames_to_stack, double tau); 24 | 25 | void saveColorModelAsImage(const char * filename, std::vector means, std::vector covs); 26 | 27 | float distHistogram(cv::Mat img1, cv::Mat img2); 28 | bool isCMRepresentative(std::vector means, std::vector covs, cv::Mat frame); 29 | 30 | 31 | #endif // COLORMODEL_H_ 32 | -------------------------------------------------------------------------------- /include/Minimization.h: -------------------------------------------------------------------------------- 1 | /* 2 | * Minimization.h 3 | * 4 | * Author: Sebastian Lutz 5 | * University: Trinity College Dublin 6 | * School: Computer Science and Statistics 7 | * Project: V-SENSE 8 | */ 9 | 10 | #ifndef MINIMIZATION_H_ 11 | #define MINIMIZATION_H_ 12 | 13 | #include 14 | #include 15 | #include 16 | #include 17 | #include "constants.h" 18 | 19 | typedef double (* vFunctionCall)(std::vector v, void* params); // pointer to function returning double 20 | typedef std::vector (* vFunctionCall2)(std::vector v, void* params); 21 | 22 | //static variables for debugging (which is reached: maxIterLineSeach, cg_max_iter or isMin) 23 | extern int reach_ls_iter; 24 | extern int total_line_search; 25 | extern int reach_cg_iter; 26 | extern int reach_isMin_iter; 27 | 28 | double energy(std::vector