├── README.md ├── ECO ├── regularization_filter.hpp ├── metrics.hpp ├── optimize_scores.hpp ├── scale_filter.hpp ├── interpolator.hpp ├── metrics.cc ├── wrappers.hpp ├── gradient.hpp ├── feature_operator.hpp ├── feature_extractor.hpp ├── sse.hpp ├── sample_update.hpp ├── eco.hpp ├── training.hpp ├── interpolator.cc ├── regularization_filter.cc ├── ffttools.hpp ├── recttools.hpp ├── optimize_scores.cc ├── fhog.hpp ├── scale_filter.cc ├── parameters.hpp ├── feature_operator.cc ├── eco_unittest.cc ├── sample_update.cc ├── debug.hpp ├── gradient.cpp └── ffttools.cc ├── KCF ├── labdata.hpp ├── recttools.hpp ├── fhog.hpp ├── ffttools.hpp └── kcftracker.hpp ├── MTCNN ├── helpers.hpp ├── face_detector.hpp └── face_detector.cpp └── DaSiamRPN └── dasiamrpntracker.h /README.md: -------------------------------------------------------------------------------- 1 | # Object-tracking-system-based-on-deep-learning 2 | Object tracking system based on deep learning. 3 | 4 | Master-Jetson TX2, ROS-image + control, image (DL) - detection + tracking, control - TurtleBot 5 | 6 | 7 | Video: https://www.bilibili.com/video/av49678702/ 8 | 9 | Blog: https://blog.csdn.net/qq_35999634/article/details/89375456 10 | 11 | Wechat Official Account: ScienceRecord 12 | -------------------------------------------------------------------------------- /ECO/regularization_filter.hpp: -------------------------------------------------------------------------------- 1 | #ifndef REGULARIZATION_FILTER_HPP 2 | #define REGULARIZATION_FILTER_HPP 3 | 4 | #include 5 | #include 6 | 7 | #include "parameters.hpp" 8 | #include "ffttools.hpp" 9 | #include "debug.hpp" 10 | 11 | namespace eco 12 | { 13 | cv::Mat get_regularization_filter(cv::Size sz, 14 | cv::Size2f target_sz, 15 | const EcoParameters &params); 16 | } 17 | #endif -------------------------------------------------------------------------------- /ECO/metrics.hpp: -------------------------------------------------------------------------------- 1 | #ifndef
METRICS_HPP 2 | #define METRICS_HPP 3 | 4 | //#include 5 | #include 6 | #include 7 | 8 | class Metrics 9 | { 10 | public: 11 | float center_error(const cv::Rect2f bbox, const cv::Rect2f bboxGroundtruth); 12 | float iou(const cv::Rect2f bbox, const cv::Rect2f bboxGroundtruth); 13 | cv::Rect2f intersection(const cv::Rect2f bbox, 14 | const cv::Rect2f bboxGroundtruth); 15 | float auc(); 16 | }; 17 | 18 | #endif -------------------------------------------------------------------------------- /KCF/labdata.hpp: -------------------------------------------------------------------------------- 1 | namespace kcf 2 | { 3 | const int nClusters = 15; 4 | float data[nClusters][3] = { 5 | {161.317504, 127.223401, 128.609333}, 6 | {142.922425, 128.666965, 127.532319}, 7 | {67.879757, 127.721830, 135.903311}, 8 | {92.705062, 129.965717, 137.399500}, 9 | {120.172257, 128.279647, 127.036493}, 10 | {195.470568, 127.857070, 129.345415}, 11 | {41.257102, 130.059468, 132.675336}, 12 | {12.014861, 129.480555, 127.064714}, 13 | {226.567086, 127.567831, 136.345727}, 14 | {154.664210, 131.676606, 156.481669}, 15 | {121.180447, 137.020793, 153.433743}, 16 | {87.042204, 137.211742, 98.614874}, 17 | {113.809537, 106.577104, 157.818094}, 18 | {81.083293, 170.051905, 148.904079}, 19 | {45.015485, 138.543124, 102.402528}}; 20 | } -------------------------------------------------------------------------------- /ECO/optimize_scores.hpp: -------------------------------------------------------------------------------- 1 | #ifndef OPTIMIZE_SCORES_HPP 2 | #define OPTIMIZE_SCORES_HPP 3 | 4 | //#include 5 | #include 6 | 7 | #include "ffttools.hpp" 8 | #include "debug.hpp" 9 | 10 | namespace eco 11 | { 12 | class OptimizeScores 13 | { 14 | public: 15 | virtual ~OptimizeScores() {} 16 | OptimizeScores() {} 17 | OptimizeScores(std::vector &scores_fs, int ite) 18 | : scores_fs_(scores_fs), iterations_(ite) {} 19 | 20 | void compute_scores(); 21 | 22 | inline int get_scale_ind() const { return scale_ind_; } 23 
| inline float get_disp_row() const { return disp_row_; } 24 | inline float get_disp_col() const { return disp_col_; } 25 | inline float get_max_score() const { return max_score_; } 26 | 27 | private: 28 | std::vector scores_fs_; 29 | int iterations_; 30 | 31 | int scale_ind_; 32 | float disp_row_; 33 | float disp_col_; 34 | float max_score_; 35 | }; 36 | } // namespace eco 37 | #endif 38 | -------------------------------------------------------------------------------- /ECO/scale_filter.hpp: -------------------------------------------------------------------------------- 1 | #ifndef SCALE_FILTER_HPP 2 | #define SCALE_FILTER_HPP 3 | 4 | #include "parameters.hpp" 5 | #include "ffttools.hpp" 6 | #include "recttools.hpp" 7 | #include "feature_extractor.hpp" 8 | #include "debug.hpp" 9 | #include 10 | 11 | namespace eco 12 | { 13 | 14 | class ScaleFilter 15 | { 16 | public: 17 | ScaleFilter(){}; 18 | virtual ~ScaleFilter(){}; 19 | void init(int &nScales, float &scale_step, const EcoParameters &params); 20 | float scale_filter_track(const cv::Mat &im, const cv::Point2f &pos, const cv::Size2f &base_target_sz, const float &currentScaleFactor, const EcoParameters &params); 21 | cv::Mat extract_scale_sample(const cv::Mat &im, const cv::Point2f &posf, const cv::Size2f &base_target_sz, vector &scaleFactors, const cv::Size &scale_model_sz); 22 | 23 | private: 24 | vector scaleSizeFactors_; 25 | vector interpScaleFactors_; 26 | cv::Mat yf_; 27 | vector window_; 28 | bool max_scale_dim_; 29 | }; 30 | } // namespace eco 31 | #endif -------------------------------------------------------------------------------- /ECO/interpolator.hpp: -------------------------------------------------------------------------------- 1 | #ifndef INTERPOLATOR_HPP 2 | #define INTERPOLATOR_HPP 3 | 4 | #include 5 | #include 6 | #include "debug.hpp" 7 | 8 | namespace eco{ 9 | class Interpolator 10 | { 11 | public: 12 | Interpolator(); 13 | virtual ~Interpolator(); 14 | static inline float mat_cos1(float x) 15 | { 16 |
return (cos(x * M_PI)); 17 | } 18 | static inline float mat_sin1(float x) 19 | { 20 | return (sin(x * M_PI)); 21 | } 22 | static inline float mat_cos2(float x) 23 | { 24 | return (cos(2 * x * M_PI)); 25 | } 26 | static inline float mat_sin2(float x) 27 | { 28 | return (sin(2 * x * M_PI)); 29 | } 30 | static inline float mat_cos4(float x) 31 | { 32 | return (cos(4 * x * M_PI)); 33 | } 34 | static inline float mat_sin4(float x) 35 | { 36 | return (sin(4 * x * M_PI)); 37 | } 38 | 39 | static void get_interp_fourier(cv::Size filter_sz, 40 | cv::Mat &interp1_fs, 41 | cv::Mat &interp2_fs, 42 | float a); 43 | 44 | static cv::Mat cubic_spline_fourier(cv::Mat f, float a); 45 | }; 46 | } 47 | 48 | #endif -------------------------------------------------------------------------------- /MTCNN/helpers.hpp: -------------------------------------------------------------------------------- 1 | #ifndef _HELPERS_HPP_ 2 | #define _HELPERS_HPP_ 3 | 4 | #include 5 | #include 6 | 7 | class Timer { 8 | private: 9 | std::chrono::time_point t1; 10 | public: 11 | inline void start() { 12 | t1 = std::chrono::system_clock::now(); 13 | } 14 | inline double stop() { 15 | auto t2 = std::chrono::system_clock::now(); 16 | return std::chrono::duration_cast(t2 - t1).count(); 17 | } 18 | }; 19 | 20 | inline cv::Mat cropImage(cv::Mat img, cv::Rect r) { 21 | cv::Mat m = cv::Mat::zeros(r.height, r.width, img.type()); 22 | int dx = std::abs(std::min(0, r.x)); 23 | if (dx > 0) { r.x = 0; } 24 | r.width -= dx; 25 | int dy = std::abs(std::min(0, r.y)); 26 | if (dy > 0) { r.y = 0; } 27 | r.height -= dy; 28 | int dw = std::abs(std::min(0, img.cols - 1 - (r.x + r.width))); 29 | r.width -= dw; 30 | int dh = std::abs(std::min(0, img.rows - 1 - (r.y + r.height))); 31 | r.height -= dh; 32 | if (r.width > 0 && r.height > 0) { 33 | img(r).copyTo(m(cv::Range(dy, dy + r.height), cv::Range(dx, dx + r.width))); 34 | } 35 | return m; 36 | } 37 | 38 | inline void drawAndShowFace(cv::Mat img, cv::Rect r, const std::vector& 
pts) { 39 | cv::Mat outImg; 40 | img.convertTo(outImg, CV_8UC3); 41 | cv::rectangle(outImg, r, cv::Scalar(0, 0, 255)); 42 | for (size_t i = 0; i < pts.size(); ++i) { 43 | cv::circle(outImg, pts[i], 3, cv::Scalar(0, 0, 255)); 44 | } 45 | cv::imshow("test", outImg); 46 | cv::waitKey(0); 47 | } 48 | 49 | #endif //_HELPERS_HPP_ -------------------------------------------------------------------------------- /ECO/metrics.cc: -------------------------------------------------------------------------------- 1 | #include "metrics.hpp" 2 | 3 | float Metrics::center_error(const cv::Rect2f bbox, const cv::Rect2f bboxGroundtruth) 4 | { 5 | float cx = bbox.x + bbox.width / 2.0f; 6 | float cy = bbox.y + bbox.height / 2.0f; 7 | float cx_gt = bboxGroundtruth.x + bboxGroundtruth.width / 2.0f; 8 | float cy_gt = bboxGroundtruth.y + bboxGroundtruth.height / 2.0f; 9 | float result = std::sqrt(std::pow((cx - cx_gt), 2) + 10 | std::pow((cy - cy_gt), 2)); 11 | return result; 12 | } 13 | 14 | float Metrics::iou(const cv::Rect2f bbox, const cv::Rect2f bboxGroundtruth) 15 | { 16 | cv::Rect2f inter = Metrics::intersection(bbox, bboxGroundtruth); 17 | float area_bbox = bbox.area(); 18 | float area_bbox_gt = bboxGroundtruth.area(); 19 | float area_intersection = inter.area(); 20 | float iou = area_bbox + area_bbox_gt - area_intersection; 21 | iou = area_intersection / (iou + 1e-12); 22 | return iou; 23 | } 24 | 25 | cv::Rect2f Metrics::intersection(const cv::Rect2f bbox, 26 | const cv::Rect2f bboxGroundtruth) 27 | { 28 | float x1, y1, x2, y2, w, h; 29 | x1 = std::max(bbox.x, bboxGroundtruth.x); 30 | y1 = std::max(bbox.y, bboxGroundtruth.y); 31 | x2 = std::min(bbox.x + bbox.width, bboxGroundtruth.x + bboxGroundtruth.width); 32 | y2 = std::min(bbox.y + bbox.height, bboxGroundtruth.y + bboxGroundtruth.height); 33 | w = std::max(0.0f, x2 - x1); 34 | h = std::max(0.0f, y2 - y1); 35 | 36 | cv::Rect2f result(x1, y1, w, h); 37 | return result; 38 | } 39 | 40 | float Metrics::auc() 41 | { 42 | } 
-------------------------------------------------------------------------------- /ECO/wrappers.hpp: -------------------------------------------------------------------------------- 1 | /******************************************************************************* 2 | * Piotr's Computer Vision Matlab Toolbox Version 3.00 3 | * Copyright 2014 Piotr Dollar. [pdollar-at-gmail.com] 4 | * Licensed under the Simplified BSD License [see external/bsd.txt] 5 | *******************************************************************************/ 6 | #ifndef _WRAPPERS_HPP_ 7 | #define _WRAPPERS_HPP_ 8 | 9 | #include 10 | 11 | // wrapper functions if compiling from C/C++ 12 | inline void wrError(const char *errormsg) { throw errormsg; } 13 | inline void *wrCalloc(size_t num, size_t size) { return calloc(num, size); } 14 | inline void *wrMalloc(size_t size) { return malloc(size); } 15 | inline void wrFree(void *ptr) { free(ptr); } 16 | 17 | // platform independent aligned memory allocation (see also alFree) 18 | // __m128 should be 128/8=16 byte aligned 19 | inline void *alMalloc(size_t size, int alignment) 20 | { 21 | const size_t pSize = sizeof(void *), a = alignment - 1; 22 | void *raw = wrMalloc(size + a + pSize); 23 | // get the aligned address, alignment should be 2^N. 24 | void *aligned = (void *)(((size_t)raw + pSize + a) & ~a); 25 | *(void **)((size_t)aligned - pSize) = raw; // save address of raw in -1 26 | return aligned; 27 | } 28 | 29 | // platform independent alignned memory de-allocation (see also alMalloc) 30 | inline void alFree(void *aligned) 31 | { 32 | // raw: the address of (void *) pointer. 
33 | // aligned: the address of a (void *) pointer now point to (char *) 34 | // - sizeof(void *): minus the address by sizeof(void *) 35 | // (void **): the address of a pointer point to a (void *) pointer 36 | // *: the pointer point to a (void *) pointer = the address of (void *)pointer 37 | void *raw = *(void **)((char *)aligned - sizeof(void *)); 38 | wrFree(raw); 39 | } 40 | 41 | #endif 42 | -------------------------------------------------------------------------------- /MTCNN/face_detector.hpp: -------------------------------------------------------------------------------- 1 | #ifndef _FACE_DETECTOR_HPP_ 2 | #define _FACE_DETECTOR_HPP_ 3 | 4 | #include 5 | 6 | #include 7 | #include 8 | 9 | namespace mtcnn { 10 | 11 | const int NUM_REGRESSIONS = 4; 12 | const int NUM_PTS = 5; 13 | 14 | struct BBox { 15 | float x1; 16 | float y1; 17 | float x2; 18 | float y2; 19 | cv::Rect getRect() const; 20 | BBox getSquare() const; 21 | }; 22 | 23 | struct Face { 24 | BBox bbox; 25 | float regression[NUM_REGRESSIONS]; 26 | float score; 27 | float ptsCoords[2 * NUM_PTS]; 28 | 29 | static void applyRegression(std::vector& faces, bool addOne = false); 30 | static void bboxes2Squares(std::vector& faces); 31 | }; 32 | 33 | class FaceDetector { 34 | private: 35 | boost::shared_ptr< caffe::Net > pNet_; 36 | boost::shared_ptr< caffe::Net > rNet_; 37 | boost::shared_ptr< caffe::Net > oNet_; 38 | boost::shared_ptr< caffe::Net > lNet_; 39 | float pThreshold_; 40 | float rThreshold_; 41 | float oThreshold_; 42 | bool useLNet_; 43 | void initNetInput(boost::shared_ptr< caffe::Net > net, cv::Mat img); 44 | void initNetInput(boost::shared_ptr< caffe::Net > net, std::vector& imgs); 45 | std::vector step1(cv::Mat img, float minFaceSize, float scaleFactor); 46 | std::vector step2(cv::Mat img, const std::vector& faces); 47 | std::vector step3(cv::Mat img, const std::vector& faces); 48 | std::vector step4(cv::Mat img, const std::vector& faces); 49 | std::vector composeFaces(const 
caffe::Blob* regressionsBlob, 50 | const caffe::Blob* scoresBlob, 51 | float scale); 52 | static std::vector nonMaximumSuppression(std::vector faces, float threshold, bool useMin = false); 53 | public: 54 | FaceDetector(const std::string& modelDir, 55 | float pThreshold = 0.6f, 56 | float rThreshold = 0.7f, 57 | float oThreshold = 0.7f, 58 | bool useLNet = false, 59 | bool useGPU = true, 60 | int deviceID = 0); 61 | std::vector detect(cv::Mat img, float minFaceSize, float scaleFactor); 62 | }; 63 | 64 | } // namespace mtcnn 65 | 66 | #endif // _FACE_DETECTOR_HPP_ 67 | -------------------------------------------------------------------------------- /ECO/gradient.hpp: -------------------------------------------------------------------------------- 1 | /******************************************************************************* 2 | * Piotr's Computer Vision Matlab Toolbox Version 3.30 3 | * Copyright 2014 Piotr Dollar & Ron Appel. [pdollar-at-gmail.com] 4 | * Licensed under the Simplified BSD License [see external/bsd.txt] 5 | *******************************************************************************/ 6 | #ifndef GRADIENTMEX_HPP 7 | #define GRADIENTMEX_HPP 8 | 9 | #include "wrappers.hpp" 10 | #include 11 | #include "string.h" 12 | #include "sse.hpp" 13 | #include 14 | 15 | #include 16 | #include 17 | 18 | // compute x and y gradients for just one column (uses sse) 19 | void grad1(float *I, float *Gx, float *Gy, int h, int w, int x); 20 | 21 | // compute x and y gradients at each location (uses sse) 22 | void grad2(float *I, float *Gx, float *Gy, int h, int w, int d); 23 | 24 | // build lookup table a[] s.t. 
a[x*n]~=acos(x) for x in [-1,1] 25 | float *acosTable(); 26 | 27 | // compute gradient magnitude and orientation at each location (uses sse) 28 | void gradMag(float *I, float *M, float *O, int h, int w, int d, bool full); 29 | 30 | // normalize gradient magnitude at each location (uses sse) 31 | void gradMagNorm(float *M, float *S, int h, int w, float norm); 32 | 33 | // helper for gradHist, quantize O and M into O0, O1 and M0, M1 (uses sse) 34 | void gradQuantize(float *O, float *M, int *O0, int *O1, float *M0, float *M1, 35 | int nb, int n, float norm, int nOrients, bool full, bool interpolate); 36 | 37 | // compute nOrients gradient histograms per bin x bin block of pixels 38 | void gradHist(float *M, float *O, float *H, int h, int w, 39 | int bin, int nOrients, int softBin, bool full); 40 | 41 | /******************************************************************************/ 42 | 43 | // HOG helper: compute 2x2 block normalization values (padded by 1 pixel) 44 | float *hogNormMatrix(float *H, int nOrients, int hb, int wb, int bin); 45 | 46 | // HOG helper: compute HOG or FHOG channels 47 | void hogChannels(float *H, const float *R, const float *N, 48 | int hb, int wb, int nOrients, float clip, int type); 49 | 50 | // compute HOG features 51 | void hog(float *M, float *O, float *H, int h, int w, int binSize, 52 | int nOrients, int softBin, bool full, float clip); 53 | 54 | // compute FHOG features 55 | void fhog(float *M, float *O, float *H, int h, int w, int binSize, 56 | int nOrients, int softBin, float clip); 57 | 58 | #endif -------------------------------------------------------------------------------- /ECO/feature_operator.hpp: -------------------------------------------------------------------------------- 1 | #ifndef FEATURE_OPERATOR_HPP 2 | #define FEATURE_OPERATOR_HPP 3 | 4 | #include 5 | #include 6 | #include 7 | #include "parameters.hpp" 8 | #include "ffttools.hpp" 9 | #include "recttools.hpp" 10 | #include "debug.hpp" 11 | 12 | namespace eco 13 | { 
14 | template 15 | extern std::vector operator+(const std::vector &a, 16 | const std::vector &b) 17 | { 18 | assert(a.size() == b.size()); 19 | std::vector result; 20 | for (unsigned int i = 0; i < a.size(); ++i) 21 | { 22 | result.push_back(a[i] + b[i]); 23 | } 24 | return result; 25 | } 26 | 27 | template 28 | extern std::vector operator-(const std::vector &a, 29 | const std::vector &b) 30 | { 31 | assert(a.size() == b.size()); 32 | std::vector result; 33 | for (unsigned int i = 0; i < a.size(); ++i) 34 | { 35 | result.push_back(a[i] - b[i]); 36 | } 37 | return result; 38 | } 39 | 40 | template 41 | extern std::vector operator*(const std::vector &a, const float scale) 42 | { 43 | std::vector result; 44 | for (unsigned int i = 0; i < a.size(); ++i) 45 | { 46 | result.push_back(a[i] * scale); 47 | } 48 | return result; 49 | } 50 | 51 | extern ECO_FEATS do_dft(const ECO_FEATS &xlw); 52 | extern ECO_FEATS do_windows(const ECO_FEATS &xl, vector &cos_win); 53 | 54 | extern void FilterSymmetrize(ECO_FEATS &hf); 55 | extern vector init_projection_matrix(const ECO_FEATS &init_sample, 56 | const vector &compressed_dim, 57 | const vector &feature_dim); 58 | extern ECO_FEATS FeatureProjection(const ECO_FEATS &x, 59 | const std::vector &projection_matrix); 60 | extern ECO_FEATS FeatureProjectionMultScale(const ECO_FEATS &x, 61 | const std::vector &projection_matrix); 62 | 63 | extern float FeatureComputeInnerProduct(const ECO_FEATS &feat1, 64 | const ECO_FEATS &feat2); 65 | extern float FeatureComputeEnergy(const ECO_FEATS &feat); 66 | extern ECO_FEATS FeautreComputePower2(const ECO_FEATS &feats); 67 | extern std::vector FeatureComputeScores(const ECO_FEATS &x, 68 | const ECO_FEATS &f); 69 | extern std::vector FeatureVectorization(const ECO_FEATS &x); 70 | 71 | extern ECO_FEATS FeatureVectorMultiply(const ECO_FEATS &x, 72 | const std::vector &y, 73 | const bool _conj = 0); // feature * yf 74 | 75 | extern ECO_FEATS FeatureDotMultiply(const ECO_FEATS &a, const ECO_FEATS &b); 
76 | extern ECO_FEATS FeatureDotDivide(const ECO_FEATS &a, const ECO_FEATS &b); 77 | } // namespace eco 78 | 79 | #endif -------------------------------------------------------------------------------- /ECO/feature_extractor.hpp: -------------------------------------------------------------------------------- 1 | #ifndef FEATURE_EXTRACTOR_HPP 2 | #define FEATURE_EXTRACTOR_HPP 3 | 4 | #include 5 | #include 6 | #include 7 | #include 8 | #include 9 | #include 10 | #include 11 | #include 12 | 13 | #include "parameters.hpp" 14 | #include "ffttools.hpp" 15 | #include "recttools.hpp" 16 | #include "fhog.hpp" 17 | #include "debug.hpp" 18 | 19 | #ifdef USE_SIMD 20 | #include "gradient.hpp" 21 | #endif 22 | 23 | #ifdef USE_CAFFE 24 | #include 25 | #include 26 | #include 27 | #endif 28 | 29 | namespace eco 30 | { 31 | class FeatureExtractor 32 | { 33 | public: 34 | FeatureExtractor() {} 35 | virtual ~FeatureExtractor(){}; 36 | 37 | ECO_FEATS extractor(const cv::Mat image, 38 | const cv::Point2f pos, 39 | const vector scales, 40 | const EcoParameters &params, 41 | const bool &is_color_image); 42 | 43 | cv::Mat sample_patch(const cv::Mat im, 44 | const cv::Point2f pos, 45 | cv::Size2f sample_sz, 46 | cv::Size2f input_sz); 47 | 48 | #ifdef USE_SIMD 49 | vector get_hog_features_simd(const vector ims); 50 | #else 51 | vector get_hog_features(const vector ims); 52 | #endif 53 | vector hog_feature_normalization(vector &hog_feat_maps); 54 | inline vector get_hog_feats() const { return hog_feat_maps_; } 55 | 56 | vector get_cn_features(const vector ims); 57 | vector cn_feature_normalization(vector &cn_feat_maps); 58 | inline vector get_cn_feats() const { return cn_feat_maps_; } 59 | 60 | #ifdef USE_CAFFE 61 | ECO_FEATS get_cnn_layers(vector im, const cv::Mat &deep_mean_mat); 62 | cv::Mat sample_pool(const cv::Mat &im, int smaple_factor, int stride); 63 | void cnn_feature_normalization(ECO_FEATS &feature); 64 | inline ECO_FEATS get_cnn_feats() const { return cnn_feat_maps_; } 65 | #endif
66 | 67 | private: 68 | EcoParameters params_; 69 | 70 | HogFeatures hog_features_; 71 | int hog_feat_ind_ = -1; 72 | vector hog_feat_maps_; 73 | 74 | ColorspaceFeatures colorspace_features_; 75 | int colorspace_feat_ind_ = -1; 76 | vector colorspace_feat_maps_; 77 | 78 | CnFeatures cn_features_; 79 | int cn_feat_ind_ = -1; 80 | vector cn_feat_maps_; 81 | 82 | IcFeatures ic_features_; 83 | int ic_feat_ind_ = -1; 84 | vector ic_feat_maps_; 85 | 86 | #ifdef USE_CAFFE 87 | boost::shared_ptr> net_; 88 | CnnFeatures cnn_features_; 89 | int cnn_feat_ind_ = -1; 90 | ECO_FEATS cnn_feat_maps_; 91 | #endif 92 | }; 93 | } // namespace eco 94 | #endif 95 | -------------------------------------------------------------------------------- /ECO/sse.hpp: -------------------------------------------------------------------------------- 1 | /******************************************************************************* 2 | * Piotr's Computer Vision Matlab Toolbox Version 3.23 3 | * Copyright 2014 Piotr Dollar. 
[pdollar-at-gmail.com] 4 | * Licensed under the Simplified BSD License [see external/bsd.txt] 5 | *******************************************************************************/ 6 | // Intel Intrinsics Guide: https://software.intel.com/sites/landingpage/IntrinsicsGuide/# 7 | 8 | #ifndef _SSE_HPP_ 9 | #define _SSE_HPP_ 10 | 11 | #ifdef USE_NEON 12 | #include "sse2neon.h" 13 | #else 14 | #include // SSE2:, SSE3:, SSE4: 15 | #endif 16 | 17 | #define RETf inline __m128 18 | #define RETi inline __m128i 19 | 20 | // set, load and store values 21 | RETf SET( const float &x ) { return _mm_set1_ps(x); } 22 | RETf SET( float x, float y, float z, float w ) { return _mm_set_ps(x,y,z,w); } 23 | RETi SET( const int &x ) { return _mm_set1_epi32(x); } 24 | RETf LD( const float &x ) { return _mm_load_ps(&x); } 25 | RETf LDu( const float &x ) { return _mm_loadu_ps(&x); } 26 | RETf STR( float &x, const __m128 y ) { _mm_store_ps(&x,y); return y; } 27 | RETf STR1( float &x, const __m128 y ) { _mm_store_ss(&x,y); return y; } 28 | RETf STRu( float &x, const __m128 y ) { _mm_storeu_ps(&x,y); return y; } 29 | RETf STR( float &x, const float y ) { return STR(x,SET(y)); } 30 | 31 | // arithmetic operators 32 | RETi ADD( const __m128i x, const __m128i y ) { return _mm_add_epi32(x,y); } 33 | RETf ADD( const __m128 x, const __m128 y ) { return _mm_add_ps(x,y); } 34 | RETf ADD( const __m128 x, const __m128 y, const __m128 z ) { 35 | return ADD(ADD(x,y),z); } 36 | RETf ADD( const __m128 a, const __m128 b, const __m128 c, const __m128 &d ) { 37 | return ADD(ADD(ADD(a,b),c),d); } 38 | RETf SUB( const __m128 x, const __m128 y ) { return _mm_sub_ps(x,y); } 39 | RETf MUL( const __m128 x, const __m128 y ) { return _mm_mul_ps(x,y); } 40 | RETf MUL( const __m128 x, const float y ) { return MUL(x,SET(y)); } 41 | RETf MUL( const float x, const __m128 y ) { return MUL(SET(x),y); } 42 | RETf INC( __m128 &x, const __m128 y ) { return x = ADD(x,y); } 43 | RETf INC( float &x, const __m128 y ) { __m128 
t=ADD(LD(x),y); return STR(x,t); } 44 | RETf DEC( __m128 &x, const __m128 y ) { return x = SUB(x,y); } 45 | RETf DEC( float &x, const __m128 y ) { __m128 t=SUB(LD(x),y); return STR(x,t); } 46 | RETf MINN( const __m128 x, const __m128 y ) { return _mm_min_ps(x,y); } 47 | RETf RCP( const __m128 x ) { return _mm_rcp_ps(x); } 48 | RETf RCPSQRT( const __m128 x ) { return _mm_rsqrt_ps(x); } 49 | 50 | // logical operators 51 | RETf AND( const __m128 x, const __m128 y ) { return _mm_and_ps(x,y); } 52 | RETi AND( const __m128i x, const __m128i y ) { return _mm_and_si128(x,y); } 53 | RETf ANDNOT( const __m128 x, const __m128 y ) { return _mm_andnot_ps(x,y); } 54 | RETf OR( const __m128 x, const __m128 y ) { return _mm_or_ps(x,y); } 55 | RETf XOR( const __m128 x, const __m128 y ) { return _mm_xor_ps(x,y); } 56 | 57 | // comparison operators 58 | RETf CMPGT( const __m128 x, const __m128 y ) { return _mm_cmpgt_ps(x,y); } 59 | RETf CMPLT( const __m128 x, const __m128 y ) { return _mm_cmplt_ps(x,y); } 60 | RETi CMPGT( const __m128i x, const __m128i y ) { return _mm_cmpgt_epi32(x,y); } 61 | RETi CMPLT( const __m128i x, const __m128i y ) { return _mm_cmplt_epi32(x,y); } 62 | 63 | // conversion operators 64 | RETf CVT( const __m128i x ) { return _mm_cvtepi32_ps(x); } 65 | RETi CVT( const __m128 x ) { return _mm_cvttps_epi32(x); } 66 | 67 | #undef RETf 68 | #undef RETi 69 | #endif 70 | -------------------------------------------------------------------------------- /ECO/sample_update.hpp: -------------------------------------------------------------------------------- 1 | #ifndef SAMPLE_UPDATE_HPP 2 | #define SAMPLE_UPDATE_HPP 3 | 4 | #include 5 | #include 6 | 7 | #include 8 | 9 | #include "parameters.hpp" 10 | #include "ffttools.hpp" 11 | #include "feature_operator.hpp" 12 | #include "debug.hpp" 13 | 14 | namespace eco 15 | { 16 | 17 | class SampleUpdate 18 | { 19 | public: 20 | SampleUpdate(){}; 21 | virtual ~SampleUpdate(){}; 22 | 23 | void init(const std::vector &filter, 24 | 
const std::vector &feature_dim, 25 | const size_t nSamples, 26 | const float learning_rate); 27 | 28 | void update_sample_space_model(const ECO_FEATS &new_train_sample); 29 | 30 | void update_distance_matrix(cv::Mat &gram_vector, float new_sample_norm, 31 | int id1, int id2, float w1, float w2); 32 | 33 | inline cv::Mat find_gram_vector(const ECO_FEATS &new_train_sample) 34 | { 35 | cv::Mat result(cv::Size(1, nSamples_), CV_32FC2); 36 | for (size_t i = 0; i < (size_t)result.rows; i++) // init to INF; 37 | result.at>(i, 0) = cv::Vec(INF, 0); 38 | 39 | std::vector distance_vector; 40 | for (size_t i = 0; i < num_training_samples_; i++) // calculate the distance; 41 | distance_vector.push_back(2 * 42 | FeatureComputeInnerProduct(samples_f_[i], new_train_sample)); 43 | 44 | for (size_t i = 0; i < distance_vector.size(); i++) 45 | result.at>(i, 0) = 46 | cv::Vec(distance_vector[i], 0); 47 | 48 | return result; 49 | }; 50 | // find the minimum element in prior_weights_; 51 | inline void findMin(float &min_w, size_t &index) const 52 | { 53 | std::vector::const_iterator pos = std::min_element(prior_weights_.begin(), prior_weights_.end()); 54 | min_w = *pos; 55 | index = pos - prior_weights_.begin(); 56 | }; 57 | 58 | inline ECO_FEATS merge_samples(const ECO_FEATS &sample1, 59 | const ECO_FEATS &sample2, 60 | const float w1, const float w2, 61 | const std::string sample_merge_type = "merge") 62 | { 63 | float alpha1 = w1 / (w1 + w2); 64 | float alpha2 = 1 - alpha1; 65 | ECO_FEATS merged_sample = sample1; 66 | 67 | if (sample_merge_type == std::string("replace")) 68 | { 69 | } 70 | else if (sample_merge_type == std::string("merge")) 71 | { 72 | for (size_t i = 0; i < sample1.size(); i++) 73 | for (size_t j = 0; j < sample1[i].size(); j++) 74 | merged_sample[i][j] = alpha1 * sample1[i][j] + alpha2 * sample2[i][j]; 75 | } 76 | return merged_sample; 77 | }; 78 | 79 | inline void replace_sample(const ECO_FEATS &new_sample, const size_t idx) 80 | { 81 | samples_f_[idx] = 
new_sample; 82 | }; 83 | 84 | inline void set_gram_matrix(const int r, const int c, const float val) 85 | { 86 | gram_matrix_.at(r, c) = val; 87 | }; 88 | 89 | int get_merged_sample_id() const { return merged_sample_id_; } 90 | 91 | int get_new_sample_id() const { return new_sample_id_; } 92 | 93 | std::vector get_prior_weights() const { return prior_weights_; } 94 | 95 | std::vector get_samples() const { return samples_f_; } 96 | 97 | private: 98 | cv::Mat distance_matrix_, gram_matrix_; // distance matrix and its kernel 99 | 100 | size_t nSamples_ = 50; 101 | 102 | float learning_rate_ = 0.009; 103 | 104 | const float minmum_sample_weight_ = 0.0036; 105 | 106 | std::vector sample_weight_; 107 | 108 | std::vector samples_f_; // all samples frontier 109 | 110 | size_t num_training_samples_ = 0; 111 | 112 | std::vector prior_weights_; 113 | 114 | ECO_FEATS new_sample_, merged_sample_; 115 | 116 | int new_sample_id_ = -1, merged_sample_id_ = -1; 117 | }; 118 | 119 | } // namespace eco 120 | 121 | #endif -------------------------------------------------------------------------------- /ECO/eco.hpp: -------------------------------------------------------------------------------- 1 | #ifndef ECO_HPP 2 | #define ECO_HPP 3 | 4 | #include 5 | #include 6 | #include 7 | #include 8 | #include 9 | #include 10 | 11 | #ifdef USE_CAFFE 12 | #include 13 | #include 14 | #endif 15 | /* 16 | #ifdef USE_CUDA 17 | #include 18 | #include 19 | #endif 20 | */ 21 | #ifdef USE_MULTI_THREAD 22 | #include 23 | #include 24 | #endif 25 | 26 | #include "parameters.hpp" 27 | #include "interpolator.hpp" 28 | #include "regularization_filter.hpp" 29 | #include "feature_extractor.hpp" 30 | #include "feature_operator.hpp" 31 | #include "sample_update.hpp" 32 | #include "optimize_scores.hpp" 33 | #include "training.hpp" 34 | #include "ffttools.hpp" 35 | #include "scale_filter.hpp" 36 | #include "debug.hpp" 37 | 38 | namespace eco 39 | { 40 | class ECO 41 | { 42 | public: 43 | ECO() {}; 44 | virtual 
~ECO() {} 45 | 46 | void init(cv::Mat &im, const cv::Rect2f &rect, const eco::EcoParameters ¶mters); 47 | 48 | bool update(const cv::Mat &frame, cv::Rect2f &roi); 49 | 50 | void init_parameters(const eco::EcoParameters ¶meters); 51 | 52 | void init_features(); 53 | #ifdef USE_CAFFE 54 | void read_deep_mean(const string &mean_file); 55 | #endif 56 | void yf_gaussian(); // the desired outputs of features, real part of (9) in paper C-COT 57 | 58 | void cos_window(); // construct cosine window of features; 59 | 60 | ECO_FEATS interpolate_dft(const ECO_FEATS &xlf, 61 | vector &interp1_fs, 62 | vector &interp2_fs); 63 | 64 | ECO_FEATS compact_fourier_coeff(const ECO_FEATS &xf); 65 | 66 | ECO_FEATS full_fourier_coeff(const ECO_FEATS &xf); 67 | 68 | vector project_mat_energy(vector proj, 69 | vector yf); 70 | 71 | ECO_FEATS shift_sample(ECO_FEATS &xf, 72 | cv::Point2f shift, 73 | std::vector kx, 74 | std::vector ky); 75 | #ifdef USE_MULTI_THREAD 76 | static void *thread_train(void *params); 77 | #endif 78 | 79 | private: 80 | bool is_color_image_; 81 | EcoParameters params_; 82 | cv::Point2f pos_; // final result 83 | size_t frames_since_last_train_; // used for update; 84 | 85 | // The max size of feature and its index, output_sz is T in (9) of C-COT paper 86 | size_t output_size_, output_index_; 87 | 88 | cv::Size2f base_target_size_; // target size without scale 89 | cv::Size2i img_sample_size_; // base_target_sz * sarch_area_scale 90 | cv::Size2i img_support_size_; // the corresponding size in the image 91 | 92 | vector feature_size_, filter_size_; 93 | vector feature_dim_, compressed_dim_; 94 | 95 | ScaleFilter scale_filter_; 96 | int nScales_; // number of scales; 97 | float scale_step_; 98 | vector scale_factors_; 99 | float currentScaleFactor_; // current img scale 100 | 101 | // Compute the Fourier series indices 102 | // kx_, ky_ is the k in (9) of C-COT paper, yf_ is the left part of (9); 103 | vector ky_, kx_, yf_; 104 | vector interp1_fs_, interp2_fs_; 105 | 
vector cos_window_; 106 | vector projection_matrix_; 107 | 108 | vector reg_filter_; 109 | vector reg_energy_; 110 | 111 | FeatureExtractor feature_extractor_; 112 | 113 | SampleUpdate sample_update_; 114 | ECO_FEATS sample_energy_; 115 | 116 | EcoTrain eco_trainer_; 117 | 118 | ECO_FEATS hf_full_; 119 | 120 | #ifdef USE_MULTI_THREAD 121 | bool thread_flag_train_; 122 | public: 123 | pthread_t thread_train_; 124 | #endif 125 | 126 | }; 127 | 128 | } // namespace eco 129 | 130 | #endif 131 | -------------------------------------------------------------------------------- /ECO/training.hpp: -------------------------------------------------------------------------------- 1 | #ifndef TRAINING_HPP 2 | #define TRAINING_HPP 3 | 4 | #include 5 | #include 6 | #include 7 | #include 8 | #include 9 | 10 | #include 11 | 12 | #include "ffttools.hpp" 13 | #include "recttools.hpp" 14 | #include "parameters.hpp" 15 | #include "feature_operator.hpp" 16 | #include "debug.hpp" 17 | 18 | namespace eco 19 | { 20 | class EcoTrain 21 | { 22 | public: 23 | EcoTrain(); 24 | virtual ~EcoTrain(); 25 | 26 | struct STATE 27 | { 28 | ECO_FEATS p, r_prev; 29 | float rho; 30 | }; 31 | // the right and left side of the equation (18) of suppl. 
paper ECO 32 | struct ECO_EQ 33 | { 34 | ECO_EQ() {} 35 | ECO_EQ(ECO_FEATS up_part, std::vector low_part) : up_part_(up_part), low_part_(low_part) {} 36 | 37 | ECO_FEATS up_part_; // this is f + delta(f) 38 | std::vector low_part_; // this is delta(P) 39 | 40 | ECO_EQ operator+(const ECO_EQ data); 41 | ECO_EQ operator-(const ECO_EQ data); 42 | ECO_EQ operator*(const float scale); 43 | }; 44 | 45 | void train_init(const ECO_FEATS &hf, 46 | const ECO_FEATS &hf_inc, 47 | const vector &proj_matrix, 48 | const ECO_FEATS &xlf, 49 | const vector &yf, 50 | const vector &reg_filter, 51 | const ECO_FEATS &sample_energy, 52 | const vector &reg_energy, 53 | const vector &proj_energy, 54 | const EcoParameters &params); 55 | 56 | // Filter training and Projection updating(for the 1st Frame)============== 57 | void train_joint(); 58 | 59 | ECO_EQ pcg_eco_joint(const ECO_FEATS &init_samplef_proj, 60 | const vector &reg_filter, 61 | const ECO_FEATS &init_samplef, 62 | const vector &init_samplesf_H, 63 | const ECO_FEATS &init_hf, 64 | const ECO_EQ &rhs_samplef, 65 | const ECO_EQ &diag_M, // preconditioner 66 | const ECO_EQ &hf); 67 | 68 | ECO_EQ lhs_operation_joint(const ECO_EQ &hf, 69 | const ECO_FEATS &samplesf, 70 | const vector &reg_filter, 71 | const ECO_FEATS &init_samplef, 72 | const vector &XH, 73 | const ECO_FEATS &init_hf); 74 | // Only filter training(for tracker update)=============================== 75 | void train_filter(const vector &samplesf, 76 | const vector &sample_weights, 77 | const ECO_FEATS &sample_energy); 78 | 79 | ECO_FEATS pcg_eco_filter(const vector &samplesf, 80 | const vector &reg_filter, 81 | const vector &sample_weights, 82 | const ECO_FEATS &rhs_samplef, 83 | const ECO_FEATS &diag_M, 84 | const ECO_FEATS &hf); 85 | 86 | ECO_FEATS lhs_operation_filter(const ECO_FEATS &hf, 87 | const vector &samplesf, 88 | const vector &reg_filter, 89 | const vector &sample_weights); 90 | // joint structure basic operation================================ 91 | ECO_EQ jointDotDivision(const 
ECO_EQ &a, const ECO_EQ &b); 92 | float inner_product_joint(const ECO_EQ &a, const ECO_EQ &b); 93 | float inner_product_filter(const ECO_FEATS &a, const ECO_FEATS &b); 94 | vector get_proj() const { return projection_matrix_; } 95 | ECO_FEATS get_hf() const { return hf_; } 96 | 97 | private: 98 | ECO_FEATS hf_, hf_inc_; // filter parameters and their increment 99 | 100 | ECO_FEATS xlf_, sample_energy_; 101 | 102 | vector yf_; // the label of sample 103 | 104 | vector reg_filter_; 105 | vector reg_energy_; 106 | 107 | vector projection_matrix_, proj_energy_; 108 | 109 | EcoParameters params_; 110 | STATE state_; 111 | }; // end of class 112 | } // namespace eco 113 | #endif -------------------------------------------------------------------------------- /ECO/interpolator.cc: -------------------------------------------------------------------------------- 1 | #include "interpolator.hpp" 2 | 3 | namespace eco 4 | { 5 | Interpolator::Interpolator() {} 6 | 7 | Interpolator::~Interpolator() {} 8 | 9 | void Interpolator::get_interp_fourier(cv::Size filter_sz, 10 | cv::Mat &interp1_fs, 11 | cv::Mat &interp2_fs, 12 | float a) 13 | { 14 | cv::Mat temp1(filter_sz.height, 1, CV_32FC1); 15 | cv::Mat temp2(1, filter_sz.width, CV_32FC1); 16 | for (int j = 0; j < temp1.rows; j++) 17 | { 18 | temp1.at(j, 0) = j - temp1.rows / 2; 19 | } 20 | for (int j = 0; j < temp2.cols; j++) 21 | { 22 | temp2.at(0, j) = j - temp2.cols / 2; 23 | } 24 | 25 | interp1_fs = cubic_spline_fourier(temp1 / filter_sz.height, a) / filter_sz.height; 26 | interp2_fs = cubic_spline_fourier(temp2 / filter_sz.width, a) / filter_sz.width; 27 | 28 | // Multiply Fourier coeff with e ^ (-i*pi*k / N):[cos(pi*k/N), -sin(pi*k/N)] 29 | cv::Mat result1(temp1.size(), CV_32FC1), result2(temp1.size(), CV_32FC1); 30 | temp1 = temp1 / filter_sz.height; 31 | temp2 = temp2 / filter_sz.width; 32 | std::transform(temp1.begin(), temp1.end(), result1.begin(), Interpolator::mat_cos1); 33 | std::transform(temp1.begin(), temp1.end(), 
result2.begin(), Interpolator::mat_sin1); 34 | 35 | //cv::Mat planes1[] = {interp1_fs.mul(result1), -interp1_fs.mul(result2)}; 36 | //cv::merge(planes1, 2, interp1_fs); 37 | //interp2_fs = interp1_fs.t(); 38 | cv::Mat temp = cv::Mat(interp1_fs.size(), CV_32FC2); 39 | cv::Mat tempT = cv::Mat(interp1_fs.cols, interp1_fs.rows, CV_32FC2); 40 | for(int r = 0; r < temp1.rows; r++) 41 | { 42 | for(int c = 0; c < temp1.cols; c++) 43 | { 44 | 45 | temp.at(r, c)[0] = interp1_fs.at(r, c) * result1.at(r, c); 46 | temp.at(r, c)[1] = -interp1_fs.at(r, c) * result2.at(r, c); 47 | tempT.at(c, r)[0] = temp.at(r, c)[0]; 48 | tempT.at(c, r)[1] = temp.at(r, c)[1]; 49 | } 50 | } 51 | interp1_fs = temp; 52 | interp2_fs = tempT; 53 | } 54 | 55 | cv::Mat Interpolator::cubic_spline_fourier(cv::Mat f, float a) 56 | { 57 | if (f.empty()) 58 | { 59 | assert(0 && "error: input mat is empty!"); 60 | } 61 | /* 62 | cv::Mat bf(f.size(), CV_32FC1), 63 | temp_cos2(f.size(), CV_32FC1), 64 | temp_cos4(f.size(), CV_32FC1), 65 | temp_sin2(f.size(), CV_32FC1), 66 | temp_sin4(f.size(), CV_32FC1); 67 | std::transform(f.begin(), f.end(), temp_cos2.begin(), Interpolator::mat_cos2); 68 | std::transform(f.begin(), f.end(), temp_cos4.begin(), Interpolator::mat_cos4); 69 | std::transform(f.begin(), f.end(), temp_sin2.begin(), Interpolator::mat_sin2); 70 | std::transform(f.begin(), f.end(), temp_sin4.begin(), Interpolator::mat_sin4); 71 | 72 | bf = 6 * (cv::Mat::ones(f.size(), CV_32FC1) - temp_cos2) + 3 * a * (cv::Mat::ones(f.size(), CV_32FC1) - temp_cos4) - (6 + a * 8) * CV_PI * f.mul(temp_sin2) - 2 * a * CV_PI * f.mul(temp_sin4); 73 | 74 | cv::Mat L(f.size(), CV_32FC1); 75 | cv::pow(f, 4, L); 76 | cv::divide(bf, 4 * L * cv::pow(CV_PI, 4), bf); 77 | bf.at(bf.rows / 2, bf.cols / 2) = 1; 78 | */ 79 | cv::Mat bf(f.size(), CV_32FC1); 80 | for(int r = 0; r < bf.rows; r++) 81 | { 82 | for(int c = 0; c < bf.cols; c++) 83 | { 84 | bf.at(r, c) = 6.0f * (1 - cos(2.0f * f.at(r, c) * M_PI)) 85 | + 3.0f * a * (1.0f - cos(4 
* f.at(r, c) * M_PI)) 86 | - (6.0f + a * 8.0f) * M_PI * f.at(r, c) * sin(2.0f * f.at(r, c) * M_PI) 87 | - 2.0f * a * M_PI * f.at(r, c) * sin(4.0f * f.at(r, c) * M_PI); 88 | float L = 4.0f * pow(f.at(r, c) * M_PI, 4); 89 | bf.at(r, c) /= L; 90 | } 91 | } 92 | bf.at(bf.rows / 2, bf.cols / 2) = 1; 93 | //printMat(bf); 94 | //showmat1channels(bf, 2); 95 | 96 | return bf; 97 | } 98 | } // namespace eco -------------------------------------------------------------------------------- /ECO/regularization_filter.cc: -------------------------------------------------------------------------------- 1 | #include "regularization_filter.hpp" 2 | 3 | namespace eco 4 | { 5 | cv::Mat get_regularization_filter(cv::Size sz, 6 | cv::Size2f target_sz, 7 | const EcoParameters &params) 8 | { 9 | cv::Mat result; 10 | 11 | if (params.use_reg_window) 12 | { 13 | cv::Size2d reg_scale = cv::Size2d(target_sz.width * 0.5, 14 | target_sz.height * 0.5); 15 | 16 | // construct the regularization window 17 | cv::Mat reg_window(sz, CV_64FC1); 18 | for (double x = -0.5 * (sz.height - 1), counter1 = 0; 19 | counter1 < sz.height; x += 1, ++counter1) 20 | for (double y = -0.5 * (sz.width - 1), counter2 = 0; 21 | counter2 < sz.width; y += 1, ++counter2) 22 | { // keep std::abs() below: an unqualified abs() can pick the int overload and truncate 
23 | reg_window.at(counter1, counter2) = 24 | (params.reg_window_edge - params.reg_window_min) * 25 | (std::pow(std::abs(x / reg_scale.height), params.reg_window_power) + 26 | std::pow(std::abs(y / reg_scale.width), params.reg_window_power)) + 27 | params.reg_window_min; 28 | } 29 | /* debug 30 | debug("%f %f", reg_scale.height, reg_scale.width); 31 | debug("%d %d", sz.height, sz.width); 32 | debug("Channels: %d",reg_window.channels()); 33 | printMat(reg_window); 34 | //showmat1channels(reg_window, 3); 35 | debug("%lf, %lf", reg_window.at(46, 23), reg_window.at(143,89)); 36 | */ 37 | 38 | // compute the DFT and enforce sparsity 39 | cv::Mat reg_window_dft = dft(reg_window) / sz.area(); 40 | cv::Mat reg_win_abs(sz, CV_64FC1); 41 | reg_win_abs = magnitude(reg_window_dft); 42 | double minv = 0.0, maxv = 0.0; 43 | cv::minMaxLoc(reg_win_abs, &minv, &maxv); 44 | // set to zero while the element smaller than threshold 45 | for (size_t i = 0; i < (size_t)reg_window_dft.rows; i++) 46 | for (size_t j = 0; j < (size_t)reg_window_dft.cols; j++) 47 | { 48 | if (reg_win_abs.at(i, j) < (params.reg_sparsity_threshold * maxv)) 49 | reg_window_dft.at>(i, j) = cv::Vec(0.0, 0.0); 50 | } 51 | /* debug 52 | showmat2channels(reg_window_dft, 3); 53 | debug("%lf, %lf", reg_window_dft.at>(0, 0)[0], reg_window_dft.at>(0,1)[0]); 54 | */ 55 | 56 | // do the inverse transform, correct window minimum 57 | cv::Mat reg_window_sparse = real(dft(reg_window_dft, true)); 58 | //showmat1channels(reg_window_sparse, 3); 59 | cv::minMaxLoc(reg_window_sparse, &minv, &maxv); 60 | //debug("%lf, %lf, %lf, %d", minv, maxv, params.reg_window_min, sz.area()); 61 | reg_window_dft.at(0, 0) = reg_window_dft.at(0, 0) - sz.area() * minv + params.reg_window_min; 62 | reg_window_dft = fftshift(reg_window_dft); 63 | 64 | // find the regularization filter by removing the zeros 65 | cv::Mat tmp; 66 | for (size_t i = 0; i < (size_t)reg_window_dft.rows; i++) 67 | { 68 | for (size_t j = 0; j < (size_t)reg_window_dft.cols; 
j++) 69 | { 70 | if (((reg_window_dft.at>(i, j) != 71 | cv::Vec(0, 0)) && 72 | (reg_window_dft.at>(i, j) != 73 | cv::Vec(2, 0)))) 74 | { 75 | tmp.push_back(reg_window_dft.row(i)); 76 | break; 77 | } 78 | } //end for 79 | } //end for 80 | 81 | tmp = tmp.t(); 82 | for (size_t i = 0; i < (size_t)tmp.rows; i++) 83 | { 84 | for (size_t j = 0; j < (size_t)tmp.cols; j++) 85 | { 86 | if (((tmp.at>(i, j) != 87 | cv::Vec(0, 0)) && 88 | (tmp.at>(i, j) != 89 | cv::Vec(1, 0)))) 90 | { 91 | result.push_back(real(tmp.row(i))); 92 | break; 93 | } 94 | } //end for 95 | } //end for 96 | result = result.t(); 97 | } // if params.use_reg_window 98 | else 99 | { 100 | result.push_back(params.reg_window_min); 101 | } 102 | 103 | return result; 104 | } 105 | } // namespace eco -------------------------------------------------------------------------------- /ECO/ffttools.hpp: -------------------------------------------------------------------------------- 1 | /* 2 | Author: Christian Bailer 3 | Contact address: Christian.Bailer@dfki.de 4 | Department Augmented Vision DFKI 5 | 6 | License Agreement 7 | For Open Source Computer Vision Library 8 | (3-clause BSD License) 9 | 10 | Redistribution and use in source and binary forms, with or without modification, 11 | are permitted provided that the following conditions are met: 12 | 13 | * Redistributions of source code must retain the above copyright notice, 14 | this list of conditions and the following disclaimer. 15 | 16 | * Redistributions in binary form must reproduce the above copyright notice, 17 | this list of conditions and the following disclaimer in the documentation 18 | and/or other materials provided with the distribution. 19 | 20 | * Neither the names of the copyright holders nor the names of the contributors 21 | may be used to endorse or promote products derived from this software 22 | without specific prior written permission. 
23 | 24 | This software is provided by the copyright holders and contributors "as is" and 25 | any express or implied warranties, including, but not limited to, the implied 26 | warranties of merchantability and fitness for a particular purpose are disclaimed. 27 | In no event shall copyright holders or contributors be liable for any direct, 28 | indirect, incidental, special, exemplary, or consequential damages 29 | (including, but not limited to, procurement of substitute goods or services; 30 | loss of use, data, or profits; or business interruption) however caused 31 | and on any theory of liability, whether in contract, strict liability, 32 | or tort (including negligence or otherwise) arising in any way out of 33 | the use of this software, even if advised of the possibility of such damage. 34 | */ 35 | 36 | #ifndef FFTTOOLS_HPP 37 | #define FFTTOOLS_HPP 38 | 39 | #include 40 | #include "debug.hpp" 41 | /* 42 | #ifdef USE_CUDA 43 | #include 44 | #include 45 | #endif 46 | */ 47 | #ifdef USE_SIMD 48 | #include "sse.hpp" 49 | #include "wrappers.hpp" 50 | #endif 51 | 52 | #ifdef USE_FFTW 53 | #include 54 | #endif 55 | 56 | namespace eco 57 | { 58 | cv::Mat dft(const cv::Mat img_org, const bool backwards = false); 59 | cv::Mat fftshift(const cv::Mat img_org, 60 | const bool rowshift = true, 61 | const bool colshift = true, 62 | const bool reverse = 0); 63 | 64 | cv::Mat real(const cv::Mat img); 65 | cv::Mat imag(const cv::Mat img); 66 | cv::Mat magnitude(const cv::Mat img); 67 | cv::Mat complexDotMultiplication(const cv::Mat &a, const cv::Mat &b); 68 | cv::Mat complexDotMultiplicationCPU(const cv::Mat &a, const cv::Mat &b); 69 | #ifdef USE_SIMD 70 | cv::Mat complexDotMultiplicationSIMD(const cv::Mat &a, const cv::Mat &b); 71 | #endif 72 | /* 73 | #ifdef USE_CUDA 74 | cv::Mat complexDotMultiplicationGPU(const cv::Mat &a, const cv::Mat &b); 75 | #endif 76 | */ 77 | cv::Mat complexDotDivision(const cv::Mat a, const cv::Mat b); 78 | cv::Mat 
complexMatrixMultiplication(const cv::Mat &a, const cv::Mat &b); 79 | cv::Mat complexConvolution(const cv::Mat a_input, 80 | const cv::Mat b_input, 81 | const bool valid = 0); 82 | 83 | cv::Mat real2complex(const cv::Mat &x); 84 | cv::Mat mat_conj(const cv::Mat &org); 85 | float mat_sum_f(const cv::Mat &org); 86 | double mat_sum_d(const cv::Mat &org); 87 | 88 | inline bool SizeCompare(cv::Size &a, cv::Size &b) 89 | { 90 | return a.height < b.height; 91 | } 92 | 93 | inline void rot90(cv::Mat &matImage, int rotflag) 94 | { 95 | if (rotflag == 1) 96 | { 97 | cv::transpose(matImage, matImage); 98 | cv::flip(matImage, matImage, 1); // flip around y-axis 99 | } 100 | else if (rotflag == 2) 101 | { 102 | cv::transpose(matImage, matImage); 103 | cv::flip(matImage, matImage, 0); // flip around x-axis 104 | } 105 | else if (rotflag == 3) 106 | { 107 | cv::flip(matImage, matImage, -1); // flip around both axis 108 | } 109 | else if (rotflag != 0) // 0: keep the same 110 | { 111 | assert(0 && "error: unknown rotation flag!"); 112 | } 113 | } 114 | 115 | } // namespace eco 116 | 117 | #endif -------------------------------------------------------------------------------- /ECO/recttools.hpp: -------------------------------------------------------------------------------- 1 | /* 2 | Author: Christian Bailer 3 | Contact address: Christian.Bailer@dfki.de 4 | Department Augmented Vision DFKI 5 | 6 | License Agreement 7 | For Open Source Computer Vision Library 8 | (3-clause BSD License) 9 | 10 | Redistribution and use in source and binary forms, with or without modification, 11 | are permitted provided that the following conditions are met: 12 | 13 | * Redistributions of source code must retain the above copyright notice, 14 | this list of conditions and the following disclaimer. 
15 | 16 | * Redistributions in binary form must reproduce the above copyright notice, 17 | this list of conditions and the following disclaimer in the documentation 18 | and/or other materials provided with the distribution. 19 | 20 | * Neither the names of the copyright holders nor the names of the contributors 21 | may be used to endorse or promote products derived from this software 22 | without specific prior written permission. 23 | 24 | This software is provided by the copyright holders and contributors "as is" and 25 | any express or implied warranties, including, but not limited to, the implied 26 | warranties of merchantability and fitness for a particular purpose are disclaimed. 27 | In no event shall copyright holders or contributors be liable for any direct, 28 | indirect, incidental, special, exemplary, or consequential damages 29 | (including, but not limited to, procurement of substitute goods or services; 30 | loss of use, data, or profits; or business interruption) however caused 31 | and on any theory of liability, whether in contract, strict liability, 32 | or tort (including negligence or otherwise) arising in any way out of 33 | the use of this software, even if advised of the possibility of such damage. 
34 | */ 35 | 36 | #ifndef RECTTOOLS_HPP 37 | #define RECTTOOLS_HPP 38 | 39 | #include 40 | #include 41 | #include "debug.hpp" 42 | 43 | namespace eco 44 | { 45 | template 46 | inline cv::Vec center(const cv::Rect_ &rect) 47 | { 48 | return cv::Vec(rect.x + rect.width / (t)2.0f, rect.y + rect.height / (t)2.0f); 49 | } 50 | 51 | template 52 | inline t x2(const cv::Rect_ &rect) 53 | { 54 | return rect.x + rect.width; 55 | } 56 | 57 | template 58 | inline t y2(const cv::Rect_ &rect) 59 | { 60 | return rect.y + rect.height; 61 | } 62 | 63 | template 64 | inline void resize(cv::Rect_ &rect, float scalex, float scaley = 0) 65 | { 66 | if (!scaley) 67 | { 68 | scaley = scalex; 69 | } 70 | rect.x -= rect.width * (scalex - 1.0f) / 2.0f; 71 | rect.width *= scalex; 72 | 73 | rect.y -= rect.height * (scaley - 1.0f) / 2.0f; 74 | rect.height *= scaley; 75 | } 76 | 77 | template 78 | inline void limit(cv::Rect_ &rect, cv::Rect_ limit) 79 | { 80 | if (rect.x + rect.width > limit.x + limit.width) 81 | { 82 | rect.width = limit.x + limit.width - rect.x; 83 | } 84 | if (rect.y + rect.height > limit.y + limit.height) 85 | { 86 | rect.height = limit.y + limit.height - rect.y; 87 | } 88 | if (rect.x < limit.x) 89 | { 90 | rect.width -= (limit.x - rect.x); 91 | rect.x = limit.x; 92 | } 93 | if (rect.y < limit.y) 94 | { 95 | rect.height -= (limit.y - rect.y); 96 | rect.y = limit.y; 97 | } 98 | if (rect.width < 0) 99 | { 100 | rect.width = 0; 101 | } 102 | if (rect.height < 0) 103 | { 104 | rect.height = 0; 105 | } 106 | } 107 | 108 | template 109 | inline void limit(cv::Rect_ &rect, t width, t height, t x = 0, t y = 0) 110 | { 111 | limit(rect, cv::Rect_(x, y, width, height)); 112 | } 113 | 114 | template 115 | inline cv::Rect getBorder(const cv::Rect_ &original, cv::Rect_ &limited) 116 | { 117 | cv::Rect_ res; 118 | res.x = limited.x - original.x; 119 | res.y = limited.y - original.y; 120 | res.width = x2(original) - x2(limited); 121 | res.height = y2(original) - y2(limited); 122 | 
assert(res.x >= 0 && res.y >= 0 && res.width >= 0 && res.height >= 0); 123 | return res; 124 | } 125 | // cut "window" out from "input". 126 | inline cv::Mat subwindow(const cv::Mat &input, const cv::Rect &window, int borderType = cv::BORDER_CONSTANT) 127 | { 128 | cv::Mat res; 129 | cv::Rect cutWindow = window; 130 | limit(cutWindow, input.cols, input.rows); 131 | //debug("cutWindow: %d x %d", cutWindow.height, cutWindow.width); 132 | if (cutWindow.height <= 0 || cutWindow.width <= 0) 133 | { 134 | //assert(0 && "error: cutWindow size error!\n"); 135 | return res;//cv::Mat(window.height,window.width,input.type(),0) ; 136 | } 137 | cv::Rect border = getBorder(window, cutWindow); 138 | res = input(cutWindow); 139 | if (border != cv::Rect(0, 0, 0, 0)) 140 | { 141 | cv::copyMakeBorder(res, res, border.y, border.height, border.x, border.width, borderType); 142 | } 143 | return res; 144 | } 145 | 146 | inline cv::Mat getGrayImage(cv::Mat img) 147 | { 148 | cv::cvtColor(img, img, CV_BGR2GRAY); 149 | img.convertTo(img, CV_32F, 1 / 255.f); 150 | return img; 151 | } 152 | 153 | } // namespace eco 154 | 155 | #endif -------------------------------------------------------------------------------- /DaSiamRPN/dasiamrpntracker.h: -------------------------------------------------------------------------------- 1 | /* DaSiamRPNCaffe2 2 | # Licensed under The MIT License 3 | # Written by wzq*/ 4 | #ifndef DASIAMRPNTRACKER_H 5 | #define DASIAMRPNTRACKER_H 6 | #include 7 | #include 8 | #include 9 | #include 10 | #include 11 | #include 12 | #include 13 | #include 14 | #include 15 | #include 16 | 17 | #include 18 | #include 19 | #define DEBUG_ 0 20 | static std::string global_init_net_file = "/home/nvidia/Develop/Project/ROS/Tracking/src/tracking/DaSiamRPN/Model/global_init_net.pb"; 21 | static std::string temple_net_file = "/home/nvidia/Develop/Project/ROS/Tracking/src/tracking/DaSiamRPN/Model/temple_pred_net.pb"; 22 | static std::string track_net_file = 
"/home/nvidia/Develop/Project/ROS/Tracking/src/tracking/DaSiamRPN/Model/track_pred_net.pb"; 23 | 24 | static std::string adjust_init_net_file = "/home/nvidia/Develop/Project/ROS/Tracking/src/tracking/DaSiamRPN/Model/adjust_init_net.pb"; 25 | static std::string adjust_pred_net_file = "/home/nvidia/Develop/Project/ROS/Tracking/src/tracking/DaSiamRPN/Model/adjust_pred_net.pb"; 26 | 27 | static std::string Correlation_init_net_file = "/home/nvidia/Develop/Project/ROS/Tracking/src/tracking/DaSiamRPN/Model/Correlation_init_net.pb"; 28 | static std::string Correlation_pred_net_file = "/home/nvidia/Develop/Project/ROS/Tracking/src/tracking/DaSiamRPN/Model/Correlation_pred_net.pb"; 29 | 30 | struct TrackerConfig{ 31 | // These are the default hyper-params for DaSiamRPN 0.3827 32 | std::string windowing = "cosine";// # to penalize large displacements [cosine/uniform] 33 | Eigen::Matrix window; 34 | // Params from the network architecture, have to be consistent with the training 35 | int exemplar_size = 127; // input z size 36 | int instance_size = 271; // input x size (search region) 37 | int total_stride = 8; 38 | int score_size = (instance_size-exemplar_size)/total_stride+1; 39 | float context_amount = 0.5; // context amount for the exemplar 40 | Eigen::Array ratios; 41 | Eigen::Array scales; 42 | int anchor_num; 43 | Eigen::Matrix anchor; 44 | float penalty_k = 0.055; 45 | float window_influence = 0.42; 46 | float lr = 0.295; 47 | TrackerConfig(){ 48 | ratios <<0.33,0.5,1,2,3; 49 | scales << 8; 50 | anchor_num = ratios.size()*scales.size(); 51 | } 52 | }; 53 | struct BoxInfo{ 54 | float xc; 55 | float yc; 56 | float w; 57 | float h; 58 | float best_score; 59 | }; 60 | 61 | struct TrackInfo{ 62 | int im_h; 63 | int im_w; 64 | BoxInfo binfo; 65 | std::string window; 66 | TrackerConfig cfg; 67 | cv::Scalar avg_chans; 68 | }; 69 | 70 | 71 | using namespace caffe2; 72 | class DaSiamRPNTracker 73 | { 74 | public: 75 | DaSiamRPNTracker(); 76 | void SiamRPN_init(const cv::Mat& 
mat,BoxInfo&info,TrackInfo& output,const std::string&global_init_net_file, 77 | const std::string temple_net_file,const std::string& track_net_file,caffe2::DeviceType d,int gpuid); 78 | void tracker_eval(cv::Mat x_crop, 79 | BoxInfo &binfo, 80 | float& scale_z, 81 | TrackerConfig &p); 82 | void SiamRPN_track(cv::Mat mat,TrackInfo&info); 83 | 84 | private: 85 | std::unique_ptr global_init_net; 86 | std::unique_ptr temple_net; 87 | std::unique_ptr track_net; 88 | std::unique_ptr adjust_net; 89 | std::unique_ptr adjsut_init_net; 90 | std::shared_ptr trackerEngine; 91 | caffe2::DeviceType mode; 92 | int gpuid; 93 | caffe2::DeviceOption devOption; 94 | TrackInfo trackInfo; 95 | //for gpu inference 96 | std::vectorcuda_r1_kernels; 97 | std::vectorcuda_cls_kernels; 98 | //for cpu inference 99 | std::vectorcpu_r1_kernels; 100 | std::vectorcpu_cls_kernels; 101 | protected: 102 | //these functions are only called internal, set them protected. 103 | void GetTensorToHost(const Tensor* tensor,std::vector& data ) { 104 | data.resize(tensor->size()); 105 | CUDAContext context_; 106 | context_.template Copy( 107 | data.size(),tensor->template data(),data.data()); 108 | } 109 | 110 | void GetTensorToHost( Tensor* tensor, Tensor* ctensor ) { 111 | ctensor->Resize(tensor->dims()); 112 | CUDAContext context_; 113 | context_.template Copy( 114 | ctensor->size(),tensor->template data(),ctensor->template mutable_data()); 115 | } 116 | 117 | void FeedInputToNet(cv::Mat& input,const std::string& blob_name); 118 | void regress_adjust(); 119 | }; 120 | 121 | #endif // DASIAMRPNTRACKER_H 122 | -------------------------------------------------------------------------------- /ECO/optimize_scores.cc: -------------------------------------------------------------------------------- 1 | #include"optimize_scores.hpp" 2 | 3 | namespace eco{ 4 | void OptimizeScores::compute_scores() 5 | { 6 | std::vector sampled_scores; 7 | // Do inverse fft to the scores in the Fourier domain back to spacial domain 8 
| for (size_t i = 0; i < scores_fs_.size(); ++i) // for each scale 9 | { 10 | int area = scores_fs_[i].size().area(); 11 | cv::Mat tmp = dft(fftshift(scores_fs_[i], 1, 1, 1), 1);// inverse dft 12 | sampled_scores.push_back(real(tmp * area)); // spacial domain only contains real part 13 | } 14 | 15 | // to store the position of maximum value of response 16 | std::vector row, col; 17 | std::vector init_max_score; // inialized max score 18 | for (size_t i = 0; i < scores_fs_.size(); ++i) // for each scale 19 | { 20 | cv::Point pos; 21 | double maxValue = 0, minValue = 0; 22 | cv::minMaxLoc(sampled_scores[i], &minValue, &maxValue, NULL, &pos); 23 | row.push_back(pos.y); 24 | col.push_back(pos.x); 25 | init_max_score.push_back(sampled_scores[i].at(pos.y, pos.x)); 26 | //debug("init_max_score %lu: value: %lf %lf y:%d x:%d", i, minValue, maxValue, pos.y, pos.x); 27 | } 28 | 29 | // Shift and rescale the coordinate system to [-pi, pi] 30 | int h = scores_fs_[0].rows, w = scores_fs_[0].cols; 31 | std::vector max_pos_y, max_pos_x, init_pos_y, init_pos_x; 32 | for (size_t i = 0; i < row.size(); ++i) 33 | { 34 | max_pos_y.push_back( (row[i] + (h - 1) / 2) % h - (h - 1) / 2); 35 | max_pos_y[i] *= 2 * CV_PI / h; 36 | max_pos_x.push_back( (col[i] + (w - 1) / 2) % w - (w - 1) / 2); 37 | max_pos_x[i] *= 2 * CV_PI / w; 38 | } 39 | init_pos_y = max_pos_y; init_pos_x = max_pos_x; 40 | // Construct grid 41 | std::vector ky, kx, ky2, kx2; 42 | for (int i = 0; i < h; ++i) 43 | { 44 | ky.push_back(i - (h - 1) / 2); 45 | ky2.push_back(ky[i] * ky[i]); 46 | } 47 | for (int i = 0; i < w; ++i) 48 | { 49 | kx.push_back(i - (w - 1) / 2); 50 | kx2.push_back(kx[i] * kx[i]); 51 | } 52 | // Pre-compute complex exponential 53 | std::vector exp_iky, exp_ikx; 54 | for (unsigned int i = 0; i < scores_fs_.size(); ++i) 55 | { 56 | cv::Mat tempy(1, h, CV_32FC2); 57 | cv::Mat tempx(w, 1, CV_32FC2); 58 | for (int y = 0; y < h; ++y) 59 | tempy.at>(0, y) = cv::Vec(cos(ky[y] * max_pos_y[i]), sin(ky[y] * 
max_pos_y[i])); 60 | for (int x = 0; x < w; ++x) 61 | tempx.at>(x, 0) = cv::Vec(cos(kx[x] * max_pos_x[i]), sin(kx[x] * max_pos_x[i])); 62 | exp_iky.push_back(tempy); 63 | exp_ikx.push_back(tempx); 64 | } 65 | 66 | cv::Mat kyMat(1, h, CV_32FC1, &ky[0]); 67 | cv::Mat ky2Mat(1, h, CV_32FC1, &ky2[0]); 68 | cv::Mat kxMat(w, 1, CV_32FC1, &kx[0]); 69 | cv::Mat kx2Mat(w, 1, CV_32FC1, &kx2[0]); 70 | 71 | for (int ite = 0; ite < iterations_; ++ite) 72 | { 73 | // Compute gradient 74 | std::vector ky_exp_ky, kx_exp_kx, y_resp, resp_x, grad_y, grad_x; 75 | std::vector ival, H_yy, H_xx, H_xy, det_H; 76 | for (unsigned int i = 0; i < scores_fs_.size(); i++) 77 | { 78 | ky_exp_ky.push_back(complexDotMultiplication(kyMat, exp_iky[i])); 79 | kx_exp_kx.push_back(complexDotMultiplication(kxMat, exp_ikx[i])); 80 | 81 | y_resp.push_back(exp_iky[i] * scores_fs_[i]); 82 | resp_x.push_back(scores_fs_[i] * exp_ikx[i]); 83 | 84 | grad_y.push_back(-1 * imag(ky_exp_ky[i] * resp_x[i])); 85 | grad_x.push_back(-1 * imag(y_resp[i] * kx_exp_kx[i])); 86 | 87 | // Compute Hessian 88 | ival.push_back(exp_iky[i] * resp_x[i]); 89 | std::vector tmp; 90 | cv::split(ival[i], tmp); 91 | cv::merge(std::vector({-1 * tmp[1], tmp[0]}), ival[i]); 92 | 93 | H_yy.push_back(real(-1 * complexDotMultiplication(ky2Mat, exp_iky[i]) * resp_x[i] + ival[i])); 94 | H_xx.push_back(real(-1 * y_resp[i] * complexDotMultiplication(kx2Mat, exp_ikx[i]) + ival[i])); 95 | H_xy.push_back(real(-1 * ky_exp_ky[i] * (scores_fs_[i] * kx_exp_kx[i]))); 96 | 97 | det_H.push_back(H_yy[i].mul(H_xx[i]) - H_xy[i].mul(H_xy[i])); 98 | 99 | // Compute new position using newtons method 100 | cv::Mat tmp1, tmp2; 101 | cv::divide(H_xx[i].mul(grad_y[i]) - H_xy[i].mul(grad_x[i]), det_H[i], tmp1); 102 | max_pos_y[i] -= tmp1.at(0, 0); 103 | cv::divide(H_yy[i].mul(grad_x[i]) - H_xy[i].mul(grad_y[i]), det_H[i], tmp2); 104 | max_pos_x[i] -= tmp2.at(0, 0); 105 | 106 | // Evaluate maximum 107 | cv::Mat tempy(1, h, CV_32FC2), tempx(w, 1, CV_32FC2); 108 | for 
(int y = 0; y < h; ++y) 109 | tempy.at>(0, y) = cv::Vec(cos(ky[y] * max_pos_y[i]), sin(ky[y] * max_pos_y[i])); 110 | for (int x = 0; x < w; ++x) 111 | tempx.at>(x, 0) = cv::Vec(cos(kx[x] * max_pos_x[i]), sin(kx[x] * max_pos_x[i])); 112 | exp_iky[i] = tempy; 113 | exp_ikx[i] = tempx; 114 | } 115 | } 116 | // Evaluate the Fourier series at the estimated locations to find the corresponding scores. 117 | std::vector max_score; 118 | for (size_t i = 0; i < sampled_scores.size(); ++i) 119 | { 120 | float new_scores = real(exp_iky[i] * scores_fs_[i] * exp_ikx[i]).at(0, 0); 121 | // check for scales that have not increased in score 122 | if (new_scores > init_max_score[i]) 123 | { 124 | max_score.push_back(new_scores); 125 | } 126 | else 127 | { 128 | max_score.push_back(init_max_score[i]); 129 | max_pos_y[i] = init_pos_y[i]; 130 | max_pos_x[i] = init_pos_x[i]; 131 | } 132 | 133 | } 134 | 135 | // Find the scale with the maximum response 136 | std::vector::iterator pos = max_element(max_score.begin(), max_score.end()); 137 | scale_ind_ = pos - max_score.begin(); 138 | max_score_ = *pos; 139 | 140 | // Scale the coordinate system to output_sz 141 | disp_row_ = (fmod(max_pos_y[scale_ind_] + CV_PI, CV_PI * 2.0) - CV_PI) / (CV_PI * 2.0) * h; 142 | disp_col_ = (fmod(max_pos_x[scale_ind_] + CV_PI, CV_PI * 2.0) - CV_PI) / (CV_PI * 2.0) * w; 143 | //return sampled_scores; 144 | } 145 | } -------------------------------------------------------------------------------- /KCF/recttools.hpp: -------------------------------------------------------------------------------- 1 | /* 2 | Author: Christian Bailer 3 | Contact address: Christian.Bailer@dfki.de 4 | Department Augmented Vision DFKI 5 | 6 | License Agreement 7 | For Open Source Computer Vision Library 8 | (3-clause BSD License) 9 | 10 | Redistribution and use in source and binary forms, with or without modification, 11 | are permitted provided that the following conditions are met: 12 | 13 | * Redistributions of source code must 
retain the above copyright notice, 14 | this list of conditions and the following disclaimer. 15 | 16 | * Redistributions in binary form must reproduce the above copyright notice, 17 | this list of conditions and the following disclaimer in the documentation 18 | and/or other materials provided with the distribution. 19 | 20 | * Neither the names of the copyright holders nor the names of the contributors 21 | may be used to endorse or promote products derived from this software 22 | without specific prior written permission. 23 | 24 | This software is provided by the copyright holders and contributors "as is" and 25 | any express or implied warranties, including, but not limited to, the implied 26 | warranties of merchantability and fitness for a particular purpose are disclaimed. 27 | In no event shall copyright holders or contributors be liable for any direct, 28 | indirect, incidental, special, exemplary, or consequential damages 29 | (including, but not limited to, procurement of substitute goods or services; 30 | loss of use, data, or profits; or business interruption) however caused 31 | and on any theory of liability, whether in contract, strict liability, 32 | or tort (including negligence or otherwise) arising in any way out of 33 | the use of this software, even if advised of the possibility of such damage. 
34 | */ 35 | 36 | #pragma once 37 | 38 | //#include 39 | #include 40 | 41 | #ifndef _OPENCV_RECTTOOLS_HPP_ 42 | #define _OPENCV_RECTTOOLS_HPP_ 43 | #endif 44 | 45 | namespace kcf 46 | { 47 | 48 | template 49 | inline cv::Vec center(const cv::Rect_ &rect) 50 | { 51 | return cv::Vec (rect.x + rect.width / (t) 2, rect.y + rect.height / (t) 2); 52 | } 53 | 54 | template 55 | inline t x2(const cv::Rect_ &rect) 56 | { 57 | return rect.x + rect.width; 58 | } 59 | 60 | template 61 | inline t y2(const cv::Rect_ &rect) 62 | { 63 | return rect.y + rect.height; 64 | } 65 | 66 | template 67 | inline void resize(cv::Rect_ &rect, float scalex, float scaley = 0) 68 | { 69 | if (!scaley)scaley = scalex; 70 | rect.x -= rect.width * (scalex - 1.f) / 2.f; 71 | rect.width *= scalex; 72 | 73 | rect.y -= rect.height * (scaley - 1.f) / 2.f; 74 | rect.height *= scaley; 75 | 76 | } 77 | 78 | template 79 | inline void limit(cv::Rect_ &rect, cv::Rect_ limit) 80 | { 81 | if (rect.x + rect.width > limit.x + limit.width) 82 | rect.width = (limit.x + limit.width - rect.x); 83 | if (rect.y + rect.height > limit.y + limit.height) 84 | rect.height = (limit.y + limit.height - rect.y); 85 | if (rect.x < limit.x) 86 | { 87 | rect.width -= (limit.x - rect.x); 88 | rect.x = limit.x; 89 | } 90 | if (rect.y < limit.y) 91 | { 92 | rect.height -= (limit.y - rect.y); 93 | rect.y = limit.y; 94 | } 95 | 96 | if(rect.width<0)rect.width=0; 97 | if(rect.height<0)rect.height=0; 98 | } 99 | 100 | template 101 | inline void limit(cv::Rect_ &rect, t width, t height, t x = 0, t y = 0) 102 | { 103 | limit(rect, cv::Rect_ (x, y, width, height)); 104 | 105 | } 106 | 107 | template 108 | inline cv::Rect getBorder(const cv::Rect_ &original, cv::Rect_ & limited) 109 | { 110 | cv::Rect_ res; 111 | res.x = limited.x - original.x; 112 | res.y = limited.y - original.y; 113 | res.width = x2(original) - x2(limited); 114 | res.height = y2(original) - y2(limited); 115 | assert(res.x >= 0 && res.y >= 0 && res.width >= 0 && res.height 
>= 0); 116 | return res; 117 | } 118 | 119 | inline cv::Mat subwindow(const cv::Mat &in, const cv::Rect & window, int borderType = cv::BORDER_CONSTANT) 120 | { 121 | cv::Rect cutWindow = window; 122 | limit(cutWindow, in.cols, in.rows); //limit cutwindow inside Mat in; 123 | 124 | if (cutWindow.height <= 0 || cutWindow.width <= 0) assert(0); 125 | // return cv::Mat(window.height,window.width,in.type(),0) ; 126 | 127 | cv::Rect border = getBorder(window, cutWindow); //get the border of cutWindow in window; 128 | cv::Mat res = in(cutWindow); 129 | 130 | if (border != cv::Rect(0, 0, 0, 0)) 131 | {// back to the same size of window with border filled with constant 132 | cv::copyMakeBorder(res, res, border.y, border.height, border.x, border.width, borderType); 133 | } 134 | return res; 135 | } 136 | 137 | inline cv::Mat getGrayImage(cv::Mat img) 138 | { 139 | cv::cvtColor(img, img, CV_BGR2GRAY); 140 | img.convertTo(img, CV_32F, 1 / 255.f); 141 | return img; 142 | } 143 | 144 | inline void cutOutsize(float &num, int limit) 145 | { 146 | if(num < 0) 147 | num = 0; 148 | else if(num > limit - 1) 149 | num = limit - 1; 150 | } 151 | 152 | inline cv::Mat extractImage(const cv::Mat &in, float cx, float cy, float patch_width, float patch_height) 153 | { 154 | 155 | float xs_s = floor(cx) - floor(patch_width / 2); 156 | cutOutsize(xs_s, in.cols); 157 | 158 | float xs_e = floor(cx + patch_width - 1) - floor(patch_width / 2); 159 | cutOutsize(xs_e, in.cols); 160 | 161 | float ys_s = floor(cy) - floor(patch_height / 2); 162 | cutOutsize(ys_s, in.rows); 163 | 164 | float ys_e = floor(cy + patch_height - 1) - floor(patch_height / 2); 165 | cutOutsize(ys_e, in.rows); 166 | 167 | 168 | return in(cv::Rect(xs_s, ys_s, xs_e - xs_s, ys_e - ys_s)); 169 | } 170 | 171 | } 172 | 173 | 174 | 175 | -------------------------------------------------------------------------------- /ECO/fhog.hpp: -------------------------------------------------------------------------------- 1 | 
/*M/////////////////////////////////////////////////////////////////////////////////////// 2 | // 3 | // IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING. 4 | // 5 | // By downloading, copying, installing or using the software you agree to this license. 6 | // If you do not agree to this license, do not download, install, 7 | // copy or use the software. 8 | // 9 | // 10 | // License Agreement 11 | // For Open Source Computer Vision Library 12 | // 13 | // Copyright (C) 2010-2013, University of Nizhny Novgorod, all rights reserved. 14 | // Third party copyrights are property of their respective owners. 15 | // 16 | // Redistribution and use in source and binary forms, with or without modification, 17 | // are permitted provided that the following conditions are met: 18 | // 19 | // * Redistribution's of source code must retain the above copyright notice, 20 | // this list of conditions and the following disclaimer. 21 | // 22 | // * Redistribution's in binary form must reproduce the above copyright notice, 23 | // this list of conditions and the following disclaimer in the documentation 24 | // and/or other materials provided with the distribution. 25 | // 26 | // * The name of the copyright holders may not be used to endorse or promote products 27 | // derived from this software without specific prior written permission. 28 | // 29 | // This software is provided by the copyright holders and contributors "as is" and 30 | // any express or implied warranties, including, but not limited to, the implied 31 | // warranties of merchantability and fitness for a particular purpose are disclaimed. 
32 | // In no event shall the Intel Corporation or contributors be liable for any direct, 33 | // indirect, incidental, special, exemplary, or consequential damages 34 | // (including, but not limited to, procurement of substitute goods or services; 35 | // loss of use, data, or profits; or business interruption) however caused 36 | // and on any theory of liability, whether in contract, strict liability, 37 | // or tort (including negligence or otherwise) arising in any way out of 38 | // the use of this software, even if advised of the possibility of such damage. 39 | // 40 | //M*/ 41 | 42 | //Modified from latentsvm module's "_lsvmc_latentsvm.h". 43 | 44 | /*****************************************************************************/ 45 | /* Latent SVM prediction API */ 46 | /*****************************************************************************/ 47 | 48 | #ifndef _FHOG_H_ 49 | #define _FHOG_H_ 50 | 51 | #include 52 | 53 | #include 54 | 55 | namespace eco 56 | { 57 | // DataType: STRUCT featureMap 58 | // FEATURE MAP DESCRIPTION 59 | // Rectangular map (sizeX x sizeY), 60 | // every cell stores feature vector (dimension = numFeatures) 61 | // map - matrix of feature vectors 62 | // to set and get feature vectors (i,j) 63 | // used formula map[(j * sizeX + i) * p + k], where 64 | // k - component of feature vector in cell (i, j) 65 | typedef struct 66 | { 67 | int sizeX; 68 | int sizeY; 69 | int numFeatures; 70 | float *map; 71 | } CvLSVMFeatureMapCaskade; 72 | 73 | #include "float.h" 74 | 75 | #define PI CV_PI 76 | #define EPS 0.000001 77 | #define F_MAX FLT_MAX 78 | #define F_MIN -FLT_MAX 79 | 80 | // The number of elements in bin 81 | // The number of sectors in gradient histogram building 82 | #define NUM_SECTOR 9 83 | 84 | // The number of levels in image resize procedure 85 | // We need Lambda levels to resize image twice 86 | #define LAMBDA 10 87 | 88 | // Block size. 
Used in feature pyramid building procedure 89 | #define SIDE_LENGTH 8 90 | 91 | #define VAL_OF_TRUNCATE 0.2f 92 | 93 | //modified from "_lsvm_error.h" 94 | #define LATENT_SVM_OK 0 95 | #define LATENT_SVM_MEM_NULL 2 96 | #define DISTANCE_TRANSFORM_OK 1 97 | #define DISTANCE_TRANSFORM_GET_INTERSECTION_ERROR -1 98 | #define DISTANCE_TRANSFORM_ERROR -2 99 | #define DISTANCE_TRANSFORM_EQUAL_POINTS -3 100 | #define LATENT_SVM_GET_FEATURE_PYRAMID_FAILED -4 101 | #define LATENT_SVM_SEARCH_OBJECT_FAILED -5 102 | #define LATENT_SVM_FAILED_SUPERPOSITION -6 103 | #define FILTER_OUT_OF_BOUNDARIES -7 104 | #define LATENT_SVM_TBB_SCHEDULE_CREATION_FAILED -8 105 | #define LATENT_SVM_TBB_NUMTHREADS_NOT_CORRECT -9 106 | #define FFT_OK 2 107 | #define FFT_ERROR -10 108 | #define LSVM_PARSER_FILE_NOT_FOUND -11 109 | 110 | /* 111 | // Getting feature map for the selected subimage 112 | // 113 | // API 114 | // int getFeatureMaps(const IplImage * image, const int k, featureMap **map); 115 | // INPUT 116 | // image - selected subimage 117 | // k - size of cells 118 | // OUTPUT 119 | // map - feature map 120 | // RESULT 121 | // Error status 122 | */ 123 | int getFeatureMaps(const IplImage *image, const int k, 124 | CvLSVMFeatureMapCaskade **map); 125 | 126 | /* 127 | // Feature map Normalization and Truncation 128 | // 129 | // API 130 | // int normalizationAndTruncationFeatureMaps(featureMap *map, const float alfa); 131 | // INPUT 132 | // map - feature map 133 | // alfa - truncation threshold 134 | // OUTPUT 135 | // map - truncated and normalized feature map 136 | // RESULT 137 | // Error status 138 | */ 139 | int normalizeAndTruncate(CvLSVMFeatureMapCaskade *map, const float alfa); 140 | 141 | /* 142 | // Feature map reduction 143 | // In each cell we reduce dimension of the feature vector 144 | // according to original paper special procedure 145 | // 146 | // API 147 | // int PCAFeatureMaps(featureMap *map) 148 | // INPUT 149 | // map - feature map 150 | // OUTPUT 151 | // map - 
feature map 152 | // RESULT 153 | // Error status 154 | */ 155 | int PCAFeatureMaps(CvLSVMFeatureMapCaskade *map); 156 | 157 | int allocFeatureMapObject(CvLSVMFeatureMapCaskade **obj, 158 | const int sizeX, const int sizeY, const int p); 159 | 160 | int freeFeatureMapObject(CvLSVMFeatureMapCaskade **obj); 161 | } // namespace eco 162 | 163 | #endif 164 | -------------------------------------------------------------------------------- /KCF/fhog.hpp: -------------------------------------------------------------------------------- 1 | /*M/////////////////////////////////////////////////////////////////////////////////////// 2 | // 3 | // IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING. 4 | // 5 | // By downloading, copying, installing or using the software you agree to this license. 6 | // If you do not agree to this license, do not download, install, 7 | // copy or use the software. 8 | // 9 | // 10 | // License Agreement 11 | // For Open Source Computer Vision Library 12 | // 13 | // Copyright (C) 2010-2013, University of Nizhny Novgorod, all rights reserved. 14 | // Third party copyrights are property of their respective owners. 15 | // 16 | // Redistribution and use in source and binary forms, with or without modification, 17 | // are permitted provided that the following conditions are met: 18 | // 19 | // * Redistribution's of source code must retain the above copyright notice, 20 | // this list of conditions and the following disclaimer. 21 | // 22 | // * Redistribution's in binary form must reproduce the above copyright notice, 23 | // this list of conditions and the following disclaimer in the documentation 24 | // and/or other materials provided with the distribution. 25 | // 26 | // * The name of the copyright holders may not be used to endorse or promote products 27 | // derived from this software without specific prior written permission. 
28 | // 29 | // This software is provided by the copyright holders and contributors "as is" and 30 | // any express or implied warranties, including, but not limited to, the implied 31 | // warranties of merchantability and fitness for a particular purpose are disclaimed. 32 | // In no event shall the Intel Corporation or contributors be liable for any direct, 33 | // indirect, incidental, special, exemplary, or consequential damages 34 | // (including, but not limited to, procurement of substitute goods or services; 35 | // loss of use, data, or profits; or business interruption) however caused 36 | // and on any theory of liability, whether in contract, strict liability, 37 | // or tort (including negligence or otherwise) arising in any way out of 38 | // the use of this software, even if advised of the possibility of such damage. 39 | // 40 | //M*/ 41 | 42 | 43 | //Modified from latentsvm module's "_lsvmc_latentsvm.h". 44 | 45 | 46 | /*****************************************************************************/ 47 | /* Latent SVM prediction API */ 48 | /*****************************************************************************/ 49 | 50 | #ifndef _FHOG_H_ 51 | #define _FHOG_H_ 52 | 53 | #include 54 | //#include "_lsvmc_types.h" 55 | //#include "_lsvmc_error.h" 56 | //#include "_lsvmc_routine.h" 57 | 58 | //#include "opencv2/imgproc.hpp" 59 | #include "opencv2/imgproc/imgproc_c.h" 60 | 61 | namespace kcf 62 | { 63 | //modified from "_lsvmc_types.h" 64 | 65 | // DataType: STRUCT featureMap 66 | // FEATURE MAP DESCRIPTION 67 | // Rectangular map (sizeX x sizeY), 68 | // every cell stores feature vector (dimension = numFeatures) 69 | // map - matrix of feature vectors 70 | // to set and get feature vectors (i,j) 71 | // used formula map[(j * sizeX + i) * p + k], where 72 | // k - component of feature vector in cell (i, j) 73 | typedef struct{ 74 | int sizeX; 75 | int sizeY; 76 | int numFeatures; 77 | float *map; 78 | } CvLSVMFeatureMapCaskade; 79 | 80 | 81 | 
#include "float.h" 82 | 83 | #define PI CV_PI 84 | 85 | #define EPS 0.000001 86 | 87 | #define F_MAX FLT_MAX 88 | #define F_MIN -FLT_MAX 89 | 90 | // The number of elements in bin 91 | // The number of sectors in gradient histogram building 92 | #define NUM_SECTOR 9 93 | 94 | // The number of levels in image resize procedure 95 | // We need Lambda levels to resize image twice 96 | #define LAMBDA 10 97 | 98 | // Block size. Used in feature pyramid building procedure 99 | #define SIDE_LENGTH 8 100 | 101 | #define VAL_OF_TRUNCATE 0.2f 102 | 103 | 104 | //modified from "_lsvm_error.h" 105 | #define LATENT_SVM_OK 0 106 | #define LATENT_SVM_MEM_NULL 2 107 | #define DISTANCE_TRANSFORM_OK 1 108 | #define DISTANCE_TRANSFORM_GET_INTERSECTION_ERROR -1 109 | #define DISTANCE_TRANSFORM_ERROR -2 110 | #define DISTANCE_TRANSFORM_EQUAL_POINTS -3 111 | #define LATENT_SVM_GET_FEATURE_PYRAMID_FAILED -4 112 | #define LATENT_SVM_SEARCH_OBJECT_FAILED -5 113 | #define LATENT_SVM_FAILED_SUPERPOSITION -6 114 | #define FILTER_OUT_OF_BOUNDARIES -7 115 | #define LATENT_SVM_TBB_SCHEDULE_CREATION_FAILED -8 116 | #define LATENT_SVM_TBB_NUMTHREADS_NOT_CORRECT -9 117 | #define FFT_OK 2 118 | #define FFT_ERROR -10 119 | #define LSVM_PARSER_FILE_NOT_FOUND -11 120 | 121 | 122 | 123 | /* 124 | // Getting feature map for the selected subimage 125 | // 126 | // API 127 | // int getFeatureMaps(const IplImage * image, const int k, featureMap **map); 128 | // INPUT 129 | // image - selected subimage 130 | // k - size of cells 131 | // OUTPUT 132 | // map - feature map 133 | // RESULT 134 | // Error status 135 | */ 136 | int getFeatureMaps(const IplImage * image, const int k, CvLSVMFeatureMapCaskade **map); 137 | 138 | 139 | /* 140 | // Feature map Normalization and Truncation 141 | // 142 | // API 143 | // int normalizationAndTruncationFeatureMaps(featureMap *map, const float alfa); 144 | // INPUT 145 | // map - feature map 146 | // alfa - truncation threshold 147 | // OUTPUT 148 | // map - truncated and 
normalized feature map 149 | // RESULT 150 | // Error status 151 | */ 152 | int normalizeAndTruncate(CvLSVMFeatureMapCaskade *map, const float alfa); 153 | 154 | /* 155 | // Feature map reduction 156 | // In each cell we reduce dimension of the feature vector 157 | // according to original paper special procedure 158 | // 159 | // API 160 | // int PCAFeatureMaps(featureMap *map) 161 | // INPUT 162 | // map - feature map 163 | // OUTPUT 164 | // map - feature map 165 | // RESULT 166 | // Error status 167 | */ 168 | int PCAFeatureMaps(CvLSVMFeatureMapCaskade *map); 169 | 170 | 171 | //modified from "lsvmc_routine.h" 172 | 173 | int allocFeatureMapObject(CvLSVMFeatureMapCaskade **obj, const int sizeX, const int sizeY, 174 | const int p); 175 | 176 | int freeFeatureMapObject (CvLSVMFeatureMapCaskade **obj); 177 | 178 | } 179 | 180 | #endif 181 | -------------------------------------------------------------------------------- /KCF/ffttools.hpp: -------------------------------------------------------------------------------- 1 | /* 2 | Author: Christian Bailer 3 | Contact address: Christian.Bailer@dfki.de 4 | Department Augmented Vision DFKI 5 | 6 | License Agreement 7 | For Open Source Computer Vision Library 8 | (3-clause BSD License) 9 | 10 | Redistribution and use in source and binary forms, with or without modification, 11 | are permitted provided that the following conditions are met: 12 | 13 | * Redistributions of source code must retain the above copyright notice, 14 | this list of conditions and the following disclaimer. 15 | 16 | * Redistributions in binary form must reproduce the above copyright notice, 17 | this list of conditions and the following disclaimer in the documentation 18 | and/or other materials provided with the distribution. 19 | 20 | * Neither the names of the copyright holders nor the names of the contributors 21 | may be used to endorse or promote products derived from this software 22 | without specific prior written permission. 
23 | 24 | This software is provided by the copyright holders and contributors "as is" and 25 | any express or implied warranties, including, but not limited to, the implied 26 | warranties of merchantability and fitness for a particular purpose are disclaimed. 27 | In no event shall copyright holders or contributors be liable for any direct, 28 | indirect, incidental, special, exemplary, or consequential damages 29 | (including, but not limited to, procurement of substitute goods or services; 30 | loss of use, data, or profits; or business interruption) however caused 31 | and on any theory of liability, whether in contract, strict liability, 32 | or tort (including negligence or otherwise) arising in any way out of 33 | the use of this software, even if advised of the possibility of such damage. 34 | */ 35 | 36 | #pragma once 37 | 38 | //#include 39 | 40 | #ifndef _OPENCV_FFTTOOLS_HPP_ 41 | #define _OPENCV_FFTTOOLS_HPP_ 42 | #endif 43 | 44 | namespace kcf 45 | { 46 | cv::Mat dft_d(cv::Mat img, bool backwards = false, bool byRow = false); //byRow=true: 1d trasform, else 2d; 47 | cv::Mat real(cv::Mat img); 48 | cv::Mat imag(cv::Mat img); 49 | cv::Mat magnitude(cv::Mat img); 50 | cv::Mat complexDotMultiplication(cv::Mat a, cv::Mat b); 51 | cv::Mat complexDotDivision(cv::Mat a, cv::Mat b); 52 | void rearrange(cv::Mat &img); 53 | void normalizedLogTransform(cv::Mat &img); 54 | 55 | cv::Mat dft_d(cv::Mat img, bool backwards, bool byRow) 56 | { 57 | if (img.channels() == 1) 58 | { 59 | cv::Mat planes[] = {cv::Mat_(img), 60 | cv::Mat_::zeros(img.size())}; 61 | cv::merge(planes, 2, img); 62 | } 63 | if (byRow) 64 | cv::dft(img, img, (cv::DFT_ROWS | cv::DFT_COMPLEX_OUTPUT)); 65 | else 66 | cv::dft(img, img, backwards ? 
(cv::DFT_INVERSE | cv::DFT_SCALE) : 0); //do scale when ifft; 67 | 68 | return img; 69 | } 70 | 71 | cv::Mat real(cv::Mat img) 72 | { 73 | std::vector planes; 74 | cv::split(img, planes); 75 | return planes[0]; 76 | } 77 | 78 | cv::Mat imag(cv::Mat img) 79 | { 80 | std::vector planes; 81 | cv::split(img, planes); 82 | return planes[1]; 83 | } 84 | 85 | cv::Mat magnitude(cv::Mat img) 86 | { 87 | cv::Mat res; 88 | std::vector planes; 89 | cv::split(img, planes); // planes[0] = Re(DFT(I), planes[1] = Im(DFT(I)) 90 | if (planes.size() == 1) 91 | res = cv::abs(img); 92 | else if (planes.size() == 2) 93 | cv::magnitude(planes[0], planes[1], res); // planes[0] = magnitude 94 | else 95 | assert(0); 96 | return res; 97 | } 98 | 99 | cv::Mat complexDotMultiplication(cv::Mat a, cv::Mat b) 100 | { 101 | std::vector pa; 102 | std::vector pb; 103 | cv::split(a, pa); 104 | cv::split(b, pb); 105 | 106 | std::vector pres; 107 | pres.push_back(pa[0].mul(pb[0]) - pa[1].mul(pb[1])); 108 | pres.push_back(pa[0].mul(pb[1]) + pa[1].mul(pb[0])); 109 | 110 | cv::Mat res; 111 | cv::merge(pres, res); 112 | 113 | return res; 114 | } 115 | 116 | cv::Mat complexDotDivisionReal(cv::Mat a, cv::Mat b) 117 | { 118 | std::vector pa; 119 | cv::split(a, pa); 120 | 121 | std::vector pres; 122 | 123 | cv::Mat divisor = 1. / b; 124 | 125 | pres.push_back(pa[0].mul(divisor)); 126 | pres.push_back(pa[1].mul(divisor)); 127 | 128 | cv::Mat res; 129 | cv::merge(pres, res); 130 | return res; 131 | } 132 | 133 | cv::Mat complexDotDivision(cv::Mat a, cv::Mat b) 134 | { 135 | std::vector pa; 136 | std::vector pb; 137 | cv::split(a, pa); 138 | cv::split(b, pb); 139 | 140 | cv::Mat divisor = 1. 
/ (pb[0].mul(pb[0]) + pb[1].mul(pb[1])); 141 | 142 | std::vector pres; 143 | 144 | pres.push_back((pa[0].mul(pb[0]) + pa[1].mul(pb[1])).mul(divisor)); 145 | pres.push_back((pa[1].mul(pb[0]) + pa[0].mul(pb[1])).mul(divisor)); 146 | 147 | cv::Mat res; 148 | cv::merge(pres, res); 149 | return res; 150 | } 151 | 152 | void rearrange(cv::Mat &img) //KCF page 11 Figure 6; 153 | { 154 | // img = img(cv::Rect(0, 0, img.cols & -2, img.rows & -2)); 155 | int cx = img.cols / 2; 156 | int cy = img.rows / 2; 157 | 158 | cv::Mat q0(img, cv::Rect(0, 0, cx, cy)); // Top-Left - Create a ROI per quadrant 159 | cv::Mat q1(img, cv::Rect(cx, 0, cx, cy)); // Top-Right 160 | cv::Mat q2(img, cv::Rect(0, cy, cx, cy)); // Bottom-Left 161 | cv::Mat q3(img, cv::Rect(cx, cy, cx, cy)); // Bottom-Right 162 | 163 | cv::Mat tmp; // swap quadrants (Top-Left with Bottom-Right) 164 | q0.copyTo(tmp); 165 | q3.copyTo(q0); 166 | tmp.copyTo(q3); 167 | q1.copyTo(tmp); // swap quadrant (Top-Right with Bottom-Left) 168 | q2.copyTo(q1); 169 | tmp.copyTo(q2); 170 | } 171 | /* 172 | template < typename type> 173 | cv::Mat fouriertransFull(const cv::Mat & in) 174 | { 175 | return dft_d(in); 176 | 177 | cv::Mat planes[] = {cv::Mat_ (in), cv::Mat_::zeros(in.size())}; 178 | cv::Mat t; 179 | assert(planes[0].depth() == planes[1].depth()); 180 | assert(planes[0].size == planes[1].size); 181 | cv::merge(planes, 2, t); 182 | cv::dft(t, t); 183 | 184 | //cv::normalize(a, a, 0, 1, CV_MINMAX); 185 | //cv::normalize(t, t, 0, 1, CV_MINMAX); 186 | 187 | // cv::imshow("a",real(a)); 188 | // cv::imshow("b",real(t)); 189 | // cv::waitKey(0); 190 | 191 | return t; 192 | }*/ 193 | 194 | void normalizedLogTransform(cv::Mat &img) 195 | { 196 | img = cv::abs(img); 197 | img += cv::Scalar::all(1); 198 | cv::log(img, img); 199 | // cv::normalize(img, img, 0, 1, CV_MINMAX); 200 | } 201 | } // namespace kcf 202 | -------------------------------------------------------------------------------- /ECO/scale_filter.cc: 
-------------------------------------------------------------------------------- 1 | #include "scale_filter.hpp" 2 | 3 | namespace eco 4 | { 5 | void ScaleFilter::init(int &nScales, float &scale_step, const EcoParameters ¶ms) 6 | { 7 | nScales = params.number_of_scales_filter; 8 | scale_step = params.scale_step_filter; 9 | float scale_sigma = params.number_of_interp_scales * params.scale_sigma_factor; 10 | vector scale_exp, scale_exp_shift; 11 | int scalemin = floor((1.0 - (float)nScales) / 2.0); 12 | int scalemax = floor(((float)nScales - 1.0) / 2.0); 13 | for (int i = scalemin; i <= scalemax; i++) 14 | { 15 | scale_exp.push_back(i * params.number_of_interp_scales / (float)nScales); 16 | } 17 | for (int i = 0; i < nScales; i++) 18 | { 19 | scale_exp_shift.push_back(scale_exp[(i + nScales / 2) % nScales]); 20 | } 21 | /* debug("scale: min:%d, max:%d", scalemin, scalemax); 22 | debug("scale_exp_shift:"); 23 | for (int i = 0; i < nScales; i++) 24 | { 25 | printf("%d:%f; ", i, scale_exp_shift[i]); 26 | } 27 | printf("\n"); 28 | */ 29 | vector interp_scale_exp, interp_scale_exp_shift; 30 | scalemin = floor((1.0 - (float)params.number_of_interp_scales) / 2.0); 31 | scalemax = floor(((float)params.number_of_interp_scales - 1.0) / 2.0); 32 | for (int i = scalemin; i <= scalemax; i++) 33 | { 34 | interp_scale_exp.push_back(i); 35 | } 36 | for (int i = 0; i < params.number_of_interp_scales; i++) 37 | { 38 | interp_scale_exp_shift.push_back(interp_scale_exp[(i + params.number_of_interp_scales / 2) % params.number_of_interp_scales]); 39 | } 40 | /* debug("scale: min:%d, max:%d", scalemin, scalemax); 41 | debug("interp_scale_exp_shift:"); 42 | for (int i = 0; i < params.number_of_interp_scales; i++) 43 | { 44 | printf("%d:%f; ", i, interp_scale_exp_shift[i]); 45 | } 46 | printf("\n"); 47 | */ 48 | for (int i = 0; i < nScales; i++) 49 | { 50 | scaleSizeFactors_.push_back(std::pow(scale_step, scale_exp[i])); 51 | } 52 | /* debug("scaleSizeFactors_:"); 53 | for (int i = 0; i < 
nScales; i++) 54 | { 55 | printf("%d:%f; ", i, scaleSizeFactors_[i]); 56 | } 57 | printf("\n"); 58 | */ 59 | for (int i = 0; i < params.number_of_interp_scales; i++) 60 | { 61 | interpScaleFactors_.push_back(std::pow(scale_step, interp_scale_exp_shift[i])); 62 | } 63 | /* debug("interpScaleFactors_:"); 64 | for (int i = 0; i < params.number_of_interp_scales; i++) 65 | { 66 | printf("%d:%f; ", i, interpScaleFactors_[i]); 67 | } 68 | printf("\n"); 69 | */ 70 | 71 | cv::Mat ys_mat = cv::Mat(cv::Size(nScales, 1), CV_32FC1); 72 | for (int i = 0; i < nScales; i++) 73 | { 74 | ys_mat.at(0, i) = std::exp(-0.5f * scale_exp_shift[i] * scale_exp_shift[i] / scale_sigma / scale_sigma); 75 | } 76 | /* 77 | debug("ys:"); 78 | printMat(ys_mat); 79 | showmat1channels(ys_mat,2); 80 | */ 81 | yf_ = real(dft(ys_mat, false)); 82 | /* 83 | debug("yf:"); 84 | printMat(yf_); 85 | showmat1channels(yf_,2); 86 | */ 87 | 88 | for (int i = 0; i < nScales; i++) 89 | { 90 | window_.push_back(0.5f * (1.0f - std::cos(2 * M_PI * i / (nScales - 1.0f)))); 91 | } 92 | /* 93 | debug("window_:"); 94 | for (int i = 0; i < nScales; i++) 95 | { 96 | printf("%d:%f; ", i, window_[i]); 97 | } 98 | */ 99 | //max_scale_dim_ = !params.s_num_compressed_dim.compare("MAX"); 100 | //debug("max_scale_dim_: %d", max_scale_dim_); 101 | } 102 | 103 | float ScaleFilter::scale_filter_track(const cv::Mat &im, const cv::Point2f &pos, const cv::Size2f &base_target_sz, const float ¤tScaleFactor, const EcoParameters ¶ms) 104 | { 105 | debug("%f", currentScaleFactor); 106 | vector scales; 107 | for (unsigned int i = 0; i < scaleSizeFactors_.size(); i++) 108 | { 109 | scales.push_back(scaleSizeFactors_[i] * currentScaleFactor); 110 | //printf("%f ", scaleSizeFactors_[i]); 111 | } 112 | cv::Mat xs = extract_scale_sample(im, pos, base_target_sz, scales, params.scale_model_sz); 113 | 114 | debug("Not finished!-------------------"); 115 | assert(0); 116 | 117 | float scale_change_factor; 118 | return scale_change_factor; 119 | } 120 
| 121 | cv::Mat ScaleFilter::extract_scale_sample(const cv::Mat &im, const cv::Point2f &posf, const cv::Size2f &base_target_sz, vector &scaleFactors, const cv::Size &scale_model_sz) 122 | { 123 | //printMat(new_im); 124 | //showmat3channels(new_im, 0); 125 | //debug("pos: %f %f", posf.x, posf.y); 126 | cv::Point2i pos(posf); 127 | int nScales = scaleFactors.size(); 128 | int df = std::floor(*std::min_element(std::begin(scaleFactors), std::end(scaleFactors))); 129 | // debug("df:%d", df); 130 | 131 | cv::Mat new_im; 132 | im.copyTo(new_im); 133 | if (df > 1) 134 | { 135 | // compute offset and new center position 136 | cv::Point os((pos.x - 1) % df, ((pos.y - 1) % df)); 137 | pos.x = (pos.x - os.x - 1) / df + 1; 138 | pos.y = (pos.y - os.y - 1) / df + 1; 139 | 140 | for (unsigned int i = 0; i < scaleFactors.size(); i++) 141 | { 142 | scaleFactors[i] /= df; 143 | } 144 | // down sample image 145 | int r = (im.rows - os.y) / df + 1; 146 | int c = (im.cols - os.x) / df; 147 | cv::Mat new_im2(r, c, im.type()); 148 | new_im = new_im2; 149 | for (size_t i = 0 + os.y, m = 0; 150 | i < (size_t)im.rows && m < (size_t)new_im.rows; 151 | i += df, ++m) 152 | { 153 | for (size_t j = 0 + os.x, n = 0; 154 | j < (size_t)im.cols && n < (size_t)new_im.cols; 155 | j += df, ++n) 156 | { 157 | 158 | if (im.channels() == 1) 159 | { 160 | new_im.at(m, n) = im.at(i, j); 161 | } 162 | else 163 | { 164 | new_im.at(m, n) = im.at(i, j); 165 | } 166 | } 167 | } 168 | } 169 | 170 | for (int s = 0; s < nScales; s++) 171 | { 172 | cv::Size patch_sz; 173 | patch_sz.width = std::max(std::floor(base_target_sz.width * scaleFactors[s]), 2.0f); 174 | patch_sz.height = std::max(std::floor(base_target_sz.height * scaleFactors[s]), 2.0f); 175 | //debug("patch_sz:%d %d", patch_sz.height, patch_sz.width); 176 | 177 | cv::Point pos2(pos.x - floor((patch_sz.width + 1) / 2), 178 | pos.y - floor((patch_sz.height + 1) / 2)); 179 | 180 | cv::Mat im_patch = subwindow(new_im, cv::Rect(pos2, patch_sz), 
IPL_BORDER_REPLICATE); 181 | 182 | cv::Mat im_patch_resized; 183 | if (im_patch.cols == 0 || im_patch.rows == 0) 184 | { 185 | return im_patch_resized; 186 | } 187 | cv::resize(im_patch, im_patch_resized, scale_model_sz); 188 | //printMat(im_patch); 189 | //showmat3channels(im_patch, 0); 190 | //printMat(im_patch_resized); 191 | //showmat3channels(im_patch_resized, 0); 192 | 193 | vector im_vector, temp_hog; 194 | im_vector.push_back(im_patch); 195 | FeatureExtractor feature_extractor; 196 | #ifdef USE_SIMD 197 | temp_hog = feature_extractor.get_hog_features_simd(im_vector); 198 | #else 199 | temp_hog = feature_extractor.get_hog_features(im_vector); 200 | #endif 201 | temp_hog = feature_extractor.hog_feature_normalization(temp_hog); 202 | 203 | debug("Not finished!-------------------"); 204 | assert(0); 205 | } 206 | 207 | cv::Mat scale_sample; 208 | return scale_sample; 209 | } 210 | 211 | } // namespace eco -------------------------------------------------------------------------------- /KCF/kcftracker.hpp: -------------------------------------------------------------------------------- 1 | /* 2 | 3 | Tracker based on Kernelized Correlation Filter (KCF) [1] and Circulant Structure with Kernels (CSK) [2]. 4 | CSK is implemented by using raw gray level features, since it is a single-channel filter. 5 | KCF is implemented by using HOG features (the default), since it extends CSK to multiple channels. 6 | 7 | [1] J. F. Henriques, R. Caseiro, P. Martins, J. Batista, 8 | "High-Speed Tracking with Kernelized Correlation Filters", TPAMI 2015. 9 | 10 | [2] J. F. Henriques, R. Caseiro, P. Martins, J. Batista, 11 | "Exploiting the Circulant Structure of Tracking-by-detection with Kernels", ECCV 2012. 12 | 13 | Authors: Joao Faro, Christian Bailer, Joao F. 
Henriques 14 | Contacts: joaopfaro@gmail.com, Christian.Bailer@dfki.de, henriques@isr.uc.pt 15 | Institute of Systems and Robotics - University of Coimbra / Department Augmented Vision DFKI 16 | 17 | 18 | Constructor parameters, all boolean: 19 | hog: use HOG features (default), otherwise use raw pixels 20 | fixed_window: fix window size (default), otherwise use ROI size (slower but more accurate) 21 | multiscale: use multi-scale tracking (default; cannot be used with fixed_window = true) 22 | 23 | Default values are set for all properties of the tracker depending on the above choices. 24 | Their values can be customized further before calling init(): 25 | interp_factor: linear interpolation factor for adaptation 26 | sigma: gaussian kernel bandwidth 27 | lambda: regularization 28 | cell_size: HOG cell size 29 | padding: horizontal area surrounding the target, relative to its size 30 | output_sigma_factor: bandwidth of gaussian target 31 | template_size: template size in pixels, 0 to use ROI size 32 | scale_step: scale step for multi-scale estimation, 1 to disable it 33 | scale_weight: to downweight detection scores of other scales for added stability 34 | 35 | For speed, the value (template_size/cell_size) should be a power of 2 or a product of small prime numbers. 36 | 37 | Inputs to init(): 38 | image is the initial frame. 39 | roi is a cv::Rect with the target positions in the initial frame 40 | 41 | Inputs to update(): 42 | image is the current frame. 43 | 44 | Outputs of update(): 45 | cv::Rect with target positions for the current frame 46 | 47 | 48 | By downloading, copying, installing or using the software you agree to this license. 49 | If you do not agree to this license, do not download, install, 50 | copy or use the software. 
51 | 52 | 53 | License Agreement 54 | For Open Source Computer Vision Library 55 | (3-clause BSD License) 56 | 57 | Redistribution and use in source and binary forms, with or without modification, 58 | are permitted provided that the following conditions are met: 59 | 60 | * Redistributions of source code must retain the above copyright notice, 61 | this list of conditions and the following disclaimer. 62 | 63 | * Redistributions in binary form must reproduce the above copyright notice, 64 | this list of conditions and the following disclaimer in the documentation 65 | and/or other materials provided with the distribution. 66 | 67 | * Neither the names of the copyright holders nor the names of the contributors 68 | may be used to endorse or promote products derived from this software 69 | without specific prior written permission. 70 | 71 | This software is provided by the copyright holders and contributors "as is" and 72 | any express or implied warranties, including, but not limited to, the implied 73 | warranties of merchantability and fitness for a particular purpose are disclaimed. 74 | In no event shall copyright holders or contributors be liable for any direct, 75 | indirect, incidental, special, exemplary, or consequential damages 76 | (including, but not limited to, procurement of substitute goods or services; 77 | loss of use, data, or profits; or business interruption) however caused 78 | and on any theory of liability, whether in contract, strict liability, 79 | or tort (including negligence or otherwise) arising in any way out of 80 | the use of this software, even if advised of the possibility of such damage. 
81 | */ 82 | 83 | #pragma once 84 | #include 85 | #include 86 | #ifndef _OPENCV_KCFTRACKER_HPP_ 87 | #define _OPENCV_KCFTRACKER_HPP_ 88 | #endif 89 | 90 | namespace kcf 91 | { 92 | class KCFTracker 93 | { 94 | public: 95 | // Constructor 96 | KCFTracker(bool hog = true, bool fixed_window = true, bool multiscale = true, bool lab = true, bool dsst = false); 97 | 98 | // Initialize tracker 99 | void init( const cv::Mat image, const cv::Rect2d& roi); 100 | 101 | // Update position based on the new frame 102 | //cv::Rect update(cv::Mat image); 103 | bool update( const cv::Mat image, cv::Rect2d& roi); 104 | 105 | float detect_thresh_kcf; // thresh hold for tracking error or not 106 | float sigma; // gaussian kernel bandwidth 107 | float lambda; // regularization 108 | float interp_factor; // linear interpolation factor for adaptation 109 | int cell_size; // HOG cell size 110 | int cell_sizeQ; // cell size^2, to avoid repeated operations 111 | float padding; // extra area surrounding the target 112 | float output_sigma_factor; // bandwidth of gaussian target 113 | int template_size; // template size 114 | 115 | float scale_step; // scale step for multi-scale estimation 116 | float scale_weight; // to downweight detection scores of other scales for added stability 117 | 118 | //=====dsst==== 119 | float detect_thresh_dsst; // thresh hold for tracking error or not 120 | int base_width_dsst; // initial ROI widt 121 | int base_height_dsst; // initial ROI height 122 | int scale_max_area; // max ROI size before compressing 123 | float scale_padding; // extra area surrounding the target for scaling 124 | // float scale_step; // scale step for multi-scale estimation 125 | float scale_sigma_factor; // bandwidth of gaussian target 126 | int n_scales; // # of scaling windows 127 | float scale_lr; // scale learning rate 128 | float *scaleFactors; // all scale changing rate, from larger to smaller with 1 to be the middle 129 | int scale_model_width; // the model width for scaling 130 
| int scale_model_height; // the model height for scaling 131 | float min_scale_factor; // min scaling rate 132 | float max_scale_factor; // max scaling rate 133 | float scale_lambda; // regularization 134 | //=========== 135 | 136 | protected: 137 | bool update_kcf( const cv::Mat image, cv::Rect2d& roi); 138 | // Detect object in the current frame. 139 | cv::Point2f detect(cv::Mat z, cv::Mat x, float &peak_value); // paper Algorithm 1 , _alpha updated in train(); 140 | 141 | // train tracker with a single image, to update _alphaf; 142 | void train(cv::Mat x, float train_interp_factor); 143 | 144 | // Evaluates a Gaussian kernel with bandwidth SIGMA for all relative shifts between input images X and Y, which must both be MxN. They must also be periodic (ie., pre-processed with a cosine window). 145 | cv::Mat gaussianCorrelation(cv::Mat x1, cv::Mat x2); // paper (30) 146 | 147 | // Create Gaussian Peak. Function called only in the first frame. 148 | cv::Mat createGaussianPeak(int sizey, int sizex); 149 | 150 | // Obtain sub-window from image, with replication-padding and extract features 151 | cv::Mat getFeatures(const cv::Mat & image, bool inithann, float scale_adjust = 1.0f); 152 | 153 | // Initialize Hanning window. Function called only in the first frame. 
154 | void createHanningMats(); 155 | 156 | // Calculate sub-pixel peak for one dimension 157 | float subPixelPeak(float left, float center, float right); 158 | 159 | //=====dsst==== 160 | // Initialization for scales 161 | void init_dsst(const cv::Mat image, const cv::Rect2d& roi); 162 | 163 | bool update_dsst( const cv::Mat image, cv::Rect2d& roi); 164 | // Detect the new scaling rate 165 | cv::Point2i detect_dsst(cv::Mat image); 166 | 167 | // Train method for scaling 168 | void train_dsst(cv::Mat image, bool ini = false); 169 | 170 | // Compute the F^l in the paper 171 | cv::Mat get_sample_dsst(const cv::Mat & image); 172 | 173 | // Compute the FFT Guassian Peak for scaling 174 | cv::Mat createGaussianPeak_dsst(); 175 | 176 | // Compute the hanning window for scaling 177 | cv::Mat createHanningMats_dsst(); 178 | //=========== 179 | 180 | cv::Mat _alphaf;//alpha in paper, use this to calculate the detect result, changed in train(); 181 | cv::Mat _prob; //Gaussian Peak(training outputs); 182 | cv::Mat _tmpl; //features of image (or the normalized gray image itself when raw), changed in train(); 183 | cv::Mat _num; //numerator: use to update as MOSSE 184 | cv::Mat _den; //denumerator: use to update as MOSSE 185 | cv::Mat _labCentroids; 186 | 187 | cv::Rect_ _roi; 188 | 189 | private: 190 | int _size_patch[3];//0:rows;1:cols;2:numFeatures; init in getFeatures(); 191 | cv::Mat _hann; 192 | cv::Size _tmpl_sz; 193 | float _scale; 194 | int _gaussian_size; 195 | bool _hogfeatures; 196 | bool _labfeatures; 197 | float _peak_value; 198 | 199 | //=====dsst==== 200 | bool _dsst; 201 | float _scale_dsst; 202 | cv::Mat _den_dsst; 203 | cv::Mat _num_dsst; 204 | cv::Mat _hann_dsst; 205 | cv::Mat _prob_dsst; 206 | //============ 207 | }; 208 | } 209 | -------------------------------------------------------------------------------- /ECO/parameters.hpp: -------------------------------------------------------------------------------- 1 | // Set the value the same as 
testing_ECO_gpu.m 2 | #ifndef PARAMETERS_HPP 3 | #define PARAMETERS_HPP 4 | 5 | #ifdef USE_CAFFE 6 | #include 7 | #include 8 | #endif 9 | 10 | #include 11 | #include 12 | #include 13 | 14 | #define INF 0x7f800000 //0x7fffffff 15 | 16 | using std::string; 17 | using std::vector; 18 | 19 | namespace eco 20 | { 21 | // ECO feature[Num_features][Dimension_of_the_feature]; 22 | typedef std::vector> ECO_FEATS; 23 | typedef cv::Vec COMPLEX; // represent a complex number; 24 | 25 | // cnn feature configuration ========================================= 26 | #ifdef USE_CAFFE 27 | struct CnnParameters 28 | { 29 | string proto = "/home/nvidia/Develop/Project/Tracker/OpenTracker/eco/model/imagenet-vgg-m-2048.prototxt"; 30 | string model = "/home/nvidia/Develop/Project/Tracker/OpenTracker/eco/model/VGG_CNN_M_2048.caffemodel"; 31 | string mean_file = "/home/nvidia/Develop/Project/Tracker/OpenTracker/eco/model/VGG_mean.binaryproto"; 32 | 33 | boost::shared_ptr> net; 34 | cv::Mat deep_mean_mat, deep_mean_mean_mat; 35 | 36 | string nn_name = "imagenet-vgg-m-2048.mat"; 37 | vector stride = {2, 16}; // stride in total 38 | vector cell_size = {4, 16}; // downsample_factor 39 | vector output_layer = {3, 14}; // Which layers to use 40 | vector downsample_factor = {2, 1}; // How much to downsample each output layer 41 | int input_size_scale = 1; // Extra scale factor of the input samples to the network (1 is no scaling) 42 | vector nDim = {96, 512}; // Original dimension of features (ECO Paper Table 1) 43 | vector compressed_dim = {16, 64}; // Compressed dimensionality of each output layer (ECO Paper Table 1) 44 | vector penalty = {0, 0}; 45 | 46 | vector start_ind = {3, 3, 1, 1}; // sample feature start index 47 | vector